We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 3ee6c67, commit 1057cb5 (Copy full SHA for 1057cb5)
tests/lmeval/configs/vl_fp8_dynamic_per_token.yaml
@@ -8,10 +8,16 @@ lmeval:
8
model_args:
9
dtype: bfloat16
10
convert_img_format: True
11
- task: mmmu_val_literature
+ task: chartqa
12
apply_chat_template: True
13
num_fewshot: 0
14
- batch_size: 8
15
- # dense model achieves accuracy of 0.833
+ batch_size: 100
+ limit: 100
16
+ # test runs in 26m
17
+ # dense model achieves exact_match accuracy of 0.530
18
+ # dense model achieves relaxed_accuracy of 0.780
19
+ # dense model achieves anywhere_accuracy of 0.800
20
metrics:
- acc,none: 0.833
21
+ exact_match,none: 0.530
22
+ relaxed_accuracy,none: 0.780
23
+ anywhere_accuracy,none: 0.810
0 commit comments