Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Merge pull request #195 from junming-yang/leaderboard
Browse files
- gen_table.py +1 -1
- meta_data.py +1 -1
gen_table.py
CHANGED
@@ -63,7 +63,7 @@ def BUILD_L1_DF(results, fields):
|
|
63 |
check_box = {}
|
64 |
check_box['essential'] = ['Method', 'Parameters (B)', 'Language Model', 'Vision Model']
|
65 |
# revise there to set defualt dataset
|
66 |
-
defualt_dataset = ['MMBench_TEST_EN', 'MMStar', 'MME', 'MMMU_VAL', 'MathVista', 'OCRBench', 'MMVet']
|
67 |
check_box['required'] = ['Avg Score', 'Avg Rank'] + defualt_dataset
|
68 |
check_box['avg'] = ['Avg Score', 'Avg Rank']
|
69 |
check_box['all'] = check_box['avg'] + fields
|
|
|
63 |
check_box = {}
|
64 |
check_box['essential'] = ['Method', 'Parameters (B)', 'Language Model', 'Vision Model']
|
65 |
# revise there to set defualt dataset
|
66 |
+
defualt_dataset = ['MMBench_TEST_EN', 'MMBench_TEST_CN', 'MMStar', 'MME', 'MMMU_VAL', 'MathVista', 'OCRBench', 'MMVet', 'AI2D', 'HallusionBench', 'LLaVABench', 'SEEDBench_IMG']
|
67 |
check_box['required'] = ['Avg Score', 'Avg Rank'] + defualt_dataset
|
68 |
check_box['avg'] = ['Avg Score', 'Avg Rank']
|
69 |
check_box['all'] = check_box['avg'] + fields
|
meta_data.py
CHANGED
@@ -22,7 +22,7 @@ META_FIELDS = ['Method', 'Parameters (B)', 'Language Model', 'Vision Model', 'Op
|
|
22 |
MAIN_FIELDS = [
|
23 |
'MMBench_TEST_EN', 'MMBench_TEST_CN', 'MMStar', 'MME',
|
24 |
'MMMU_VAL', 'MathVista', 'OCRBench', 'AI2D',
|
25 |
-
'HallusionBench', 'SEEDBench_IMG', 'MMVet', 'LLaVABench'
|
26 |
]
|
27 |
MMBENCH_FIELDS = ['MMBench_TEST_EN', 'MMBench_DEV_EN', 'MMBench_TEST_CN', 'MMBench_DEV_CN', 'CCBench']
|
28 |
MODEL_SIZE = ['<10B', '10B-20B', '20B-40B', '>40B', 'Unknown']
|
|
|
22 |
MAIN_FIELDS = [
|
23 |
'MMBench_TEST_EN', 'MMBench_TEST_CN', 'MMStar', 'MME',
|
24 |
'MMMU_VAL', 'MathVista', 'OCRBench', 'AI2D',
|
25 |
+
'HallusionBench', 'SEEDBench_IMG', 'MMVet', 'LLaVABench', 'CCBench', 'RealWorldQA'
|
26 |
]
|
27 |
MMBENCH_FIELDS = ['MMBench_TEST_EN', 'MMBench_DEV_EN', 'MMBench_TEST_CN', 'MMBench_DEV_CN', 'CCBench']
|
28 |
MODEL_SIZE = ['<10B', '10B-20B', '20B-40B', '>40B', 'Unknown']
|