|
from copy import deepcopy |
|
|
|
naive_mathbench_summary_groups = [ |
|
{ |
|
'name': 'mathbench-college', |
|
'subsets': [ |
|
['mathbench-college-single_choice_cn', 'acc_1'], |
|
['mathbench-college-cloze_en', 'accuracy'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-high', |
|
'subsets': [ |
|
['mathbench-high-single_choice_cn', 'acc_1'], |
|
['mathbench-high-single_choice_en', 'acc_1'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-middle', |
|
'subsets': [ |
|
['mathbench-middle-single_choice_cn', 'acc_1'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-primary', |
|
'subsets': [ |
|
['mathbench-primary-cloze_cn', 'accuracy'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench', |
|
'subsets': [ |
|
'mathbench-college', |
|
'mathbench-high', |
|
'mathbench-middle', |
|
'mathbench-primary', |
|
], |
|
}, |
|
{ |
|
'name': 'mathbench-college-circular', |
|
'subsets': [ |
|
['mathbench-college-single_choice_cn', 'perf_4'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-high-circular', |
|
'subsets': [ |
|
['mathbench-high-single_choice_cn', 'perf_4'], |
|
['mathbench-high-single_choice_en', 'perf_4'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-middle-circular', |
|
'subsets': [ |
|
['mathbench-middle-single_choice_cn', 'perf_4'], |
|
] |
|
}, |
|
{ |
|
'name': 'mathbench-circular', |
|
'subsets': [ |
|
'mathbench-college-circular', |
|
'mathbench-high-circular', |
|
'mathbench-middle-circular', |
|
], |
|
}, |
|
{ |
|
'name': 'mathbench-circular-and-cloze', |
|
'subsets': [ |
|
'mathbench-college-circular', |
|
'mathbench-high-circular', |
|
'mathbench-middle-circular', |
|
'mathbench-college-cloze_en', |
|
'mathbench-primary-cloze_cn', |
|
], |
|
} |
|
] |
|
|
|
agent_mathbench_summary_groups = [] |
|
for item in naive_mathbench_summary_groups: |
|
item = deepcopy(item) |
|
item['name'] = item['name'] + '-agent' |
|
if isinstance(item['subsets'][0], str): |
|
item['subsets'] = [i + '-agent' for i in item['subsets']] |
|
else: |
|
item['subsets'] = [[i[0] + '-agent', i[1]] for i in item['subsets']] |
|
agent_mathbench_summary_groups.append(item) |
|
|
|
mathbench_summary_groups = naive_mathbench_summary_groups + agent_mathbench_summary_groups |
|
|