|
from copy import deepcopy |
|
|
|
# Base (un-suffixed) summary groups for the T-Eval datasets.
#
# Each entry is a dict with:
#   'name'    - identifier of the aggregate being defined,
#   'metric'  - (optional) label attached to the aggregate,
#   'subsets' - list of [dataset, metric] pairs that feed the aggregate.
# NOTE(review): the exact aggregation semantics live in the consumer of this
# list (presumably a summarizer that averages the subsets) - confirm there.
_base_summary_groups = [
    # Instruct, grouped by metric kind across the string and JSON formats.
    {
        'name': 'teval-instruct_v1',
        'metric': 'format_metric',
        'subsets': [
            ['teval-instruct_v1', 'string_format_metric'],
            ['teval-instruct_v1', 'json_format_metric'],
        ],
    },
    {
        'name': 'teval-instruct_v1',
        'metric': 'args_em_metric',
        'subsets': [
            ['teval-instruct_v1', 'string_args_em_metric'],
            ['teval-instruct_v1', 'json_args_em_metric'],
        ],
    },
    # Instruct, grouped by output format across both metric kinds.
    {
        'name': 'teval-instruct_v1',
        'metric': 'string_metric',
        'subsets': [
            ['teval-instruct_v1', 'string_format_metric'],
            ['teval-instruct_v1', 'string_args_em_metric'],
        ],
    },
    {
        'name': 'teval-instruct_v1',
        'metric': 'json_metric',
        'subsets': [
            ['teval-instruct_v1', 'json_format_metric'],
            ['teval-instruct_v1', 'json_args_em_metric'],
        ],
    },
    # Single-subset alias of the review score; it is referenced again by the
    # overall 'teval' group below.
    {
        'name': 'copy_teval-review_str_v1',
        'subsets': [
            ['teval-review_str_v1', 'review_quality'],
        ],
    },
    # Overall T-Eval group spanning every task.
    {
        'name': 'teval',
        'subsets': [
            ['teval-instruct_v1', 'format_metric'],
            ['teval-instruct_v1', 'args_em_metric'],
            ['teval-plan_str_v1', 'f1_score'],
            ['teval-plan_json_v1', 'f1_score'],
            ['teval-reason_str_v1', 'thought'],
            ['teval-reason_retrieve_understand_json_v1', 'thought'],
            ['teval-retrieve_str_v1', 'name'],
            ['teval-reason_retrieve_understand_json_v1', 'name'],
            ['teval-understand_str_v1', 'args'],
            ['teval-reason_retrieve_understand_json_v1', 'args'],
            ['teval-review_str_v1', 'review_quality'],
            # The review score appears a second time via the alias group
            # above - presumably to give it double weight; confirm.
            ['copy_teval-review_str_v1', 'naive_average'],
        ],
    },
]
|
|
|
# Public list of summary groups: first an independent deep copy of every base
# group, then a '_zh' variant of every base group.
teval_summary_groups = [deepcopy(base) for base in _base_summary_groups]

# '_zh' variants: the group name and the dataset half of every subset pair get
# a '_zh' suffix; metric names are left untouched. Each variant is built from
# a deep copy so the base definitions are never mutated.
for group in _base_summary_groups:
    group = deepcopy(group)
    group['name'] = group['name'] + '_zh'
    group['subsets'] = [
        [dataset + '_zh', metric] for dataset, metric in group['subsets']
    ]
    teval_summary_groups.append(group)
|
|
|
|