File size: 1,951 Bytes
256a159
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
from mmengine.config import read_base

with read_base():
    from .groups.plugineval import plugineval_summary_groups

# Summarizer settings for the PluginEval report.
#
# `dataset_abbrs` lists the [dataset abbreviation, metric] rows to show, in
# display order. The same table is emitted twice: first with the bare
# abbreviations, then with every abbreviation suffixed by `_zh`.
#
# `summary_groups` is the concatenation of every list bound to a name ending in
# `_summary_groups` in this module's namespace (e.g. the one imported above).
summarizer = {
    'dataset_abbrs': [
        [abbr + lang_suffix, metric]
        for lang_suffix in ('', '_zh')
        for abbr, metric in (
            ('plugin_eval', 'naive_average'),
            # instruction following - string format
            ('plugin_eval-instruct_v1', 'string_metric'),
            # instruction following - json format
            ('plugin_eval-instruct_v1', 'json_metric'),
            # planning - string format
            ('plugin_eval-plan_str_v1', 'f1_score'),
            # planning - json format
            ('plugin_eval-plan_json_v1', 'f1_score'),
            # reasoning - string format
            ('plugin_eval-reason_str_v1', 'thought'),
            # reasoning - json format
            ('plugin_eval-reason_retrieve_understand_json_v1', 'thought'),
            # retrieval - string format
            ('plugin_eval-retrieve_str_v1', 'name'),
            # retrieval - json format
            ('plugin_eval-reason_retrieve_understand_json_v1', 'name'),
            # understanding - string format
            ('plugin_eval-understand_str_v1', 'args'),
            # understanding - json format
            ('plugin_eval-reason_retrieve_understand_json_v1', 'args'),
            # review (reflection) - string format
            ('plugin_eval-review_str_v1', 'review_quality'),
        )
    ],
    # `locals()` is the outermost iterable, so it is evaluated here in module
    # scope and sees the imported `*_summary_groups` names.
    'summary_groups': sum(
        [
            groups
            for var_name, groups in locals().items()
            if var_name.endswith('_summary_groups')
        ],
        [],
    ),
}