File size: 1,770 Bytes
256a159
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
from opencompass.openicl.icl_prompt_template import PromptTemplate
from opencompass.openicl.icl_retriever import ZeroRetriever
from opencompass.openicl.icl_inferencer import PPLInferencer
from opencompass.openicl.icl_evaluator import AccEvaluator
from opencompass.datasets import ARCDataset

# Reader settings: the record fields exposed as inputs (the question plus the
# four option texts interpolated by the prompt templates in this file) and the
# field used as the reference output.
ARC_e_reader_cfg = {
    'input_columns': [
        'question',
        'textA',
        'textB',
        'textC',
        'textD',
    ],
    'output_column': 'answerKey',
}

# Inference settings: one candidate dialogue per answer label ("A".."D").
# Every candidate shares the same HUMAN question turn; only the BOT turn
# differs, carrying the placeholder for that label's option text.
# NOTE(review): presumably PPLInferencer scores each candidate dialogue and
# the template keys are compared against the reader's output column -- confirm
# against the OpenCompass documentation.
ARC_e_infer_cfg = {
    "prompt_template": {
        "type": PromptTemplate,
        "template": {
            label: {
                "round": [
                    {
                        "role": "HUMAN",
                        "prompt": "Question: {question}\nAnswer: ",
                    },
                    {
                        "role": "BOT",
                        "prompt": option_text,
                    },
                ],
            }
            # Pairs are listed explicitly so the placeholder strings stay
            # verbatim and the A-D insertion order is preserved.
            for label, option_text in (
                ("A", "{textA}"),
                ("B", "{textB}"),
                ("C", "{textC}"),
                ("D", "{textD}"),
            )
        },
    },
    # No in-context examples are retrieved (ZeroRetriever).
    "retriever": {"type": ZeroRetriever},
    "inferencer": {"type": PPLInferencer},
}

# Evaluation settings: predictions are scored with AccEvaluator.
ARC_e_eval_cfg = {
    'evaluator': {
        'type': AccEvaluator,
    },
}

# Dataset entries defined by this config: a single ARC-e entry that points at
# the local ARC-Easy dev JSONL file and bundles the reader, inference and
# evaluation settings defined in this file.
ARC_e_datasets = [
    {
        'type': ARCDataset,
        'abbr': 'ARC-e',
        'path': './data/ARC/ARC-e/ARC-Easy-Dev.jsonl',
        'reader_cfg': ARC_e_reader_cfg,
        'infer_cfg': ARC_e_infer_cfg,
        'eval_cfg': ARC_e_eval_cfg,
    },
]