TwT-6
/

api-demo

Model card Files Files and versions Community

File size: 2,589 Bytes

256a159

from opencompass.models.claude_api.claude_api import Claude
from opencompass.models.claude_api.postprocessors import (
    flores_postprocess, gsm8k_postprocess, humaneval_postprocess,
    lcsts_postprocess, mbpp_postprocess, strategyqa_pred_postprocess)
from opencompass.utils.text_postprocessors import last_option_postprocess

agieval_single_choice_sets = [
    'gaokao-chinese',
    'gaokao-english',
    'gaokao-geography',
    'gaokao-history',
    'gaokao-biology',
    'gaokao-chemistry',
    'gaokao-mathqa',
    'logiqa-zh',
    'lsat-ar',
    'lsat-lr',
    'lsat-rc',
    'logiqa-en',
    'sat-math',
    'sat-en',
    'sat-en-without-passage',
    'aqua-rat',
]
agieval_multiple_choices_sets = [
    'gaokao-physics',
    'jec-qa-kd',
    'jec-qa-ca',
]

claude_postprocessors = {
    'ceval-*': dict(type=last_option_postprocess, options='ABCD'),
    'bustm-*': dict(type=last_option_postprocess, options='AB'),
    'hellaswag': dict(type=last_option_postprocess, options='ABCD'),
    'lukaemon_mmlu_*': dict(type=last_option_postprocess, options='ABCD'),
    'openbookqa*': dict(type=last_option_postprocess, options='ABCD'),
    'piqa': dict(type=last_option_postprocess, options='AB'),
    'race-*': dict(type=last_option_postprocess, options='ABCD'),
    'summedits': dict(type=last_option_postprocess, options='AB'),
    'BoolQ': dict(type=last_option_postprocess, options='AB'),
    'CB': dict(type=last_option_postprocess, options='ABC'),
    'MultiRC': dict(type=last_option_postprocess, options='AB'),
    'RTE': dict(type=last_option_postprocess, options='AB'),
    'WiC': dict(type=last_option_postprocess, options='AB'),
    'WSC': dict(type=last_option_postprocess, options='AB'),
    'winogrande': dict(type=last_option_postprocess, options='AB'),
    'gsm8k': dict(type=gsm8k_postprocess),
    'openai_humaneval': dict(type=humaneval_postprocess),
    'lcsts': dict(type=lcsts_postprocess),
    'mbpp': dict(type=mbpp_postprocess),
    'strategyqa': dict(type=strategyqa_pred_postprocess),
    'commonsense_qa': dict(type=last_option_postprocess, options='ABCDE'),
    'flores_100_*-zho_simpl': dict(type=flores_postprocess),
}

for _name in agieval_multiple_choices_sets + agieval_single_choice_sets:
    claude_postprocessors[f'agieval-{_name}'] = dict(type=last_option_postprocess, options='ABCDE')

models = [
    dict(abbr='Claude',
        type=Claude,
        path='claude-1',
        key='YOUR_CLAUDE_KEY',
        query_per_second=1,
        max_out_len=2048, max_seq_len=2048, batch_size=2,
        pred_postprocessor=claude_postprocessors,
    ),
]