TwT-6
/

api-demo

Model card Files Files and versions Community

api-demo / opencompass-my-api /configs /summarizers /compass_math.py

TwT-6

Upload 2667 files

256a159 verified 8 months ago

raw

history blame

2.02 kB

	# This summarizer is used for `./datasets/compassbench_v1_math/compassbench_v1_math_gen`

	# Summary groups for the CompassBench v1 math datasets.  Each entry has a
	# group `name` and a list of `[dataset_abbr, metric]` subsets.
	# NOTE(review): how the subsets are combined into the group score is decided
	# by the summarizer implementation, not by this file -- confirm there.
	compassbench_v1_math_groups = [
	    # Single-choice subsets scored with `acc_1`, plus the cloze subsets.
	    dict(
	        name='math_acc_1_and_fill_in_blank',
	        subsets=[
	            ['compassbench_v1_math-high-single_choice_cn', 'acc_1'],
	            ['compassbench_v1_math-high-single_choice_en', 'acc_1'],
	            ['compassbench_v1_math-middle-single_choice_cn', 'acc_1'],
	            ['compassbench_v1_math-middle-single_choice_en', 'acc_1'],
	            ['compassbench_v1_math-primary-cloze_cn', 'accuracy'],
	            ['compassbench_v1_math-primary-cloze_en', 'accuracy'],
	        ],
	    ),
	    # Same six subsets, with single-choice scored by `perf_4` instead.
	    dict(
	        name='math_perf_4_and_fill_in_blank',
	        subsets=[
	            ['compassbench_v1_math-high-single_choice_cn', 'perf_4'],
	            ['compassbench_v1_math-high-single_choice_en', 'perf_4'],
	            ['compassbench_v1_math-middle-single_choice_cn', 'perf_4'],
	            ['compassbench_v1_math-middle-single_choice_en', 'perf_4'],
	            ['compassbench_v1_math-primary-cloze_cn', 'accuracy'],
	            ['compassbench_v1_math-primary-cloze_en', 'accuracy'],
	        ],
	    ),
	    # `perf_4` group restricted to the `_cn` subsets.
	    dict(
	        name='math_perf_4_and_fill_in_blank_cn',
	        subsets=[
	            ['compassbench_v1_math-high-single_choice_cn', 'perf_4'],
	            ['compassbench_v1_math-middle-single_choice_cn', 'perf_4'],
	            ['compassbench_v1_math-primary-cloze_cn', 'accuracy'],
	        ],
	    ),
	    # `perf_4` group restricted to the `_en` subsets.
	    dict(
	        name='math_perf_4_and_fill_in_blank_en',
	        subsets=[
	            ['compassbench_v1_math-high-single_choice_en', 'perf_4'],
	            ['compassbench_v1_math-middle-single_choice_en', 'perf_4'],
	            ['compassbench_v1_math-primary-cloze_en', 'accuracy'],
	        ],
	    ),
	]


	# Summarizer configuration for the CompassBench v1 math datasets.
	# NOTE(review): `dataset_abbrs` presumably selects and orders the entries
	# shown in the summary -- confirm against the summarizer implementation.
	summarizer = {
	    'dataset_abbrs': [
	        # Group entries, referenced by name.
	        'math_perf_4_and_fill_in_blank',
	        'math_perf_4_and_fill_in_blank_cn',
	        'math_perf_4_and_fill_in_blank_en',
	        # Individual [dataset_abbr, metric] entries.
	        ['compassbench_v1_math-high-single_choice_cn', 'perf_4'],
	        ['compassbench_v1_math-high-single_choice_en', 'perf_4'],
	        ['compassbench_v1_math-middle-single_choice_cn', 'perf_4'],
	        ['compassbench_v1_math-middle-single_choice_en', 'perf_4'],
	        ['compassbench_v1_math-primary-cloze_cn', 'accuracy'],
	        ['compassbench_v1_math-primary-cloze_en', 'accuracy'],
	    ],
	    # Group definitions come from the module-level list in this file.
	    'summary_groups': compassbench_v1_math_groups,
	}