File size: 15,368 Bytes
256a159
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
LICENSE
README.md
setup.py
opencompass/__init__.py
opencompass/registry.py
opencompass.egg-info/PKG-INFO
opencompass.egg-info/SOURCES.txt
opencompass.egg-info/dependency_links.txt
opencompass.egg-info/requires.txt
opencompass.egg-info/top_level.txt
opencompass/datasets/FinanceIQ.py
opencompass/datasets/GaokaoBench.py
opencompass/datasets/OpenFinData.py
opencompass/datasets/TheoremQA.py
opencompass/datasets/__init__.py
opencompass/datasets/advglue.py
opencompass/datasets/afqmcd.py
opencompass/datasets/anli.py
opencompass/datasets/anthropics_evals.py
opencompass/datasets/arc.py
opencompass/datasets/ax.py
opencompass/datasets/base.py
opencompass/datasets/bbh.py
opencompass/datasets/boolq.py
opencompass/datasets/bustum.py
opencompass/datasets/c3.py
opencompass/datasets/cb.py
opencompass/datasets/ceval.py
opencompass/datasets/chid.py
opencompass/datasets/cibench.py
opencompass/datasets/circular.py
opencompass/datasets/civilcomments.py
opencompass/datasets/clozeTest_maxmin.py
opencompass/datasets/cluewsc.py
opencompass/datasets/cmb.py
opencompass/datasets/cmmlu.py
opencompass/datasets/cmnli.py
opencompass/datasets/cmrc.py
opencompass/datasets/commonsenseqa.py
opencompass/datasets/commonsenseqa_cn.py
opencompass/datasets/copa.py
opencompass/datasets/crowspairs.py
opencompass/datasets/crowspairs_cn.py
opencompass/datasets/csl.py
opencompass/datasets/custom.py
opencompass/datasets/cvalues.py
opencompass/datasets/drcd.py
opencompass/datasets/drop.py
opencompass/datasets/ds1000.py
opencompass/datasets/ds1000_interpreter.py
opencompass/datasets/eprstmt.py
opencompass/datasets/flores.py
opencompass/datasets/game24.py
opencompass/datasets/govrepcrs.py
opencompass/datasets/gpqa.py
opencompass/datasets/gsm8k.py
opencompass/datasets/gsm_hard.py
opencompass/datasets/hellaswag.py
opencompass/datasets/huggingface.py
opencompass/datasets/humaneval.py
opencompass/datasets/humaneval_multi.py
opencompass/datasets/humanevalx.py
opencompass/datasets/hungarian_math.py
opencompass/datasets/iwslt2017.py
opencompass/datasets/jigsawmultilingual.py
opencompass/datasets/jsonl.py
opencompass/datasets/kaoshi.py
opencompass/datasets/lambada.py
opencompass/datasets/lcsts.py
opencompass/datasets/lmeval.py
opencompass/datasets/mastermath2024v1.py
opencompass/datasets/math.py
opencompass/datasets/math401.py
opencompass/datasets/math_intern.py
opencompass/datasets/mathbench.py
opencompass/datasets/mbpp.py
opencompass/datasets/mmlu.py
opencompass/datasets/multirc.py
opencompass/datasets/narrativeqa.py
opencompass/datasets/natural_question.py
opencompass/datasets/natural_question_cn.py
opencompass/datasets/obqa.py
opencompass/datasets/piqa.py
opencompass/datasets/py150.py
opencompass/datasets/qasper.py
opencompass/datasets/qaspercut.py
opencompass/datasets/race.py
opencompass/datasets/realtoxicprompts.py
opencompass/datasets/record.py
opencompass/datasets/rolebench.py
opencompass/datasets/safety.py
opencompass/datasets/scibench.py
opencompass/datasets/siqa.py
opencompass/datasets/squad20.py
opencompass/datasets/storycloze.py
opencompass/datasets/strategyqa.py
opencompass/datasets/summedits.py
opencompass/datasets/summscreen.py
opencompass/datasets/svamp.py
opencompass/datasets/tabmwp.py
opencompass/datasets/tnews.py
opencompass/datasets/triviaqa.py
opencompass/datasets/triviaqarc.py
opencompass/datasets/truthfulqa.py
opencompass/datasets/tydiqa.py
opencompass/datasets/wic.py
opencompass/datasets/wikibench.py
opencompass/datasets/winograd.py
opencompass/datasets/winogrande.py
opencompass/datasets/wnli.py
opencompass/datasets/wsc.py
opencompass/datasets/xcopa.py
opencompass/datasets/xiezhi.py
opencompass/datasets/xlsum.py
opencompass/datasets/xsum.py
opencompass/datasets/NPHardEval/__init__.py
opencompass/datasets/NPHardEval/cmp_GCP_D.py
opencompass/datasets/NPHardEval/cmp_KSP.py
opencompass/datasets/NPHardEval/cmp_TSP_D.py
opencompass/datasets/NPHardEval/hard_GCP.py
opencompass/datasets/NPHardEval/hard_MSP.py
opencompass/datasets/NPHardEval/hard_TSP.py
opencompass/datasets/NPHardEval/p_BSP.py
opencompass/datasets/NPHardEval/p_EDP.py
opencompass/datasets/NPHardEval/p_SPP.py
opencompass/datasets/NPHardEval/prompts.py
opencompass/datasets/NPHardEval/utils.py
opencompass/datasets/agieval/__init__.py
opencompass/datasets/agieval/agieval.py
opencompass/datasets/agieval/constructions.py
opencompass/datasets/agieval/dataset_loader.py
opencompass/datasets/agieval/evaluation.py
opencompass/datasets/agieval/math_equivalence.py
opencompass/datasets/agieval/post_process.py
opencompass/datasets/agieval/utils.py
opencompass/datasets/infinitebench/__init__.py
opencompass/datasets/infinitebench/infinitebench_codedebug.py
opencompass/datasets/infinitebench/infinitebench_coderun.py
opencompass/datasets/infinitebench/infinitebench_endia.py
opencompass/datasets/infinitebench/infinitebench_enmc.py
opencompass/datasets/infinitebench/infinitebench_enqa.py
opencompass/datasets/infinitebench/infinitebench_ensum.py
opencompass/datasets/infinitebench/infinitebench_mathcalc.py
opencompass/datasets/infinitebench/infinitebench_mathfind.py
opencompass/datasets/infinitebench/infinitebench_retrievekv.py
opencompass/datasets/infinitebench/infinitebench_retrievenumber.py
opencompass/datasets/infinitebench/infinitebench_retrievepasskey.py
opencompass/datasets/infinitebench/infinitebench_zhqa.py
opencompass/datasets/infinitebench/utils.py
opencompass/datasets/lawbench/__init__.py
opencompass/datasets/lawbench/lawbench.py
opencompass/datasets/leval/__init__.py
opencompass/datasets/leval/evaluators.py
opencompass/datasets/leval/leval_coursera.py
opencompass/datasets/leval/leval_financial_qa.py
opencompass/datasets/leval/leval_gov_report_summ.py
opencompass/datasets/leval/leval_gsm100.py
opencompass/datasets/leval/leval_legal_contract_qa.py
opencompass/datasets/leval/leval_meeting_summ.py
opencompass/datasets/leval/leval_multidoc_qa.py
opencompass/datasets/leval/leval_narrattive_qa.py
opencompass/datasets/leval/leval_natural_question.py
opencompass/datasets/leval/leval_news_summ.py
opencompass/datasets/leval/leval_paper_assistant.py
opencompass/datasets/leval/leval_patent_summ.py
opencompass/datasets/leval/leval_quality.py
opencompass/datasets/leval/leval_review_summ.py
opencompass/datasets/leval/leval_scientific_qa.py
opencompass/datasets/leval/leval_topic_retrieval.py
opencompass/datasets/leval/leval_tpo.py
opencompass/datasets/leval/leval_tvshow_summ.py
opencompass/datasets/longbench/__init__.py
opencompass/datasets/longbench/evaluators.py
opencompass/datasets/longbench/longbench_2wikim_qa.py
opencompass/datasets/longbench/longbench_dureader.py
opencompass/datasets/longbench/longbench_gov_report.py
opencompass/datasets/longbench/longbench_hotpot_qa.py
opencompass/datasets/longbench/longbench_lcc.py
opencompass/datasets/longbench/longbench_lsht.py
opencompass/datasets/longbench/longbench_multi_news.py
opencompass/datasets/longbench/longbench_multifieldqa_en.py
opencompass/datasets/longbench/longbench_multifieldqa_zh.py
opencompass/datasets/longbench/longbench_musique.py
opencompass/datasets/longbench/longbench_narrative_qa.py
opencompass/datasets/longbench/longbench_passage_count.py
opencompass/datasets/longbench/longbench_passage_retrieval_en.py
opencompass/datasets/longbench/longbench_passage_retrieval_zh.py
opencompass/datasets/longbench/longbench_qasper.py
opencompass/datasets/longbench/longbench_qmsum.py
opencompass/datasets/longbench/longbench_repobench.py
opencompass/datasets/longbench/longbench_samsum.py
opencompass/datasets/longbench/longbench_trec.py
opencompass/datasets/longbench/longbench_trivia_qa.py
opencompass/datasets/longbench/longbench_vcsum.py
opencompass/datasets/lveval/__init__.py
opencompass/datasets/lveval/evaluators.py
opencompass/datasets/lveval/lveval_cmrc_mixup.py
opencompass/datasets/lveval/lveval_dureader_mixup.py
opencompass/datasets/lveval/lveval_factrecall_en.py
opencompass/datasets/lveval/lveval_factrecall_zh.py
opencompass/datasets/lveval/lveval_hotpotwikiqa_mixup.py
opencompass/datasets/lveval/lveval_lic_mixup.py
opencompass/datasets/lveval/lveval_loogle_CR_mixup.py
opencompass/datasets/lveval/lveval_loogle_MIR_mixup.py
opencompass/datasets/lveval/lveval_loogle_SD_mixup.py
opencompass/datasets/lveval/lveval_multifieldqa_en_mixup.py
opencompass/datasets/lveval/lveval_multifieldqa_zh_mixup.py
opencompass/datasets/medbench/__init__.py
opencompass/datasets/medbench/constructions.py
opencompass/datasets/medbench/dataset_loader.py
opencompass/datasets/medbench/evaluation.py
opencompass/datasets/medbench/math_equivalence.py
opencompass/datasets/medbench/medbench.py
opencompass/datasets/medbench/post_process.py
opencompass/datasets/medbench/utils.py
opencompass/datasets/reasonbench/ReasonBenchDataset.py
opencompass/datasets/reasonbench/__init__.py
opencompass/datasets/subjective/__init__.py
opencompass/datasets/subjective/alignbench.py
opencompass/datasets/subjective/compass_arena.py
opencompass/datasets/subjective/corev2.py
opencompass/datasets/subjective/creationbench.py
opencompass/datasets/subjective/information_retrival.py
opencompass/datasets/subjective/mtbench.py
opencompass/datasets/subjective/multiround.py
opencompass/datasets/subjective/subjective_cmp.py
opencompass/datasets/teval/__init__.py
opencompass/datasets/teval/schema.py
opencompass/datasets/teval/evaluators/__init__.py
opencompass/datasets/teval/evaluators/instruct_evaluator.py
opencompass/datasets/teval/evaluators/planning_evaluator.py
opencompass/datasets/teval/evaluators/reason_retrieve_understand_evaluator.py
opencompass/datasets/teval/evaluators/review_evaluator.py
opencompass/datasets/teval/utils/__init__.py
opencompass/datasets/teval/utils/convert_results.py
opencompass/datasets/teval/utils/format_load.py
opencompass/datasets/teval/utils/meta_template.py
opencompass/datasets/teval/utils/template.py
opencompass/metrics/__init__.py
opencompass/metrics/dump_results.py
opencompass/metrics/mme_score.py
opencompass/metrics/seedbench.py
opencompass/models/__init__.py
opencompass/models/accessory.py
opencompass/models/ai360_api.py
opencompass/models/alaya.py
opencompass/models/baichuan_api.py
opencompass/models/baidu_api.py
opencompass/models/base.py
opencompass/models/base_api.py
opencompass/models/bytedance_api.py
opencompass/models/gemini_api.py
opencompass/models/glm.py
opencompass/models/huggingface.py
opencompass/models/intern_model.py
opencompass/models/krgpt_api.py
opencompass/models/lagent.py
opencompass/models/langchain.py
opencompass/models/lightllm_api.py
opencompass/models/llama2.py
opencompass/models/lmdeploy_pytorch.py
opencompass/models/minimax_api.py
opencompass/models/mixtral.py
opencompass/models/modelscope.py
opencompass/models/moonshot_api.py
opencompass/models/nanbeige_api.py
opencompass/models/openai_api.py
opencompass/models/pangu_api.py
opencompass/models/qwen_api.py
opencompass/models/sensetime_api.py
opencompass/models/turbomind.py
opencompass/models/turbomind_api.py
opencompass/models/turbomind_tis.py
opencompass/models/vllm.py
opencompass/models/xunfei_api.py
opencompass/models/zhipuai_api.py
opencompass/models/zhipuai_v2_api.py
opencompass/models/claude_api/__init__.py
opencompass/models/claude_api/claude_api.py
opencompass/models/claude_api/postprocessors.py
opencompass/openicl/__init__.py
opencompass/openicl/icl_dataset_reader.py
opencompass/openicl/icl_prompt_template.py
opencompass/openicl/icl_evaluator/__init__.py
opencompass/openicl/icl_evaluator/icl_agent_evaluator.py
opencompass/openicl/icl_evaluator/icl_aucroc_evaluator.py
opencompass/openicl/icl_evaluator/icl_base_evaluator.py
opencompass/openicl/icl_evaluator/icl_circular_evaluator.py
opencompass/openicl/icl_evaluator/icl_em_evaluator.py
opencompass/openicl/icl_evaluator/icl_hf_evaluator.py
opencompass/openicl/icl_evaluator/icl_jieba_rouge_evaluator.py
opencompass/openicl/icl_evaluator/icl_misc_evaluator.py
opencompass/openicl/icl_evaluator/icl_plugin_evaluator.py
opencompass/openicl/icl_evaluator/icl_toxic_evaluator.py
opencompass/openicl/icl_evaluator/lm_evaluator.py
opencompass/openicl/icl_inferencer/__init__.py
opencompass/openicl/icl_inferencer/icl_agent_inferencer.py
opencompass/openicl/icl_inferencer/icl_attack_inferencer.py
opencompass/openicl/icl_inferencer/icl_base_inferencer.py
opencompass/openicl/icl_inferencer/icl_chat_inferencer.py
opencompass/openicl/icl_inferencer/icl_clp_inferencer.py
opencompass/openicl/icl_inferencer/icl_gen_inferencer.py
opencompass/openicl/icl_inferencer/icl_ll_inferencer.py
opencompass/openicl/icl_inferencer/icl_mink_percent_inferencer.py
opencompass/openicl/icl_inferencer/icl_ppl_inferencer.py
opencompass/openicl/icl_inferencer/icl_ppl_only_inferencer.py
opencompass/openicl/icl_inferencer/icl_sc_inferencer.py
opencompass/openicl/icl_inferencer/icl_tot_inferencer.py
opencompass/openicl/icl_retriever/__init__.py
opencompass/openicl/icl_retriever/icl_base_retriever.py
opencompass/openicl/icl_retriever/icl_bm25_retriever.py
opencompass/openicl/icl_retriever/icl_dpp_retriever.py
opencompass/openicl/icl_retriever/icl_fix_k_retriever.py
opencompass/openicl/icl_retriever/icl_mdl_retriever.py
opencompass/openicl/icl_retriever/icl_random_retriever.py
opencompass/openicl/icl_retriever/icl_topk_retriever.py
opencompass/openicl/icl_retriever/icl_votek_retriever.py
opencompass/openicl/icl_retriever/icl_zero_retriever.py
opencompass/openicl/utils/__init__.py
opencompass/openicl/utils/logging.py
opencompass/partitioners/__init__.py
opencompass/partitioners/base.py
opencompass/partitioners/mm_naive.py
opencompass/partitioners/naive.py
opencompass/partitioners/num_worker.py
opencompass/partitioners/size.py
opencompass/partitioners/sub_naive.py
opencompass/partitioners/sub_size.py
opencompass/runners/__init__.py
opencompass/runners/base.py
opencompass/runners/dlc.py
opencompass/runners/local.py
opencompass/runners/local_api.py
opencompass/runners/slurm.py
opencompass/runners/slurm_sequential.py
opencompass/summarizers/__init__.py
opencompass/summarizers/circular.py
opencompass/summarizers/default.py
opencompass/summarizers/multi_model.py
opencompass/summarizers/needlebench.py
opencompass/summarizers/summarizer_pretrain.py
opencompass/summarizers/subjective/__init__.py
opencompass/summarizers/subjective/alignmentbench.py
opencompass/summarizers/subjective/alpacaeval.py
opencompass/summarizers/subjective/compass_arena.py
opencompass/summarizers/subjective/corev2.py
opencompass/summarizers/subjective/creationbench.py
opencompass/summarizers/subjective/information_retrival.py
opencompass/summarizers/subjective/mtbench.py
opencompass/summarizers/subjective/multiround.py
opencompass/summarizers/subjective/subjective_post_process.py
opencompass/summarizers/subjective/utils.py
opencompass/tasks/__init__.py
opencompass/tasks/base.py
opencompass/tasks/llm_eval.py
opencompass/tasks/mm_infer.py
opencompass/tasks/openicl_attack.py
opencompass/tasks/openicl_eval.py
opencompass/tasks/openicl_infer.py
opencompass/tasks/subjective_eval.py
opencompass/utils/__init__.py
opencompass/utils/abbr.py
opencompass/utils/auxiliary.py
opencompass/utils/build.py
opencompass/utils/collect_env.py
opencompass/utils/dependency.py
opencompass/utils/file.py
opencompass/utils/fileio.py
opencompass/utils/lark.py
opencompass/utils/logging.py
opencompass/utils/menu.py
opencompass/utils/prompt.py
opencompass/utils/run.py
opencompass/utils/text_postprocessors.py
opencompass/utils/types.py