File size: 15,368 Bytes
256a159 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348 349 350 351 352 353 354 355 356 357 358 359 360 361 362 363 364 365 366 367 368 369 370 371 372 373 374 375 |
LICENSE README.md setup.py opencompass/__init__.py opencompass/registry.py opencompass.egg-info/PKG-INFO opencompass.egg-info/SOURCES.txt opencompass.egg-info/dependency_links.txt opencompass.egg-info/requires.txt opencompass.egg-info/top_level.txt opencompass/datasets/FinanceIQ.py opencompass/datasets/GaokaoBench.py opencompass/datasets/OpenFinData.py opencompass/datasets/TheoremQA.py opencompass/datasets/__init__.py opencompass/datasets/advglue.py opencompass/datasets/afqmcd.py opencompass/datasets/anli.py opencompass/datasets/anthropics_evals.py opencompass/datasets/arc.py opencompass/datasets/ax.py opencompass/datasets/base.py opencompass/datasets/bbh.py opencompass/datasets/boolq.py opencompass/datasets/bustum.py opencompass/datasets/c3.py opencompass/datasets/cb.py opencompass/datasets/ceval.py opencompass/datasets/chid.py opencompass/datasets/cibench.py opencompass/datasets/circular.py opencompass/datasets/civilcomments.py opencompass/datasets/clozeTest_maxmin.py opencompass/datasets/cluewsc.py opencompass/datasets/cmb.py opencompass/datasets/cmmlu.py opencompass/datasets/cmnli.py opencompass/datasets/cmrc.py opencompass/datasets/commonsenseqa.py opencompass/datasets/commonsenseqa_cn.py opencompass/datasets/copa.py opencompass/datasets/crowspairs.py opencompass/datasets/crowspairs_cn.py opencompass/datasets/csl.py opencompass/datasets/custom.py opencompass/datasets/cvalues.py opencompass/datasets/drcd.py opencompass/datasets/drop.py opencompass/datasets/ds1000.py opencompass/datasets/ds1000_interpreter.py opencompass/datasets/eprstmt.py opencompass/datasets/flores.py opencompass/datasets/game24.py opencompass/datasets/govrepcrs.py opencompass/datasets/gpqa.py opencompass/datasets/gsm8k.py opencompass/datasets/gsm_hard.py opencompass/datasets/hellaswag.py opencompass/datasets/huggingface.py opencompass/datasets/humaneval.py opencompass/datasets/humaneval_multi.py opencompass/datasets/humanevalx.py opencompass/datasets/hungarian_math.py opencompass/datasets/iwslt2017.py opencompass/datasets/jigsawmultilingual.py opencompass/datasets/jsonl.py opencompass/datasets/kaoshi.py opencompass/datasets/lambada.py opencompass/datasets/lcsts.py opencompass/datasets/lmeval.py opencompass/datasets/mastermath2024v1.py opencompass/datasets/math.py opencompass/datasets/math401.py opencompass/datasets/math_intern.py opencompass/datasets/mathbench.py opencompass/datasets/mbpp.py opencompass/datasets/mmlu.py opencompass/datasets/multirc.py opencompass/datasets/narrativeqa.py opencompass/datasets/natural_question.py opencompass/datasets/natural_question_cn.py opencompass/datasets/obqa.py opencompass/datasets/piqa.py opencompass/datasets/py150.py opencompass/datasets/qasper.py opencompass/datasets/qaspercut.py opencompass/datasets/race.py opencompass/datasets/realtoxicprompts.py opencompass/datasets/record.py opencompass/datasets/rolebench.py opencompass/datasets/safety.py opencompass/datasets/scibench.py opencompass/datasets/siqa.py opencompass/datasets/squad20.py opencompass/datasets/storycloze.py opencompass/datasets/strategyqa.py opencompass/datasets/summedits.py opencompass/datasets/summscreen.py opencompass/datasets/svamp.py opencompass/datasets/tabmwp.py opencompass/datasets/tnews.py opencompass/datasets/triviaqa.py opencompass/datasets/triviaqarc.py opencompass/datasets/truthfulqa.py opencompass/datasets/tydiqa.py opencompass/datasets/wic.py opencompass/datasets/wikibench.py opencompass/datasets/winograd.py opencompass/datasets/winogrande.py opencompass/datasets/wnli.py opencompass/datasets/wsc.py opencompass/datasets/xcopa.py opencompass/datasets/xiezhi.py opencompass/datasets/xlsum.py opencompass/datasets/xsum.py opencompass/datasets/NPHardEval/__init__.py opencompass/datasets/NPHardEval/cmp_GCP_D.py opencompass/datasets/NPHardEval/cmp_KSP.py opencompass/datasets/NPHardEval/cmp_TSP_D.py opencompass/datasets/NPHardEval/hard_GCP.py opencompass/datasets/NPHardEval/hard_MSP.py opencompass/datasets/NPHardEval/hard_TSP.py opencompass/datasets/NPHardEval/p_BSP.py opencompass/datasets/NPHardEval/p_EDP.py opencompass/datasets/NPHardEval/p_SPP.py opencompass/datasets/NPHardEval/prompts.py opencompass/datasets/NPHardEval/utils.py opencompass/datasets/agieval/__init__.py opencompass/datasets/agieval/agieval.py opencompass/datasets/agieval/constructions.py opencompass/datasets/agieval/dataset_loader.py opencompass/datasets/agieval/evaluation.py opencompass/datasets/agieval/math_equivalence.py opencompass/datasets/agieval/post_process.py opencompass/datasets/agieval/utils.py opencompass/datasets/infinitebench/__init__.py opencompass/datasets/infinitebench/infinitebench_codedebug.py opencompass/datasets/infinitebench/infinitebench_coderun.py opencompass/datasets/infinitebench/infinitebench_endia.py opencompass/datasets/infinitebench/infinitebench_enmc.py opencompass/datasets/infinitebench/infinitebench_enqa.py opencompass/datasets/infinitebench/infinitebench_ensum.py opencompass/datasets/infinitebench/infinitebench_mathcalc.py opencompass/datasets/infinitebench/infinitebench_mathfind.py opencompass/datasets/infinitebench/infinitebench_retrievekv.py opencompass/datasets/infinitebench/infinitebench_retrievenumber.py opencompass/datasets/infinitebench/infinitebench_retrievepasskey.py opencompass/datasets/infinitebench/infinitebench_zhqa.py opencompass/datasets/infinitebench/utils.py opencompass/datasets/lawbench/__init__.py opencompass/datasets/lawbench/lawbench.py opencompass/datasets/leval/__init__.py opencompass/datasets/leval/evaluators.py opencompass/datasets/leval/leval_coursera.py opencompass/datasets/leval/leval_financial_qa.py opencompass/datasets/leval/leval_gov_report_summ.py opencompass/datasets/leval/leval_gsm100.py opencompass/datasets/leval/leval_legal_contract_qa.py opencompass/datasets/leval/leval_meeting_summ.py opencompass/datasets/leval/leval_multidoc_qa.py opencompass/datasets/leval/leval_narrattive_qa.py opencompass/datasets/leval/leval_natural_question.py opencompass/datasets/leval/leval_news_summ.py opencompass/datasets/leval/leval_paper_assistant.py opencompass/datasets/leval/leval_patent_summ.py opencompass/datasets/leval/leval_quality.py opencompass/datasets/leval/leval_review_summ.py opencompass/datasets/leval/leval_scientific_qa.py opencompass/datasets/leval/leval_topic_retrieval.py opencompass/datasets/leval/leval_tpo.py opencompass/datasets/leval/leval_tvshow_summ.py opencompass/datasets/longbench/__init__.py opencompass/datasets/longbench/evaluators.py opencompass/datasets/longbench/longbench_2wikim_qa.py opencompass/datasets/longbench/longbench_dureader.py opencompass/datasets/longbench/longbench_gov_report.py opencompass/datasets/longbench/longbench_hotpot_qa.py opencompass/datasets/longbench/longbench_lcc.py opencompass/datasets/longbench/longbench_lsht.py opencompass/datasets/longbench/longbench_multi_news.py opencompass/datasets/longbench/longbench_multifieldqa_en.py opencompass/datasets/longbench/longbench_multifieldqa_zh.py opencompass/datasets/longbench/longbench_musique.py opencompass/datasets/longbench/longbench_narrative_qa.py opencompass/datasets/longbench/longbench_passage_count.py opencompass/datasets/longbench/longbench_passage_retrieval_en.py opencompass/datasets/longbench/longbench_passage_retrieval_zh.py opencompass/datasets/longbench/longbench_qasper.py opencompass/datasets/longbench/longbench_qmsum.py opencompass/datasets/longbench/longbench_repobench.py opencompass/datasets/longbench/longbench_samsum.py opencompass/datasets/longbench/longbench_trec.py opencompass/datasets/longbench/longbench_trivia_qa.py opencompass/datasets/longbench/longbench_vcsum.py opencompass/datasets/lveval/__init__.py opencompass/datasets/lveval/evaluators.py opencompass/datasets/lveval/lveval_cmrc_mixup.py opencompass/datasets/lveval/lveval_dureader_mixup.py opencompass/datasets/lveval/lveval_factrecall_en.py opencompass/datasets/lveval/lveval_factrecall_zh.py opencompass/datasets/lveval/lveval_hotpotwikiqa_mixup.py opencompass/datasets/lveval/lveval_lic_mixup.py opencompass/datasets/lveval/lveval_loogle_CR_mixup.py opencompass/datasets/lveval/lveval_loogle_MIR_mixup.py opencompass/datasets/lveval/lveval_loogle_SD_mixup.py opencompass/datasets/lveval/lveval_multifieldqa_en_mixup.py opencompass/datasets/lveval/lveval_multifieldqa_zh_mixup.py opencompass/datasets/medbench/__init__.py opencompass/datasets/medbench/constructions.py opencompass/datasets/medbench/dataset_loader.py opencompass/datasets/medbench/evaluation.py opencompass/datasets/medbench/math_equivalence.py opencompass/datasets/medbench/medbench.py opencompass/datasets/medbench/post_process.py opencompass/datasets/medbench/utils.py opencompass/datasets/reasonbench/ReasonBenchDataset.py opencompass/datasets/reasonbench/__init__.py opencompass/datasets/subjective/__init__.py opencompass/datasets/subjective/alignbench.py opencompass/datasets/subjective/compass_arena.py opencompass/datasets/subjective/corev2.py opencompass/datasets/subjective/creationbench.py opencompass/datasets/subjective/information_retrival.py opencompass/datasets/subjective/mtbench.py opencompass/datasets/subjective/multiround.py opencompass/datasets/subjective/subjective_cmp.py opencompass/datasets/teval/__init__.py opencompass/datasets/teval/schema.py opencompass/datasets/teval/evaluators/__init__.py opencompass/datasets/teval/evaluators/instruct_evaluator.py opencompass/datasets/teval/evaluators/planning_evaluator.py opencompass/datasets/teval/evaluators/reason_retrieve_understand_evaluator.py opencompass/datasets/teval/evaluators/review_evaluator.py opencompass/datasets/teval/utils/__init__.py opencompass/datasets/teval/utils/convert_results.py opencompass/datasets/teval/utils/format_load.py opencompass/datasets/teval/utils/meta_template.py opencompass/datasets/teval/utils/template.py opencompass/metrics/__init__.py opencompass/metrics/dump_results.py opencompass/metrics/mme_score.py opencompass/metrics/seedbench.py opencompass/models/__init__.py opencompass/models/accessory.py opencompass/models/ai360_api.py opencompass/models/alaya.py opencompass/models/baichuan_api.py opencompass/models/baidu_api.py opencompass/models/base.py opencompass/models/base_api.py opencompass/models/bytedance_api.py opencompass/models/gemini_api.py opencompass/models/glm.py opencompass/models/huggingface.py opencompass/models/intern_model.py opencompass/models/krgpt_api.py opencompass/models/lagent.py opencompass/models/langchain.py opencompass/models/lightllm_api.py opencompass/models/llama2.py opencompass/models/lmdeploy_pytorch.py opencompass/models/minimax_api.py opencompass/models/mixtral.py opencompass/models/modelscope.py opencompass/models/moonshot_api.py opencompass/models/nanbeige_api.py opencompass/models/openai_api.py opencompass/models/pangu_api.py opencompass/models/qwen_api.py opencompass/models/sensetime_api.py opencompass/models/turbomind.py opencompass/models/turbomind_api.py opencompass/models/turbomind_tis.py opencompass/models/vllm.py opencompass/models/xunfei_api.py opencompass/models/zhipuai_api.py opencompass/models/zhipuai_v2_api.py opencompass/models/claude_api/__init__.py opencompass/models/claude_api/claude_api.py opencompass/models/claude_api/postprocessors.py opencompass/openicl/__init__.py opencompass/openicl/icl_dataset_reader.py opencompass/openicl/icl_prompt_template.py opencompass/openicl/icl_evaluator/__init__.py opencompass/openicl/icl_evaluator/icl_agent_evaluator.py opencompass/openicl/icl_evaluator/icl_aucroc_evaluator.py opencompass/openicl/icl_evaluator/icl_base_evaluator.py opencompass/openicl/icl_evaluator/icl_circular_evaluator.py opencompass/openicl/icl_evaluator/icl_em_evaluator.py opencompass/openicl/icl_evaluator/icl_hf_evaluator.py opencompass/openicl/icl_evaluator/icl_jieba_rouge_evaluator.py opencompass/openicl/icl_evaluator/icl_misc_evaluator.py opencompass/openicl/icl_evaluator/icl_plugin_evaluator.py opencompass/openicl/icl_evaluator/icl_toxic_evaluator.py opencompass/openicl/icl_evaluator/lm_evaluator.py opencompass/openicl/icl_inferencer/__init__.py opencompass/openicl/icl_inferencer/icl_agent_inferencer.py opencompass/openicl/icl_inferencer/icl_attack_inferencer.py opencompass/openicl/icl_inferencer/icl_base_inferencer.py opencompass/openicl/icl_inferencer/icl_chat_inferencer.py opencompass/openicl/icl_inferencer/icl_clp_inferencer.py opencompass/openicl/icl_inferencer/icl_gen_inferencer.py opencompass/openicl/icl_inferencer/icl_ll_inferencer.py opencompass/openicl/icl_inferencer/icl_mink_percent_inferencer.py opencompass/openicl/icl_inferencer/icl_ppl_inferencer.py opencompass/openicl/icl_inferencer/icl_ppl_only_inferencer.py opencompass/openicl/icl_inferencer/icl_sc_inferencer.py opencompass/openicl/icl_inferencer/icl_tot_inferencer.py opencompass/openicl/icl_retriever/__init__.py opencompass/openicl/icl_retriever/icl_base_retriever.py opencompass/openicl/icl_retriever/icl_bm25_retriever.py opencompass/openicl/icl_retriever/icl_dpp_retriever.py opencompass/openicl/icl_retriever/icl_fix_k_retriever.py opencompass/openicl/icl_retriever/icl_mdl_retriever.py opencompass/openicl/icl_retriever/icl_random_retriever.py opencompass/openicl/icl_retriever/icl_topk_retriever.py opencompass/openicl/icl_retriever/icl_votek_retriever.py opencompass/openicl/icl_retriever/icl_zero_retriever.py opencompass/openicl/utils/__init__.py opencompass/openicl/utils/logging.py opencompass/partitioners/__init__.py opencompass/partitioners/base.py opencompass/partitioners/mm_naive.py opencompass/partitioners/naive.py opencompass/partitioners/num_worker.py opencompass/partitioners/size.py opencompass/partitioners/sub_naive.py opencompass/partitioners/sub_size.py opencompass/runners/__init__.py opencompass/runners/base.py opencompass/runners/dlc.py opencompass/runners/local.py opencompass/runners/local_api.py opencompass/runners/slurm.py opencompass/runners/slurm_sequential.py opencompass/summarizers/__init__.py opencompass/summarizers/circular.py opencompass/summarizers/default.py opencompass/summarizers/multi_model.py opencompass/summarizers/needlebench.py opencompass/summarizers/summarizer_pretrain.py opencompass/summarizers/subjective/__init__.py opencompass/summarizers/subjective/alignmentbench.py opencompass/summarizers/subjective/alpacaeval.py opencompass/summarizers/subjective/compass_arena.py opencompass/summarizers/subjective/corev2.py opencompass/summarizers/subjective/creationbench.py opencompass/summarizers/subjective/information_retrival.py opencompass/summarizers/subjective/mtbench.py opencompass/summarizers/subjective/multiround.py opencompass/summarizers/subjective/subjective_post_process.py opencompass/summarizers/subjective/utils.py opencompass/tasks/__init__.py opencompass/tasks/base.py opencompass/tasks/llm_eval.py opencompass/tasks/mm_infer.py opencompass/tasks/openicl_attack.py opencompass/tasks/openicl_eval.py opencompass/tasks/openicl_infer.py opencompass/tasks/subjective_eval.py opencompass/utils/__init__.py opencompass/utils/abbr.py opencompass/utils/auxiliary.py opencompass/utils/build.py opencompass/utils/collect_env.py opencompass/utils/dependency.py opencompass/utils/file.py opencompass/utils/fileio.py opencompass/utils/lark.py opencompass/utils/logging.py opencompass/utils/menu.py opencompass/utils/prompt.py opencompass/utils/run.py opencompass/utils/text_postprocessors.py opencompass/utils/types.py |