LICENSE README.md setup.py opencompass/__init__.py opencompass/registry.py opencompass.egg-info/PKG-INFO opencompass.egg-info/SOURCES.txt opencompass.egg-info/dependency_links.txt opencompass.egg-info/requires.txt opencompass.egg-info/top_level.txt opencompass/datasets/FinanceIQ.py opencompass/datasets/GaokaoBench.py opencompass/datasets/OpenFinData.py opencompass/datasets/TheoremQA.py opencompass/datasets/__init__.py opencompass/datasets/advglue.py opencompass/datasets/afqmcd.py opencompass/datasets/anli.py opencompass/datasets/anthropics_evals.py opencompass/datasets/arc.py opencompass/datasets/ax.py opencompass/datasets/base.py opencompass/datasets/bbh.py opencompass/datasets/boolq.py opencompass/datasets/bustum.py opencompass/datasets/c3.py opencompass/datasets/cb.py opencompass/datasets/ceval.py opencompass/datasets/chid.py opencompass/datasets/cibench.py opencompass/datasets/circular.py opencompass/datasets/civilcomments.py opencompass/datasets/clozeTest_maxmin.py opencompass/datasets/cluewsc.py opencompass/datasets/cmb.py opencompass/datasets/cmmlu.py opencompass/datasets/cmnli.py opencompass/datasets/cmrc.py opencompass/datasets/commonsenseqa.py opencompass/datasets/commonsenseqa_cn.py opencompass/datasets/copa.py opencompass/datasets/crowspairs.py opencompass/datasets/crowspairs_cn.py opencompass/datasets/csl.py opencompass/datasets/custom.py opencompass/datasets/cvalues.py opencompass/datasets/drcd.py opencompass/datasets/drop.py opencompass/datasets/ds1000.py opencompass/datasets/ds1000_interpreter.py opencompass/datasets/eprstmt.py opencompass/datasets/flores.py opencompass/datasets/game24.py opencompass/datasets/govrepcrs.py opencompass/datasets/gpqa.py opencompass/datasets/gsm8k.py opencompass/datasets/gsm_hard.py opencompass/datasets/hellaswag.py opencompass/datasets/huggingface.py opencompass/datasets/humaneval.py opencompass/datasets/humaneval_multi.py opencompass/datasets/humanevalx.py opencompass/datasets/hungarian_math.py opencompass/datasets/iwslt2017.py opencompass/datasets/jigsawmultilingual.py opencompass/datasets/jsonl.py opencompass/datasets/kaoshi.py opencompass/datasets/lambada.py opencompass/datasets/lcsts.py opencompass/datasets/lmeval.py opencompass/datasets/mastermath2024v1.py opencompass/datasets/math.py opencompass/datasets/math401.py opencompass/datasets/math_intern.py opencompass/datasets/mathbench.py opencompass/datasets/mbpp.py opencompass/datasets/mmlu.py opencompass/datasets/multirc.py opencompass/datasets/narrativeqa.py opencompass/datasets/natural_question.py opencompass/datasets/natural_question_cn.py opencompass/datasets/obqa.py opencompass/datasets/piqa.py opencompass/datasets/py150.py opencompass/datasets/qasper.py opencompass/datasets/qaspercut.py opencompass/datasets/race.py opencompass/datasets/realtoxicprompts.py opencompass/datasets/record.py opencompass/datasets/rolebench.py opencompass/datasets/safety.py opencompass/datasets/scibench.py opencompass/datasets/siqa.py opencompass/datasets/squad20.py opencompass/datasets/storycloze.py opencompass/datasets/strategyqa.py opencompass/datasets/summedits.py opencompass/datasets/summscreen.py opencompass/datasets/svamp.py opencompass/datasets/tabmwp.py opencompass/datasets/tnews.py opencompass/datasets/triviaqa.py opencompass/datasets/triviaqarc.py opencompass/datasets/truthfulqa.py opencompass/datasets/tydiqa.py opencompass/datasets/wic.py opencompass/datasets/wikibench.py opencompass/datasets/winograd.py opencompass/datasets/winogrande.py opencompass/datasets/wnli.py opencompass/datasets/wsc.py opencompass/datasets/xcopa.py opencompass/datasets/xiezhi.py opencompass/datasets/xlsum.py opencompass/datasets/xsum.py opencompass/datasets/NPHardEval/__init__.py opencompass/datasets/NPHardEval/cmp_GCP_D.py opencompass/datasets/NPHardEval/cmp_KSP.py opencompass/datasets/NPHardEval/cmp_TSP_D.py opencompass/datasets/NPHardEval/hard_GCP.py opencompass/datasets/NPHardEval/hard_MSP.py opencompass/datasets/NPHardEval/hard_TSP.py opencompass/datasets/NPHardEval/p_BSP.py opencompass/datasets/NPHardEval/p_EDP.py opencompass/datasets/NPHardEval/p_SPP.py opencompass/datasets/NPHardEval/prompts.py opencompass/datasets/NPHardEval/utils.py opencompass/datasets/agieval/__init__.py opencompass/datasets/agieval/agieval.py opencompass/datasets/agieval/constructions.py opencompass/datasets/agieval/dataset_loader.py opencompass/datasets/agieval/evaluation.py opencompass/datasets/agieval/math_equivalence.py opencompass/datasets/agieval/post_process.py opencompass/datasets/agieval/utils.py opencompass/datasets/infinitebench/__init__.py opencompass/datasets/infinitebench/infinitebench_codedebug.py opencompass/datasets/infinitebench/infinitebench_coderun.py opencompass/datasets/infinitebench/infinitebench_endia.py opencompass/datasets/infinitebench/infinitebench_enmc.py opencompass/datasets/infinitebench/infinitebench_enqa.py opencompass/datasets/infinitebench/infinitebench_ensum.py opencompass/datasets/infinitebench/infinitebench_mathcalc.py opencompass/datasets/infinitebench/infinitebench_mathfind.py opencompass/datasets/infinitebench/infinitebench_retrievekv.py opencompass/datasets/infinitebench/infinitebench_retrievenumber.py opencompass/datasets/infinitebench/infinitebench_retrievepasskey.py opencompass/datasets/infinitebench/infinitebench_zhqa.py opencompass/datasets/infinitebench/utils.py opencompass/datasets/lawbench/__init__.py opencompass/datasets/lawbench/lawbench.py opencompass/datasets/leval/__init__.py opencompass/datasets/leval/evaluators.py opencompass/datasets/leval/leval_coursera.py opencompass/datasets/leval/leval_financial_qa.py opencompass/datasets/leval/leval_gov_report_summ.py opencompass/datasets/leval/leval_gsm100.py opencompass/datasets/leval/leval_legal_contract_qa.py opencompass/datasets/leval/leval_meeting_summ.py opencompass/datasets/leval/leval_multidoc_qa.py opencompass/datasets/leval/leval_narrattive_qa.py opencompass/datasets/leval/leval_natural_question.py opencompass/datasets/leval/leval_news_summ.py opencompass/datasets/leval/leval_paper_assistant.py opencompass/datasets/leval/leval_patent_summ.py opencompass/datasets/leval/leval_quality.py opencompass/datasets/leval/leval_review_summ.py opencompass/datasets/leval/leval_scientific_qa.py opencompass/datasets/leval/leval_topic_retrieval.py opencompass/datasets/leval/leval_tpo.py opencompass/datasets/leval/leval_tvshow_summ.py opencompass/datasets/longbench/__init__.py opencompass/datasets/longbench/evaluators.py opencompass/datasets/longbench/longbench_2wikim_qa.py opencompass/datasets/longbench/longbench_dureader.py opencompass/datasets/longbench/longbench_gov_report.py opencompass/datasets/longbench/longbench_hotpot_qa.py opencompass/datasets/longbench/longbench_lcc.py opencompass/datasets/longbench/longbench_lsht.py opencompass/datasets/longbench/longbench_multi_news.py opencompass/datasets/longbench/longbench_multifieldqa_en.py opencompass/datasets/longbench/longbench_multifieldqa_zh.py opencompass/datasets/longbench/longbench_musique.py opencompass/datasets/longbench/longbench_narrative_qa.py opencompass/datasets/longbench/longbench_passage_count.py opencompass/datasets/longbench/longbench_passage_retrieval_en.py opencompass/datasets/longbench/longbench_passage_retrieval_zh.py opencompass/datasets/longbench/longbench_qasper.py opencompass/datasets/longbench/longbench_qmsum.py opencompass/datasets/longbench/longbench_repobench.py opencompass/datasets/longbench/longbench_samsum.py opencompass/datasets/longbench/longbench_trec.py opencompass/datasets/longbench/longbench_trivia_qa.py opencompass/datasets/longbench/longbench_vcsum.py opencompass/datasets/lveval/__init__.py opencompass/datasets/lveval/evaluators.py opencompass/datasets/lveval/lveval_cmrc_mixup.py opencompass/datasets/lveval/lveval_dureader_mixup.py opencompass/datasets/lveval/lveval_factrecall_en.py opencompass/datasets/lveval/lveval_factrecall_zh.py opencompass/datasets/lveval/lveval_hotpotwikiqa_mixup.py opencompass/datasets/lveval/lveval_lic_mixup.py opencompass/datasets/lveval/lveval_loogle_CR_mixup.py opencompass/datasets/lveval/lveval_loogle_MIR_mixup.py opencompass/datasets/lveval/lveval_loogle_SD_mixup.py opencompass/datasets/lveval/lveval_multifieldqa_en_mixup.py opencompass/datasets/lveval/lveval_multifieldqa_zh_mixup.py opencompass/datasets/medbench/__init__.py opencompass/datasets/medbench/constructions.py opencompass/datasets/medbench/dataset_loader.py opencompass/datasets/medbench/evaluation.py opencompass/datasets/medbench/math_equivalence.py opencompass/datasets/medbench/medbench.py opencompass/datasets/medbench/post_process.py opencompass/datasets/medbench/utils.py opencompass/datasets/reasonbench/ReasonBenchDataset.py opencompass/datasets/reasonbench/__init__.py opencompass/datasets/subjective/__init__.py opencompass/datasets/subjective/alignbench.py opencompass/datasets/subjective/compass_arena.py opencompass/datasets/subjective/corev2.py opencompass/datasets/subjective/creationbench.py opencompass/datasets/subjective/information_retrival.py opencompass/datasets/subjective/mtbench.py opencompass/datasets/subjective/multiround.py opencompass/datasets/subjective/subjective_cmp.py opencompass/datasets/teval/__init__.py opencompass/datasets/teval/schema.py opencompass/datasets/teval/evaluators/__init__.py opencompass/datasets/teval/evaluators/instruct_evaluator.py opencompass/datasets/teval/evaluators/planning_evaluator.py opencompass/datasets/teval/evaluators/reason_retrieve_understand_evaluator.py opencompass/datasets/teval/evaluators/review_evaluator.py opencompass/datasets/teval/utils/__init__.py opencompass/datasets/teval/utils/convert_results.py opencompass/datasets/teval/utils/format_load.py opencompass/datasets/teval/utils/meta_template.py opencompass/datasets/teval/utils/template.py opencompass/metrics/__init__.py opencompass/metrics/dump_results.py opencompass/metrics/mme_score.py opencompass/metrics/seedbench.py opencompass/models/__init__.py opencompass/models/accessory.py opencompass/models/ai360_api.py opencompass/models/alaya.py opencompass/models/baichuan_api.py opencompass/models/baidu_api.py opencompass/models/base.py opencompass/models/base_api.py opencompass/models/bytedance_api.py opencompass/models/gemini_api.py opencompass/models/glm.py opencompass/models/huggingface.py opencompass/models/intern_model.py opencompass/models/krgpt_api.py opencompass/models/lagent.py opencompass/models/langchain.py opencompass/models/lightllm_api.py opencompass/models/llama2.py opencompass/models/lmdeploy_pytorch.py opencompass/models/minimax_api.py opencompass/models/mixtral.py opencompass/models/modelscope.py opencompass/models/moonshot_api.py opencompass/models/nanbeige_api.py opencompass/models/openai_api.py opencompass/models/pangu_api.py opencompass/models/qwen_api.py opencompass/models/sensetime_api.py opencompass/models/turbomind.py opencompass/models/turbomind_api.py opencompass/models/turbomind_tis.py opencompass/models/vllm.py opencompass/models/xunfei_api.py opencompass/models/zhipuai_api.py opencompass/models/zhipuai_v2_api.py opencompass/models/claude_api/__init__.py opencompass/models/claude_api/claude_api.py opencompass/models/claude_api/postprocessors.py opencompass/openicl/__init__.py opencompass/openicl/icl_dataset_reader.py opencompass/openicl/icl_prompt_template.py opencompass/openicl/icl_evaluator/__init__.py opencompass/openicl/icl_evaluator/icl_agent_evaluator.py opencompass/openicl/icl_evaluator/icl_aucroc_evaluator.py opencompass/openicl/icl_evaluator/icl_base_evaluator.py opencompass/openicl/icl_evaluator/icl_circular_evaluator.py opencompass/openicl/icl_evaluator/icl_em_evaluator.py opencompass/openicl/icl_evaluator/icl_hf_evaluator.py opencompass/openicl/icl_evaluator/icl_jieba_rouge_evaluator.py opencompass/openicl/icl_evaluator/icl_misc_evaluator.py opencompass/openicl/icl_evaluator/icl_plugin_evaluator.py opencompass/openicl/icl_evaluator/icl_toxic_evaluator.py opencompass/openicl/icl_evaluator/lm_evaluator.py opencompass/openicl/icl_inferencer/__init__.py opencompass/openicl/icl_inferencer/icl_agent_inferencer.py opencompass/openicl/icl_inferencer/icl_attack_inferencer.py opencompass/openicl/icl_inferencer/icl_base_inferencer.py opencompass/openicl/icl_inferencer/icl_chat_inferencer.py opencompass/openicl/icl_inferencer/icl_clp_inferencer.py opencompass/openicl/icl_inferencer/icl_gen_inferencer.py opencompass/openicl/icl_inferencer/icl_ll_inferencer.py opencompass/openicl/icl_inferencer/icl_mink_percent_inferencer.py opencompass/openicl/icl_inferencer/icl_ppl_inferencer.py opencompass/openicl/icl_inferencer/icl_ppl_only_inferencer.py opencompass/openicl/icl_inferencer/icl_sc_inferencer.py opencompass/openicl/icl_inferencer/icl_tot_inferencer.py opencompass/openicl/icl_retriever/__init__.py opencompass/openicl/icl_retriever/icl_base_retriever.py opencompass/openicl/icl_retriever/icl_bm25_retriever.py opencompass/openicl/icl_retriever/icl_dpp_retriever.py opencompass/openicl/icl_retriever/icl_fix_k_retriever.py opencompass/openicl/icl_retriever/icl_mdl_retriever.py opencompass/openicl/icl_retriever/icl_random_retriever.py opencompass/openicl/icl_retriever/icl_topk_retriever.py opencompass/openicl/icl_retriever/icl_votek_retriever.py opencompass/openicl/icl_retriever/icl_zero_retriever.py opencompass/openicl/utils/__init__.py opencompass/openicl/utils/logging.py opencompass/partitioners/__init__.py opencompass/partitioners/base.py opencompass/partitioners/mm_naive.py opencompass/partitioners/naive.py opencompass/partitioners/num_worker.py opencompass/partitioners/size.py opencompass/partitioners/sub_naive.py opencompass/partitioners/sub_size.py opencompass/runners/__init__.py opencompass/runners/base.py opencompass/runners/dlc.py opencompass/runners/local.py opencompass/runners/local_api.py opencompass/runners/slurm.py opencompass/runners/slurm_sequential.py opencompass/summarizers/__init__.py opencompass/summarizers/circular.py opencompass/summarizers/default.py opencompass/summarizers/multi_model.py opencompass/summarizers/needlebench.py opencompass/summarizers/summarizer_pretrain.py opencompass/summarizers/subjective/__init__.py opencompass/summarizers/subjective/alignmentbench.py opencompass/summarizers/subjective/alpacaeval.py opencompass/summarizers/subjective/compass_arena.py opencompass/summarizers/subjective/corev2.py opencompass/summarizers/subjective/creationbench.py opencompass/summarizers/subjective/information_retrival.py opencompass/summarizers/subjective/mtbench.py opencompass/summarizers/subjective/multiround.py opencompass/summarizers/subjective/subjective_post_process.py opencompass/summarizers/subjective/utils.py opencompass/tasks/__init__.py opencompass/tasks/base.py opencompass/tasks/llm_eval.py opencompass/tasks/mm_infer.py opencompass/tasks/openicl_attack.py opencompass/tasks/openicl_eval.py opencompass/tasks/openicl_infer.py opencompass/tasks/subjective_eval.py opencompass/utils/__init__.py opencompass/utils/abbr.py opencompass/utils/auxiliary.py opencompass/utils/build.py opencompass/utils/collect_env.py opencompass/utils/dependency.py opencompass/utils/file.py opencompass/utils/fileio.py opencompass/utils/lark.py opencompass/utils/logging.py opencompass/utils/menu.py opencompass/utils/prompt.py opencompass/utils/run.py opencompass/utils/text_postprocessors.py opencompass/utils/types.py