|
LICENSE |
|
README.md |
|
setup.py |
|
opencompass/__init__.py |
|
opencompass/registry.py |
|
opencompass.egg-info/PKG-INFO |
|
opencompass.egg-info/SOURCES.txt |
|
opencompass.egg-info/dependency_links.txt |
|
opencompass.egg-info/requires.txt |
|
opencompass.egg-info/top_level.txt |
|
opencompass/datasets/FinanceIQ.py |
|
opencompass/datasets/GaokaoBench.py |
|
opencompass/datasets/OpenFinData.py |
|
opencompass/datasets/TheoremQA.py |
|
opencompass/datasets/__init__.py |
|
opencompass/datasets/advglue.py |
|
opencompass/datasets/afqmcd.py |
|
opencompass/datasets/anli.py |
|
opencompass/datasets/anthropics_evals.py |
|
opencompass/datasets/arc.py |
|
opencompass/datasets/ax.py |
|
opencompass/datasets/base.py |
|
opencompass/datasets/bbh.py |
|
opencompass/datasets/boolq.py |
|
opencompass/datasets/bustum.py |
|
opencompass/datasets/c3.py |
|
opencompass/datasets/cb.py |
|
opencompass/datasets/ceval.py |
|
opencompass/datasets/chid.py |
|
opencompass/datasets/cibench.py |
|
opencompass/datasets/circular.py |
|
opencompass/datasets/civilcomments.py |
|
opencompass/datasets/clozeTest_maxmin.py |
|
opencompass/datasets/cluewsc.py |
|
opencompass/datasets/cmb.py |
|
opencompass/datasets/cmmlu.py |
|
opencompass/datasets/cmnli.py |
|
opencompass/datasets/cmrc.py |
|
opencompass/datasets/commonsenseqa.py |
|
opencompass/datasets/commonsenseqa_cn.py |
|
opencompass/datasets/copa.py |
|
opencompass/datasets/crowspairs.py |
|
opencompass/datasets/crowspairs_cn.py |
|
opencompass/datasets/csl.py |
|
opencompass/datasets/custom.py |
|
opencompass/datasets/cvalues.py |
|
opencompass/datasets/drcd.py |
|
opencompass/datasets/drop.py |
|
opencompass/datasets/ds1000.py |
|
opencompass/datasets/ds1000_interpreter.py |
|
opencompass/datasets/eprstmt.py |
|
opencompass/datasets/flores.py |
|
opencompass/datasets/game24.py |
|
opencompass/datasets/govrepcrs.py |
|
opencompass/datasets/gpqa.py |
|
opencompass/datasets/gsm8k.py |
|
opencompass/datasets/gsm_hard.py |
|
opencompass/datasets/hellaswag.py |
|
opencompass/datasets/huggingface.py |
|
opencompass/datasets/humaneval.py |
|
opencompass/datasets/humaneval_multi.py |
|
opencompass/datasets/humanevalx.py |
|
opencompass/datasets/hungarian_math.py |
|
opencompass/datasets/iwslt2017.py |
|
opencompass/datasets/jigsawmultilingual.py |
|
opencompass/datasets/jsonl.py |
|
opencompass/datasets/kaoshi.py |
|
opencompass/datasets/lambada.py |
|
opencompass/datasets/lcsts.py |
|
opencompass/datasets/lmeval.py |
|
opencompass/datasets/mastermath2024v1.py |
|
opencompass/datasets/math.py |
|
opencompass/datasets/math401.py |
|
opencompass/datasets/math_intern.py |
|
opencompass/datasets/mathbench.py |
|
opencompass/datasets/mbpp.py |
|
opencompass/datasets/mmlu.py |
|
opencompass/datasets/multirc.py |
|
opencompass/datasets/narrativeqa.py |
|
opencompass/datasets/natural_question.py |
|
opencompass/datasets/natural_question_cn.py |
|
opencompass/datasets/obqa.py |
|
opencompass/datasets/piqa.py |
|
opencompass/datasets/py150.py |
|
opencompass/datasets/qasper.py |
|
opencompass/datasets/qaspercut.py |
|
opencompass/datasets/race.py |
|
opencompass/datasets/realtoxicprompts.py |
|
opencompass/datasets/record.py |
|
opencompass/datasets/rolebench.py |
|
opencompass/datasets/safety.py |
|
opencompass/datasets/scibench.py |
|
opencompass/datasets/siqa.py |
|
opencompass/datasets/squad20.py |
|
opencompass/datasets/storycloze.py |
|
opencompass/datasets/strategyqa.py |
|
opencompass/datasets/summedits.py |
|
opencompass/datasets/summscreen.py |
|
opencompass/datasets/svamp.py |
|
opencompass/datasets/tabmwp.py |
|
opencompass/datasets/tnews.py |
|
opencompass/datasets/triviaqa.py |
|
opencompass/datasets/triviaqarc.py |
|
opencompass/datasets/truthfulqa.py |
|
opencompass/datasets/tydiqa.py |
|
opencompass/datasets/wic.py |
|
opencompass/datasets/wikibench.py |
|
opencompass/datasets/winograd.py |
|
opencompass/datasets/winogrande.py |
|
opencompass/datasets/wnli.py |
|
opencompass/datasets/wsc.py |
|
opencompass/datasets/xcopa.py |
|
opencompass/datasets/xiezhi.py |
|
opencompass/datasets/xlsum.py |
|
opencompass/datasets/xsum.py |
|
opencompass/datasets/NPHardEval/__init__.py |
|
opencompass/datasets/NPHardEval/cmp_GCP_D.py |
|
opencompass/datasets/NPHardEval/cmp_KSP.py |
|
opencompass/datasets/NPHardEval/cmp_TSP_D.py |
|
opencompass/datasets/NPHardEval/hard_GCP.py |
|
opencompass/datasets/NPHardEval/hard_MSP.py |
|
opencompass/datasets/NPHardEval/hard_TSP.py |
|
opencompass/datasets/NPHardEval/p_BSP.py |
|
opencompass/datasets/NPHardEval/p_EDP.py |
|
opencompass/datasets/NPHardEval/p_SPP.py |
|
opencompass/datasets/NPHardEval/prompts.py |
|
opencompass/datasets/NPHardEval/utils.py |
|
opencompass/datasets/agieval/__init__.py |
|
opencompass/datasets/agieval/agieval.py |
|
opencompass/datasets/agieval/constructions.py |
|
opencompass/datasets/agieval/dataset_loader.py |
|
opencompass/datasets/agieval/evaluation.py |
|
opencompass/datasets/agieval/math_equivalence.py |
|
opencompass/datasets/agieval/post_process.py |
|
opencompass/datasets/agieval/utils.py |
|
opencompass/datasets/infinitebench/__init__.py |
|
opencompass/datasets/infinitebench/infinitebench_codedebug.py |
|
opencompass/datasets/infinitebench/infinitebench_coderun.py |
|
opencompass/datasets/infinitebench/infinitebench_endia.py |
|
opencompass/datasets/infinitebench/infinitebench_enmc.py |
|
opencompass/datasets/infinitebench/infinitebench_enqa.py |
|
opencompass/datasets/infinitebench/infinitebench_ensum.py |
|
opencompass/datasets/infinitebench/infinitebench_mathcalc.py |
|
opencompass/datasets/infinitebench/infinitebench_mathfind.py |
|
opencompass/datasets/infinitebench/infinitebench_retrievekv.py |
|
opencompass/datasets/infinitebench/infinitebench_retrievenumber.py |
|
opencompass/datasets/infinitebench/infinitebench_retrievepasskey.py |
|
opencompass/datasets/infinitebench/infinitebench_zhqa.py |
|
opencompass/datasets/infinitebench/utils.py |
|
opencompass/datasets/lawbench/__init__.py |
|
opencompass/datasets/lawbench/lawbench.py |
|
opencompass/datasets/leval/__init__.py |
|
opencompass/datasets/leval/evaluators.py |
|
opencompass/datasets/leval/leval_coursera.py |
|
opencompass/datasets/leval/leval_financial_qa.py |
|
opencompass/datasets/leval/leval_gov_report_summ.py |
|
opencompass/datasets/leval/leval_gsm100.py |
|
opencompass/datasets/leval/leval_legal_contract_qa.py |
|
opencompass/datasets/leval/leval_meeting_summ.py |
|
opencompass/datasets/leval/leval_multidoc_qa.py |
|
opencompass/datasets/leval/leval_narrattive_qa.py |
|
opencompass/datasets/leval/leval_natural_question.py |
|
opencompass/datasets/leval/leval_news_summ.py |
|
opencompass/datasets/leval/leval_paper_assistant.py |
|
opencompass/datasets/leval/leval_patent_summ.py |
|
opencompass/datasets/leval/leval_quality.py |
|
opencompass/datasets/leval/leval_review_summ.py |
|
opencompass/datasets/leval/leval_scientific_qa.py |
|
opencompass/datasets/leval/leval_topic_retrieval.py |
|
opencompass/datasets/leval/leval_tpo.py |
|
opencompass/datasets/leval/leval_tvshow_summ.py |
|
opencompass/datasets/longbench/__init__.py |
|
opencompass/datasets/longbench/evaluators.py |
|
opencompass/datasets/longbench/longbench_2wikim_qa.py |
|
opencompass/datasets/longbench/longbench_dureader.py |
|
opencompass/datasets/longbench/longbench_gov_report.py |
|
opencompass/datasets/longbench/longbench_hotpot_qa.py |
|
opencompass/datasets/longbench/longbench_lcc.py |
|
opencompass/datasets/longbench/longbench_lsht.py |
|
opencompass/datasets/longbench/longbench_multi_news.py |
|
opencompass/datasets/longbench/longbench_multifieldqa_en.py |
|
opencompass/datasets/longbench/longbench_multifieldqa_zh.py |
|
opencompass/datasets/longbench/longbench_musique.py |
|
opencompass/datasets/longbench/longbench_narrative_qa.py |
|
opencompass/datasets/longbench/longbench_passage_count.py |
|
opencompass/datasets/longbench/longbench_passage_retrieval_en.py |
|
opencompass/datasets/longbench/longbench_passage_retrieval_zh.py |
|
opencompass/datasets/longbench/longbench_qasper.py |
|
opencompass/datasets/longbench/longbench_qmsum.py |
|
opencompass/datasets/longbench/longbench_repobench.py |
|
opencompass/datasets/longbench/longbench_samsum.py |
|
opencompass/datasets/longbench/longbench_trec.py |
|
opencompass/datasets/longbench/longbench_trivia_qa.py |
|
opencompass/datasets/longbench/longbench_vcsum.py |
|
opencompass/datasets/lveval/__init__.py |
|
opencompass/datasets/lveval/evaluators.py |
|
opencompass/datasets/lveval/lveval_cmrc_mixup.py |
|
opencompass/datasets/lveval/lveval_dureader_mixup.py |
|
opencompass/datasets/lveval/lveval_factrecall_en.py |
|
opencompass/datasets/lveval/lveval_factrecall_zh.py |
|
opencompass/datasets/lveval/lveval_hotpotwikiqa_mixup.py |
|
opencompass/datasets/lveval/lveval_lic_mixup.py |
|
opencompass/datasets/lveval/lveval_loogle_CR_mixup.py |
|
opencompass/datasets/lveval/lveval_loogle_MIR_mixup.py |
|
opencompass/datasets/lveval/lveval_loogle_SD_mixup.py |
|
opencompass/datasets/lveval/lveval_multifieldqa_en_mixup.py |
|
opencompass/datasets/lveval/lveval_multifieldqa_zh_mixup.py |
|
opencompass/datasets/medbench/__init__.py |
|
opencompass/datasets/medbench/constructions.py |
|
opencompass/datasets/medbench/dataset_loader.py |
|
opencompass/datasets/medbench/evaluation.py |
|
opencompass/datasets/medbench/math_equivalence.py |
|
opencompass/datasets/medbench/medbench.py |
|
opencompass/datasets/medbench/post_process.py |
|
opencompass/datasets/medbench/utils.py |
|
opencompass/datasets/reasonbench/ReasonBenchDataset.py |
|
opencompass/datasets/reasonbench/__init__.py |
|
opencompass/datasets/subjective/__init__.py |
|
opencompass/datasets/subjective/alignbench.py |
|
opencompass/datasets/subjective/compass_arena.py |
|
opencompass/datasets/subjective/corev2.py |
|
opencompass/datasets/subjective/creationbench.py |
|
opencompass/datasets/subjective/information_retrival.py |
|
opencompass/datasets/subjective/mtbench.py |
|
opencompass/datasets/subjective/multiround.py |
|
opencompass/datasets/subjective/subjective_cmp.py |
|
opencompass/datasets/teval/__init__.py |
|
opencompass/datasets/teval/schema.py |
|
opencompass/datasets/teval/evaluators/__init__.py |
|
opencompass/datasets/teval/evaluators/instruct_evaluator.py |
|
opencompass/datasets/teval/evaluators/planning_evaluator.py |
|
opencompass/datasets/teval/evaluators/reason_retrieve_understand_evaluator.py |
|
opencompass/datasets/teval/evaluators/review_evaluator.py |
|
opencompass/datasets/teval/utils/__init__.py |
|
opencompass/datasets/teval/utils/convert_results.py |
|
opencompass/datasets/teval/utils/format_load.py |
|
opencompass/datasets/teval/utils/meta_template.py |
|
opencompass/datasets/teval/utils/template.py |
|
opencompass/metrics/__init__.py |
|
opencompass/metrics/dump_results.py |
|
opencompass/metrics/mme_score.py |
|
opencompass/metrics/seedbench.py |
|
opencompass/models/__init__.py |
|
opencompass/models/accessory.py |
|
opencompass/models/ai360_api.py |
|
opencompass/models/alaya.py |
|
opencompass/models/baichuan_api.py |
|
opencompass/models/baidu_api.py |
|
opencompass/models/base.py |
|
opencompass/models/base_api.py |
|
opencompass/models/bytedance_api.py |
|
opencompass/models/gemini_api.py |
|
opencompass/models/glm.py |
|
opencompass/models/huggingface.py |
|
opencompass/models/intern_model.py |
|
opencompass/models/krgpt_api.py |
|
opencompass/models/lagent.py |
|
opencompass/models/langchain.py |
|
opencompass/models/lightllm_api.py |
|
opencompass/models/llama2.py |
|
opencompass/models/lmdeploy_pytorch.py |
|
opencompass/models/minimax_api.py |
|
opencompass/models/mixtral.py |
|
opencompass/models/modelscope.py |
|
opencompass/models/moonshot_api.py |
|
opencompass/models/nanbeige_api.py |
|
opencompass/models/openai_api.py |
|
opencompass/models/pangu_api.py |
|
opencompass/models/qwen_api.py |
|
opencompass/models/sensetime_api.py |
|
opencompass/models/turbomind.py |
|
opencompass/models/turbomind_api.py |
|
opencompass/models/turbomind_tis.py |
|
opencompass/models/vllm.py |
|
opencompass/models/xunfei_api.py |
|
opencompass/models/zhipuai_api.py |
|
opencompass/models/zhipuai_v2_api.py |
|
opencompass/models/claude_api/__init__.py |
|
opencompass/models/claude_api/claude_api.py |
|
opencompass/models/claude_api/postprocessors.py |
|
opencompass/openicl/__init__.py |
|
opencompass/openicl/icl_dataset_reader.py |
|
opencompass/openicl/icl_prompt_template.py |
|
opencompass/openicl/icl_evaluator/__init__.py |
|
opencompass/openicl/icl_evaluator/icl_agent_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_aucroc_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_base_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_circular_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_em_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_hf_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_jieba_rouge_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_misc_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_plugin_evaluator.py |
|
opencompass/openicl/icl_evaluator/icl_toxic_evaluator.py |
|
opencompass/openicl/icl_evaluator/lm_evaluator.py |
|
opencompass/openicl/icl_inferencer/__init__.py |
|
opencompass/openicl/icl_inferencer/icl_agent_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_attack_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_base_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_chat_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_clp_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_gen_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_ll_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_mink_percent_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_ppl_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_ppl_only_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_sc_inferencer.py |
|
opencompass/openicl/icl_inferencer/icl_tot_inferencer.py |
|
opencompass/openicl/icl_retriever/__init__.py |
|
opencompass/openicl/icl_retriever/icl_base_retriever.py |
|
opencompass/openicl/icl_retriever/icl_bm25_retriever.py |
|
opencompass/openicl/icl_retriever/icl_dpp_retriever.py |
|
opencompass/openicl/icl_retriever/icl_fix_k_retriever.py |
|
opencompass/openicl/icl_retriever/icl_mdl_retriever.py |
|
opencompass/openicl/icl_retriever/icl_random_retriever.py |
|
opencompass/openicl/icl_retriever/icl_topk_retriever.py |
|
opencompass/openicl/icl_retriever/icl_votek_retriever.py |
|
opencompass/openicl/icl_retriever/icl_zero_retriever.py |
|
opencompass/openicl/utils/__init__.py |
|
opencompass/openicl/utils/logging.py |
|
opencompass/partitioners/__init__.py |
|
opencompass/partitioners/base.py |
|
opencompass/partitioners/mm_naive.py |
|
opencompass/partitioners/naive.py |
|
opencompass/partitioners/num_worker.py |
|
opencompass/partitioners/size.py |
|
opencompass/partitioners/sub_naive.py |
|
opencompass/partitioners/sub_size.py |
|
opencompass/runners/__init__.py |
|
opencompass/runners/base.py |
|
opencompass/runners/dlc.py |
|
opencompass/runners/local.py |
|
opencompass/runners/local_api.py |
|
opencompass/runners/slurm.py |
|
opencompass/runners/slurm_sequential.py |
|
opencompass/summarizers/__init__.py |
|
opencompass/summarizers/circular.py |
|
opencompass/summarizers/default.py |
|
opencompass/summarizers/multi_model.py |
|
opencompass/summarizers/needlebench.py |
|
opencompass/summarizers/summarizer_pretrain.py |
|
opencompass/summarizers/subjective/__init__.py |
|
opencompass/summarizers/subjective/alignmentbench.py |
|
opencompass/summarizers/subjective/alpacaeval.py |
|
opencompass/summarizers/subjective/compass_arena.py |
|
opencompass/summarizers/subjective/corev2.py |
|
opencompass/summarizers/subjective/creationbench.py |
|
opencompass/summarizers/subjective/information_retrival.py |
|
opencompass/summarizers/subjective/mtbench.py |
|
opencompass/summarizers/subjective/multiround.py |
|
opencompass/summarizers/subjective/subjective_post_process.py |
|
opencompass/summarizers/subjective/utils.py |
|
opencompass/tasks/__init__.py |
|
opencompass/tasks/base.py |
|
opencompass/tasks/llm_eval.py |
|
opencompass/tasks/mm_infer.py |
|
opencompass/tasks/openicl_attack.py |
|
opencompass/tasks/openicl_eval.py |
|
opencompass/tasks/openicl_infer.py |
|
opencompass/tasks/subjective_eval.py |
|
opencompass/utils/__init__.py |
|
opencompass/utils/abbr.py |
|
opencompass/utils/auxiliary.py |
|
opencompass/utils/build.py |
|
opencompass/utils/collect_env.py |
|
opencompass/utils/dependency.py |
|
opencompass/utils/file.py |
|
opencompass/utils/fileio.py |
|
opencompass/utils/lark.py |
|
opencompass/utils/logging.py |
|
opencompass/utils/menu.py |
|
opencompass/utils/prompt.py |
|
opencompass/utils/run.py |
|
opencompass/utils/text_postprocessors.py |
|
opencompass/utils/types.py |