README.md
ms_opencompass.egg-info/PKG-INFO
ms_opencompass.egg-info/SOURCES.txt
ms_opencompass.egg-info/dependency_links.txt
ms_opencompass.egg-info/entry_points.txt
ms_opencompass.egg-info/requires.txt
ms_opencompass.egg-info/top_level.txt
opencompass/__init__.py
opencompass/registry.py
opencompass/cli/__init__.py
opencompass/cli/arguments.py
opencompass/cli/main.py
opencompass/configs/__init__.py
opencompass/configs/eval_PMMEval.py
opencompass/configs/eval_TheoremQA.py
opencompass/configs/eval_academic_leaderboard_202407.py
opencompass/configs/eval_alaya.py
opencompass/configs/eval_api_demo.py
opencompass/configs/eval_attack.py
opencompass/configs/eval_babilong.py
opencompass/configs/eval_base_demo.py
opencompass/configs/eval_bluelm_32k_lveval.py
opencompass/configs/eval_charm_mem.py
opencompass/configs/eval_charm_rea.py
opencompass/configs/eval_chat_agent.py
opencompass/configs/eval_chat_agent_baseline.py
opencompass/configs/eval_chat_demo.py
opencompass/configs/eval_chat_last.py
opencompass/configs/eval_chembench.py
opencompass/configs/eval_cibench.py
opencompass/configs/eval_cibench_api.py
opencompass/configs/eval_circular.py
opencompass/configs/eval_claude.py
opencompass/configs/eval_code_passk.py
opencompass/configs/eval_code_passk_repeat_dataset.py
opencompass/configs/eval_codeagent.py
opencompass/configs/eval_codegeex2.py
opencompass/configs/eval_compassarena_subjectivebench.py
opencompass/configs/eval_contamination.py
opencompass/configs/eval_corebench_2409_base_objective.py
opencompass/configs/eval_corebench_2409_chat_objective.py
opencompass/configs/eval_corebench_2409_longcontext.py
opencompass/configs/eval_corebench_2409_subjective.py
opencompass/configs/eval_demo.py
opencompass/configs/eval_dingo.py
opencompass/configs/eval_ds1000_interpreter.py
opencompass/configs/eval_edgellm_demo.py
opencompass/configs/eval_gpt3.5.py
opencompass/configs/eval_gpt4.py
opencompass/configs/eval_hellobench.py
opencompass/configs/eval_hf_llama2.py
opencompass/configs/eval_hf_llama_7b.py
opencompass/configs/eval_inference_ppl.py
opencompass/configs/eval_internLM.py
opencompass/configs/eval_internlm2_chat_keyset.py
opencompass/configs/eval_internlm2_keyset.py
opencompass/configs/eval_internlm_7b.py
opencompass/configs/eval_internlm_chat_lmdeploy_apiserver.py
opencompass/configs/eval_internlm_chat_turbomind.py
opencompass/configs/eval_internlm_flames_chat.py
opencompass/configs/eval_internlm_lmdeploy_apiserver.py
opencompass/configs/eval_internlm_math_chat.py
opencompass/configs/eval_internlm_turbomind.py
opencompass/configs/eval_judgerbench.py
opencompass/configs/eval_korbench.py
opencompass/configs/eval_lightllm.py
opencompass/configs/eval_llama2_7b.py
opencompass/configs/eval_llama2_7b_lveval.py
opencompass/configs/eval_llama3_instruct.py
opencompass/configs/eval_llm_compression.py
opencompass/configs/eval_lmdeploy_demo.py
opencompass/configs/eval_math_llm_judge.py
opencompass/configs/eval_math_llm_judge_internal.py
opencompass/configs/eval_mathbench.py
opencompass/configs/eval_mmlu_pro.py
opencompass/configs/eval_mmlu_with_zero_retriever_overwritten.py
opencompass/configs/eval_modelscope_datasets.py
opencompass/configs/eval_multi_prompt_demo.py
opencompass/configs/eval_musr.py
opencompass/configs/eval_needlebench.py
opencompass/configs/eval_openai_format_task.py
opencompass/configs/eval_openai_format_task_teval_v2.py
opencompass/configs/eval_openai_format_task_teval_v2_qwen.py
opencompass/configs/eval_qwen_7b.py
opencompass/configs/eval_qwen_7b_chat.py
opencompass/configs/eval_qwen_7b_chat_lawbench.py
opencompass/configs/eval_ruler.py
opencompass/configs/eval_ruler_fix_tokenizer.py
opencompass/configs/eval_rwkv5_3b.py
opencompass/configs/eval_simpleqa.py
opencompass/configs/eval_subjective.py
opencompass/configs/eval_subjective_alpacaeval_official.py
opencompass/configs/eval_teval.py
opencompass/configs/eval_teval_v2.py
opencompass/configs/eval_with_model_dataset_combinations.py
opencompass/configs/datasets/__init__.py
opencompass/configs/datasets/ARC_c/ARC_c_clean_ppl.py
opencompass/configs/datasets/ARC_c/ARC_c_cot_gen_926652.py
opencompass/configs/datasets/ARC_c/ARC_c_few_shot_gen_e9b043.py
opencompass/configs/datasets/ARC_c/ARC_c_few_shot_ppl.py
opencompass/configs/datasets/ARC_c/ARC_c_gen.py
opencompass/configs/datasets/ARC_c/ARC_c_gen_1e0de5.py
opencompass/configs/datasets/ARC_c/ARC_c_ppl.py
opencompass/configs/datasets/ARC_c/ARC_c_ppl_2ef631.py
opencompass/configs/datasets/ARC_c/ARC_c_ppl_a450bd.py
opencompass/configs/datasets/ARC_c/ARC_c_ppl_d52a21.py
opencompass/configs/datasets/ARC_c/__init__.py
opencompass/configs/datasets/ARC_e/ARC_e_gen.py
opencompass/configs/datasets/ARC_e/ARC_e_gen_1e0de5.py
opencompass/configs/datasets/ARC_e/ARC_e_ppl.py
opencompass/configs/datasets/ARC_e/ARC_e_ppl_2ef631.py
opencompass/configs/datasets/ARC_e/ARC_e_ppl_a450bd.py
opencompass/configs/datasets/ARC_e/ARC_e_ppl_d52a21.py
opencompass/configs/datasets/ARC_e/__init__.py
opencompass/configs/datasets/CIBench/CIBench_generation_gen_8ab0dc.py
opencompass/configs/datasets/CIBench/CIBench_generation_oracle_gen_c4a7c1.py
opencompass/configs/datasets/CIBench/CIBench_template_gen_e6b12a.py
opencompass/configs/datasets/CIBench/CIBench_template_oracle_gen_fecda1.py
opencompass/configs/datasets/CIBench/__init__.py
opencompass/configs/datasets/CLUE_C3/CLUE_C3_gen.py
opencompass/configs/datasets/CLUE_C3/CLUE_C3_gen_8c358f.py
opencompass/configs/datasets/CLUE_C3/CLUE_C3_ppl.py
opencompass/configs/datasets/CLUE_C3/CLUE_C3_ppl_56b537.py
opencompass/configs/datasets/CLUE_C3/CLUE_C3_ppl_e24a31.py
opencompass/configs/datasets/CLUE_C3/__init__.py
opencompass/configs/datasets/CLUE_CMRC/CLUE_CMRC_gen.py
opencompass/configs/datasets/CLUE_CMRC/CLUE_CMRC_gen_1bd3c8.py
opencompass/configs/datasets/CLUE_CMRC/CLUE_CMRC_gen_3749cd.py
opencompass/configs/datasets/CLUE_CMRC/CLUE_CMRC_gen_8484b9.py
opencompass/configs/datasets/CLUE_CMRC/CLUE_CMRC_gen_941108.py
opencompass/configs/datasets/CLUE_CMRC/__init__.py
opencompass/configs/datasets/CLUE_DRCD/CLUE_DRCD_gen.py
opencompass/configs/datasets/CLUE_DRCD/CLUE_DRCD_gen_1bd3c8.py
opencompass/configs/datasets/CLUE_DRCD/CLUE_DRCD_gen_3749cd.py
opencompass/configs/datasets/CLUE_DRCD/CLUE_DRCD_gen_8484b9.py
opencompass/configs/datasets/CLUE_DRCD/CLUE_DRCD_gen_941108.py
opencompass/configs/datasets/CLUE_DRCD/__init__.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_gen.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_gen_901306.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_ppl.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_ppl_378c5b.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_ppl_6507d7.py
opencompass/configs/datasets/CLUE_afqmc/CLUE_afqmc_ppl_7b0c1e.py
opencompass/configs/datasets/CLUE_afqmc/__init__.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_gen.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_gen_1abf97.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_gen_51e956.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_ppl.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_ppl_98dd6e.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_ppl_ef69e7.py
opencompass/configs/datasets/CLUE_cmnli/CLUE_cmnli_ppl_fdc6de.py
opencompass/configs/datasets/CLUE_cmnli/__init__.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_gen.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_gen_51e956.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_gen_c4cb6c.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_ppl.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_ppl_98dd6e.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_ppl_ef69e7.py
opencompass/configs/datasets/CLUE_ocnli/CLUE_ocnli_ppl_fdc6de.py
opencompass/configs/datasets/CLUE_ocnli/__init__.py
opencompass/configs/datasets/ChemBench/ChemBench_gen.py
opencompass/configs/datasets/ChemBench/__init__.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_gen.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_gen_634f41.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_ppl.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_ppl_4b16c0.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_ppl_9ef540.py
opencompass/configs/datasets/FewCLUE_bustm/FewCLUE_bustm_ppl_e53034.py
opencompass/configs/datasets/FewCLUE_bustm/__init__.py
opencompass/configs/datasets/FewCLUE_chid/FewCLUE_chid_gen.py
opencompass/configs/datasets/FewCLUE_chid/FewCLUE_chid_gen_0a29a2.py
opencompass/configs/datasets/FewCLUE_chid/FewCLUE_chid_ppl.py
opencompass/configs/datasets/FewCLUE_chid/FewCLUE_chid_ppl_8f2872.py
opencompass/configs/datasets/FewCLUE_chid/FewCLUE_chid_ppl_acccb5.py
opencompass/configs/datasets/FewCLUE_chid/__init__.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_gen.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_gen_c68933.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_ppl.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_ppl_12e4e0.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_ppl_4284a0.py
opencompass/configs/datasets/FewCLUE_cluewsc/FewCLUE_cluewsc_ppl_868415.py
opencompass/configs/datasets/FewCLUE_cluewsc/__init__.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_gen.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_gen_28b223.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_gen_87f4a8.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_ppl.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_ppl_769f8d.py
opencompass/configs/datasets/FewCLUE_csl/FewCLUE_csl_ppl_841b62.py
opencompass/configs/datasets/FewCLUE_csl/__init__.py
opencompass/configs/datasets/FewCLUE_eprstmt/FewCLUE_eprstmt_gen.py
opencompass/configs/datasets/FewCLUE_eprstmt/FewCLUE_eprstmt_gen_740ea0.py
opencompass/configs/datasets/FewCLUE_eprstmt/FewCLUE_eprstmt_ppl.py
opencompass/configs/datasets/FewCLUE_eprstmt/FewCLUE_eprstmt_ppl_1ce587.py
opencompass/configs/datasets/FewCLUE_eprstmt/FewCLUE_eprstmt_ppl_f1e631.py
opencompass/configs/datasets/FewCLUE_eprstmt/__init__.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/FewCLUE_ocnli_fc_gen.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/FewCLUE_ocnli_fc_gen_f97a97.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/FewCLUE_ocnli_fc_ppl.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/FewCLUE_ocnli_fc_ppl_9e8b3d.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/FewCLUE_ocnli_fc_ppl_c08300.py
opencompass/configs/datasets/FewCLUE_ocnli_fc/__init__.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_gen.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_gen_b90e4a.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_ppl.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_ppl_7d1c07.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_ppl_d10e8a.py
opencompass/configs/datasets/FewCLUE_tnews/FewCLUE_tnews_ppl_fff486.py
opencompass/configs/datasets/FewCLUE_tnews/__init__.py
opencompass/configs/datasets/FinanceIQ/FinanceIQ_gen.py
opencompass/configs/datasets/FinanceIQ/FinanceIQ_gen_e0e6b5.py
opencompass/configs/datasets/FinanceIQ/FinanceIQ_ppl.py
opencompass/configs/datasets/FinanceIQ/FinanceIQ_ppl_42b9bd.py
opencompass/configs/datasets/FinanceIQ/__init__.py
opencompass/configs/datasets/GLUE_CoLA/GLUE_CoLA_ppl.py
opencompass/configs/datasets/GLUE_CoLA/GLUE_CoLA_ppl_77d0df.py
opencompass/configs/datasets/GLUE_CoLA/__init__.py
opencompass/configs/datasets/GLUE_MRPC/GLUE_MRPC_ppl.py
opencompass/configs/datasets/GLUE_MRPC/GLUE_MRPC_ppl_96564c.py
opencompass/configs/datasets/GLUE_MRPC/__init__.py
opencompass/configs/datasets/GLUE_QQP/GLUE_QQP_ppl.py
opencompass/configs/datasets/GLUE_QQP/GLUE_QQP_ppl_250d00.py
opencompass/configs/datasets/GLUE_QQP/__init__.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_gen_5cfe9e.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_mixed_9af5ee.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_4c31db.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_no_subjective_gen_d21e37.py
opencompass/configs/datasets/GaokaoBench/GaokaoBench_prompts.py
opencompass/configs/datasets/GaokaoBench/__init__.py
opencompass/configs/datasets/IFEval/IFEval_gen.py
opencompass/configs/datasets/IFEval/IFEval_gen_3321a3.py
opencompass/configs/datasets/IFEval/__init__.py
opencompass/configs/datasets/LCBench/__init__.py
opencompass/configs/datasets/LCBench/lcbench_gen.py
opencompass/configs/datasets/LCBench/lcbench_gen_5ff288.py
opencompass/configs/datasets/LCBench/lcbench_levels_gen_bb665f.py
opencompass/configs/datasets/LCBench/lcbench_repeat10_gen.py
opencompass/configs/datasets/LCBench/lcbench_repeat10_gen_5ff288.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_gen.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_gen_326684.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_ppl.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_ppl_d2333a.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_zero_shot_gen.py
opencompass/configs/datasets/MMLUArabic/MMLUArabic_zero_shot_gen_3523e0.py
opencompass/configs/datasets/MMLUArabic/__init__.py
opencompass/configs/datasets/MathBench/__init__.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_2024_gen_de9ff9.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_agent_gen_48ec47.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_agent_gen_fbe13b.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_arith_gen_ccd638.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_cot_gen_66f329.py
opencompass/configs/datasets/MathBench/deprecated_mathbench_gen_7b734b.py
opencompass/configs/datasets/MathBench/mathbench_2024_few_shot_mixed_4a3fd4.py
opencompass/configs/datasets/MathBench/mathbench_2024_gen_19e486.py
opencompass/configs/datasets/MathBench/mathbench_2024_gen_1dc21d.py
opencompass/configs/datasets/MathBench/mathbench_2024_gen_50a320.py
opencompass/configs/datasets/MathBench/mathbench_2024_gen_fc2a24.py
opencompass/configs/datasets/MathBench/mathbench_2024_wocircular_gen_1dc21d.py
opencompass/configs/datasets/MathBench/mathbench_2024_wocircular_mixed_8eb12b.py
opencompass/configs/datasets/MathBench/mathbench_gen.py
opencompass/configs/datasets/MathBench/mathbench_prompt.py
opencompass/configs/datasets/MedBench/__init__.py
opencompass/configs/datasets/MedBench/medbench_gen.py
opencompass/configs/datasets/MedBench/medbench_gen_0b4fff.py
opencompass/configs/datasets/NPHardEval/NPHardEval_gen.py
opencompass/configs/datasets/NPHardEval/NPHardEval_gen_22aac5.py
opencompass/configs/datasets/NPHardEval/__init__.py
opencompass/configs/datasets/OpenFinData/OpenFinData_gen.py
opencompass/configs/datasets/OpenFinData/OpenFinData_gen_46dedb.py
opencompass/configs/datasets/OpenFinData/__init__.py
opencompass/configs/datasets/PJExam/PJExam_gen.py
opencompass/configs/datasets/PJExam/PJExam_gen_8cd97c.py
opencompass/configs/datasets/PJExam/__init__.py
opencompass/configs/datasets/PMMEval/__init__.py
opencompass/configs/datasets/PMMEval/flores_gen.py
opencompass/configs/datasets/PMMEval/flores_gen_2697d7.py
opencompass/configs/datasets/PMMEval/humanevalxl_gen.py
opencompass/configs/datasets/PMMEval/humanevalxl_gen_bdec92.py
opencompass/configs/datasets/PMMEval/mgsm_gen.py
opencompass/configs/datasets/PMMEval/mgsm_gen_679720.py
opencompass/configs/datasets/PMMEval/mhellaswag_gen.py
opencompass/configs/datasets/PMMEval/mhellaswag_gen_1a6b73.py
opencompass/configs/datasets/PMMEval/mifeval_gen.py
opencompass/configs/datasets/PMMEval/mifeval_gen_79f8fb.py
opencompass/configs/datasets/PMMEval/mlogiqa_gen.py
opencompass/configs/datasets/PMMEval/mlogiqa_gen_36c4f9.py
opencompass/configs/datasets/PMMEval/mmmlu_gen.py
opencompass/configs/datasets/PMMEval/mmmlu_gen_d5017d.py
opencompass/configs/datasets/PMMEval/pmmeval_gen.py
opencompass/configs/datasets/PMMEval/xnli_gen.py
opencompass/configs/datasets/PMMEval/xnli_gen_973734.py
opencompass/configs/datasets/QuALITY/QuALITY_gen.py
opencompass/configs/datasets/QuALITY/QuALITY_gen_c407cb.py
opencompass/configs/datasets/QuALITY/__init__.py
opencompass/configs/datasets/SVAMP/__init__.py
opencompass/configs/datasets/SVAMP/svamp_gen.py
opencompass/configs/datasets/SVAMP/svamp_gen_fb25e4.py
opencompass/configs/datasets/SuperGLUE_AX_b/SuperGLUE_AX_b_gen.py
opencompass/configs/datasets/SuperGLUE_AX_b/SuperGLUE_AX_b_gen_4dfefa.py
opencompass/configs/datasets/SuperGLUE_AX_b/SuperGLUE_AX_b_ppl.py
opencompass/configs/datasets/SuperGLUE_AX_b/SuperGLUE_AX_b_ppl_0748aa.py
opencompass/configs/datasets/SuperGLUE_AX_b/SuperGLUE_AX_b_ppl_6db806.py
opencompass/configs/datasets/SuperGLUE_AX_b/__init__.py
opencompass/configs/datasets/SuperGLUE_AX_g/SuperGLUE_AX_g_gen.py
opencompass/configs/datasets/SuperGLUE_AX_g/SuperGLUE_AX_g_gen_68aac7.py
opencompass/configs/datasets/SuperGLUE_AX_g/SuperGLUE_AX_g_ppl.py
opencompass/configs/datasets/SuperGLUE_AX_g/SuperGLUE_AX_g_ppl_50f8f6.py
opencompass/configs/datasets/SuperGLUE_AX_g/SuperGLUE_AX_g_ppl_66caf3.py
opencompass/configs/datasets/SuperGLUE_AX_g/__init__.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_cot_gen_1d56df.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_few_shot_gen_ba58ea.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_few_shot_ppl.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_gen.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_gen_883d50.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl_16b1d9.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl_314797.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl_314b96.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl_4da4db.py
opencompass/configs/datasets/SuperGLUE_BoolQ/SuperGLUE_BoolQ_ppl_9619db.py
opencompass/configs/datasets/SuperGLUE_BoolQ/__init__.py
opencompass/configs/datasets/SuperGLUE_CB/SuperGLUE_CB_gen.py
opencompass/configs/datasets/SuperGLUE_CB/SuperGLUE_CB_gen_854c6c.py
opencompass/configs/datasets/SuperGLUE_CB/SuperGLUE_CB_ppl.py
opencompass/configs/datasets/SuperGLUE_CB/SuperGLUE_CB_ppl_0143fe.py
opencompass/configs/datasets/SuperGLUE_CB/SuperGLUE_CB_ppl_11c175.py
opencompass/configs/datasets/SuperGLUE_CB/__init__.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_gen.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_gen_91ca53.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_ppl.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_ppl_54058d.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_ppl_5c24f1.py
opencompass/configs/datasets/SuperGLUE_COPA/SuperGLUE_COPA_ppl_9f3618.py
opencompass/configs/datasets/SuperGLUE_COPA/__init__.py
opencompass/configs/datasets/SuperGLUE_MultiRC/SuperGLUE_MultiRC_gen.py
opencompass/configs/datasets/SuperGLUE_MultiRC/SuperGLUE_MultiRC_gen_27071f.py
opencompass/configs/datasets/SuperGLUE_MultiRC/SuperGLUE_MultiRC_ppl.py
opencompass/configs/datasets/SuperGLUE_MultiRC/SuperGLUE_MultiRC_ppl_866273.py
opencompass/configs/datasets/SuperGLUE_MultiRC/SuperGLUE_MultiRC_ppl_ced824.py
opencompass/configs/datasets/SuperGLUE_MultiRC/__init__.py
opencompass/configs/datasets/SuperGLUE_RTE/SuperGLUE_RTE_gen.py
opencompass/configs/datasets/SuperGLUE_RTE/SuperGLUE_RTE_gen_68aac7.py
opencompass/configs/datasets/SuperGLUE_RTE/SuperGLUE_RTE_ppl.py
opencompass/configs/datasets/SuperGLUE_RTE/SuperGLUE_RTE_ppl_50f8f6.py
opencompass/configs/datasets/SuperGLUE_RTE/SuperGLUE_RTE_ppl_66caf3.py
opencompass/configs/datasets/SuperGLUE_RTE/__init__.py
opencompass/configs/datasets/SuperGLUE_ReCoRD/SuperGLUE_ReCoRD_gen.py
opencompass/configs/datasets/SuperGLUE_ReCoRD/SuperGLUE_ReCoRD_gen_0f7784.py
opencompass/configs/datasets/SuperGLUE_ReCoRD/SuperGLUE_ReCoRD_gen_30dea0.py
opencompass/configs/datasets/SuperGLUE_ReCoRD/SuperGLUE_ReCoRD_gen_a69961.py
opencompass/configs/datasets/SuperGLUE_ReCoRD/__init__.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_gen.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_gen_7902a7.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_gen_fe4bf3.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_ppl.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_ppl_003529.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_ppl_1c4a90.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_ppl_d0f531.py
opencompass/configs/datasets/SuperGLUE_WSC/SuperGLUE_WSC_ppl_f37e78.py
opencompass/configs/datasets/SuperGLUE_WSC/__init__.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_gen.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_gen_d06864.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_ppl.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_ppl_312de9.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_ppl_3fb6fd.py
opencompass/configs/datasets/SuperGLUE_WiC/SuperGLUE_WiC_ppl_c926be.py
opencompass/configs/datasets/SuperGLUE_WiC/__init__.py
opencompass/configs/datasets/TabMWP/TabMWP_gen.py
opencompass/configs/datasets/TabMWP/TabMWP_gen_2aef96.py
opencompass/configs/datasets/TabMWP/__init__.py
opencompass/configs/datasets/TheoremQA/TheoremQA_5shot_gen_6f0af8.py
opencompass/configs/datasets/TheoremQA/TheoremQA_few_shot_examples.py
opencompass/configs/datasets/TheoremQA/TheoremQA_few_shot_examples_official.py
opencompass/configs/datasets/TheoremQA/TheoremQA_gen.py
opencompass/configs/datasets/TheoremQA/__init__.py
opencompass/configs/datasets/TheoremQA/deprecated_TheoremQA_gen_424e0a.py
opencompass/configs/datasets/TheoremQA/deprecated_TheoremQA_gen_7009de.py
opencompass/configs/datasets/TheoremQA/deprecated_TheoremQA_gen_ef26ca.py
opencompass/configs/datasets/TheoremQA/deprecated_TheoremQA_post_v2_gen_2c2583.py
opencompass/configs/datasets/TheoremQA/deprecated_TheoremQA_post_v2_gen_ef26ca.py
opencompass/configs/datasets/XCOPA/XCOPA_ppl.py
opencompass/configs/datasets/XCOPA/XCOPA_ppl_54058d.py
opencompass/configs/datasets/XCOPA/__init__.py
opencompass/configs/datasets/XLSum/XLSum_gen.py
opencompass/configs/datasets/XLSum/XLSum_gen_2bb71c.py
opencompass/configs/datasets/XLSum/__init__.py
opencompass/configs/datasets/Xsum/Xsum_gen.py
opencompass/configs/datasets/Xsum/Xsum_gen_31397e.py
opencompass/configs/datasets/Xsum/Xsum_gen_8ea5f8.py
opencompass/configs/datasets/Xsum/__init__.py
opencompass/configs/datasets/adv_glue/__init__.py
opencompass/configs/datasets/agieval/__init__.py
opencompass/configs/datasets/agieval/agieval_gen.py
opencompass/configs/datasets/agieval/agieval_gen_397d81.py
opencompass/configs/datasets/agieval/agieval_gen_617738.py
opencompass/configs/datasets/agieval/agieval_gen_64afd3.py
opencompass/configs/datasets/agieval/agieval_gen_a0c741.py
opencompass/configs/datasets/agieval/agieval_mixed.py
opencompass/configs/datasets/agieval/agieval_mixed_0fa998.py
opencompass/configs/datasets/anli/__init__.py
opencompass/configs/datasets/anli/anli_gen.py
opencompass/configs/datasets/anli/anli_gen_fc7328.py
opencompass/configs/datasets/anli/anli_ppl.py
opencompass/configs/datasets/anli/anli_ppl_1d290e.py
opencompass/configs/datasets/anthropics_evals/__init__.py
opencompass/configs/datasets/anthropics_evals/airisk_gen.py
opencompass/configs/datasets/anthropics_evals/airisk_gen_ba66fc.py
opencompass/configs/datasets/anthropics_evals/persona_gen.py
opencompass/configs/datasets/anthropics_evals/persona_gen_cc72e2.py
opencompass/configs/datasets/anthropics_evals/sycophancy_gen.py
opencompass/configs/datasets/anthropics_evals/sycophancy_gen_4bba45.py
opencompass/configs/datasets/apps/__init__.py
opencompass/configs/datasets/apps/apps_gen.py
opencompass/configs/datasets/apps/apps_gen_c7893a.py
opencompass/configs/datasets/apps/apps_mini_gen.py
opencompass/configs/datasets/apps/apps_mini_gen_c7893a.py
opencompass/configs/datasets/apps/deprecated_apps_gen_5b4254.py
opencompass/configs/datasets/apps/deprecated_apps_gen_7fbb95.py
opencompass/configs/datasets/apps/deprecated_apps_gen_b4dee3.py
opencompass/configs/datasets/bbh/__init__.py
opencompass/configs/datasets/bbh/bbh_gen.py
opencompass/configs/datasets/bbh/bbh_gen_2879b0.py
opencompass/configs/datasets/bbh/bbh_gen_4a31fa.py
opencompass/configs/datasets/bbh/bbh_gen_5b92b0.py
opencompass/configs/datasets/bbh/bbh_gen_5bf00b.py
opencompass/configs/datasets/bbh/bbh_gen_98fba6.py
opencompass/configs/datasets/bbh/bbh_subset_settings.py
opencompass/configs/datasets/bbh/lib_prompt/__init__.py
opencompass/configs/datasets/bbh/lib_prompt/boolean_expressions.txt
opencompass/configs/datasets/bbh/lib_prompt/causal_judgement.txt
opencompass/configs/datasets/bbh/lib_prompt/date_understanding.txt
opencompass/configs/datasets/bbh/lib_prompt/disambiguation_qa.txt
opencompass/configs/datasets/bbh/lib_prompt/dyck_languages.txt
opencompass/configs/datasets/bbh/lib_prompt/formal_fallacies.txt
opencompass/configs/datasets/bbh/lib_prompt/geometric_shapes.txt
opencompass/configs/datasets/bbh/lib_prompt/hyperbaton.txt
opencompass/configs/datasets/bbh/lib_prompt/logical_deduction_five_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/logical_deduction_seven_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/logical_deduction_three_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/movie_recommendation.txt
opencompass/configs/datasets/bbh/lib_prompt/multistep_arithmetic_two.txt
opencompass/configs/datasets/bbh/lib_prompt/navigate.txt
opencompass/configs/datasets/bbh/lib_prompt/object_counting.txt
opencompass/configs/datasets/bbh/lib_prompt/penguins_in_a_table.txt
opencompass/configs/datasets/bbh/lib_prompt/reasoning_about_colored_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/ruin_names.txt
opencompass/configs/datasets/bbh/lib_prompt/salient_translation_error_detection.txt
opencompass/configs/datasets/bbh/lib_prompt/snarks.txt
opencompass/configs/datasets/bbh/lib_prompt/sports_understanding.txt
opencompass/configs/datasets/bbh/lib_prompt/temporal_sequences.txt
opencompass/configs/datasets/bbh/lib_prompt/tracking_shuffled_objects_five_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/tracking_shuffled_objects_seven_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/tracking_shuffled_objects_three_objects.txt
opencompass/configs/datasets/bbh/lib_prompt/web_of_lies.txt
opencompass/configs/datasets/bbh/lib_prompt/word_sorting.txt
opencompass/configs/datasets/ceval/__init__.py
opencompass/configs/datasets/ceval/ceval_clean_ppl.py
opencompass/configs/datasets/ceval/ceval_gen.py
opencompass/configs/datasets/ceval/ceval_gen_2daf24.py
opencompass/configs/datasets/ceval/ceval_gen_5f30c7.py
opencompass/configs/datasets/ceval/ceval_internal_ppl_1cd8bf.py
opencompass/configs/datasets/ceval/ceval_internal_ppl_93e5ce.py
opencompass/configs/datasets/ceval/ceval_ppl.py
opencompass/configs/datasets/ceval/ceval_ppl_1cd8bf.py
opencompass/configs/datasets/ceval/ceval_ppl_578f8d.py
opencompass/configs/datasets/ceval/ceval_ppl_93e5ce.py
opencompass/configs/datasets/ceval/ceval_zero_shot_gen_bd40ef.py
opencompass/configs/datasets/civilcomments/__init__.py
opencompass/configs/datasets/civilcomments/civilcomments_clp.py
opencompass/configs/datasets/civilcomments/civilcomments_clp_6a2561.py
opencompass/configs/datasets/civilcomments/civilcomments_clp_a3c5fd.py
opencompass/configs/datasets/clozeTest_maxmin/__init__.py
opencompass/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen.py
opencompass/configs/datasets/clozeTest_maxmin/clozeTest_maxmin_gen_c205fb.py
opencompass/configs/datasets/cmb/__init__.py
opencompass/configs/datasets/cmb/cmb_gen.py
opencompass/configs/datasets/cmb/cmb_gen_dfb5c4.py
opencompass/configs/datasets/cmmlu/__init__.py
opencompass/configs/datasets/cmmlu/cmmlu_0shot_cot_gen_305931.py
opencompass/configs/datasets/cmmlu/cmmlu_gen.py
opencompass/configs/datasets/cmmlu/cmmlu_gen_c13365.py
opencompass/configs/datasets/cmmlu/cmmlu_ppl.py
opencompass/configs/datasets/cmmlu/cmmlu_ppl_041cbf.py
opencompass/configs/datasets/cmmlu/cmmlu_ppl_8b9c76.py
opencompass/configs/datasets/collections/__init__.py
opencompass/configs/datasets/collections/base_core.py
opencompass/configs/datasets/collections/base_medium.py
opencompass/configs/datasets/collections/base_medium_llama.py
opencompass/configs/datasets/collections/base_small.py
opencompass/configs/datasets/collections/chat_core.py
opencompass/configs/datasets/collections/chat_medium.py
opencompass/configs/datasets/collections/chat_small.py
opencompass/configs/datasets/collections/example.py
opencompass/configs/datasets/commonsenseqa/__init__.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_7shot_cot_gen_734a22.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_gen.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_gen_1da2d0.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_gen_c946f2.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl_3e9f2d.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl_5545e2.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl_716f78.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl_c49e77.py
opencompass/configs/datasets/commonsenseqa/commonsenseqa_ppl_e51e32.py
opencompass/configs/datasets/commonsenseqa_cn/__init__.py
opencompass/configs/datasets/commonsenseqa_cn/commonsenseqacn_gen.py
opencompass/configs/datasets/commonsenseqa_cn/commonsenseqacn_gen_d380d0.py
opencompass/configs/datasets/commonsenseqa_cn/commonsenseqacn_ppl.py
opencompass/configs/datasets/commonsenseqa_cn/commonsenseqacn_ppl_971f48.py
opencompass/configs/datasets/contamination/__init__.py
opencompass/configs/datasets/contamination/ceval_contamination_ppl_810ec6.py
opencompass/configs/datasets/contamination/mbpp_contamination_ppl_f01cb6.py
opencompass/configs/datasets/contamination/mmlu_contamination_ppl_810ec6.py
opencompass/configs/datasets/crowspairs/__init__.py
opencompass/configs/datasets/crowspairs/crowspairs_gen.py
opencompass/configs/datasets/crowspairs/crowspairs_gen_02b6c1.py
opencompass/configs/datasets/crowspairs/crowspairs_gen_381af0.py
opencompass/configs/datasets/crowspairs/crowspairs_ppl.py
opencompass/configs/datasets/crowspairs/crowspairs_ppl_47f211.py
opencompass/configs/datasets/crowspairs/crowspairs_ppl_e811e1.py
opencompass/configs/datasets/crowspairs_cn/__init__.py
opencompass/configs/datasets/crowspairs_cn/crowspairscn_gen.py
opencompass/configs/datasets/crowspairs_cn/crowspairscn_gen_556dc9.py
opencompass/configs/datasets/crowspairs_cn/crowspairscn_ppl.py
opencompass/configs/datasets/crowspairs_cn/crowspairscn_ppl_f53575.py
opencompass/configs/datasets/cvalues/__init__.py
opencompass/configs/datasets/cvalues/cvalues_responsibility_gen.py
opencompass/configs/datasets/cvalues/cvalues_responsibility_gen_543378.py
opencompass/configs/datasets/drop/__init__.py
opencompass/configs/datasets/drop/deprecated_drop_gen_8a9ed9.py
opencompass/configs/datasets/drop/drop_examples.py
opencompass/configs/datasets/drop/drop_gen.py
opencompass/configs/datasets/drop/drop_gen_a2697c.py
opencompass/configs/datasets/drop/drop_gen_eb14af.py
opencompass/configs/datasets/drop/drop_openai_simple_evals_gen_3857b0.py
opencompass/configs/datasets/ds1000/__init__.py
opencompass/configs/datasets/ds1000/ds1000_compl_gen_cbc84f.py
opencompass/configs/datasets/ds1000/ds1000_compl_service_eval_gen_cbc84f.py
opencompass/configs/datasets/ds1000/ds1000_gen_5c4bec.py
opencompass/configs/datasets/ds1000/ds1000_gen_cbc84f.py
opencompass/configs/datasets/ds1000/ds1000_service_eval_gen_cbc84f.py
opencompass/configs/datasets/flames/__init__.py
opencompass/configs/datasets/flores/__init__.py
opencompass/configs/datasets/flores/flores_gen.py
opencompass/configs/datasets/flores/flores_gen_806ede.py
opencompass/configs/datasets/flores/flores_gen_aad4fd.py
opencompass/configs/datasets/game24/__init__.py
opencompass/configs/datasets/game24/game24_gen.py
opencompass/configs/datasets/game24/game24_gen_52a460.py
opencompass/configs/datasets/govrepcrs/__init__.py
opencompass/configs/datasets/govrepcrs/govrepcrs_gen.py
opencompass/configs/datasets/govrepcrs/govrepcrs_gen_aa5eb3.py
opencompass/configs/datasets/govrepcrs/govrepcrs_gen_db7930.py
opencompass/configs/datasets/gpqa/__init__.py
opencompass/configs/datasets/gpqa/gpqa_few_shot_ppl_4b5a83.py
opencompass/configs/datasets/gpqa/gpqa_gen.py
opencompass/configs/datasets/gpqa/gpqa_gen_015262.py
opencompass/configs/datasets/gpqa/gpqa_gen_4baadb.py
opencompass/configs/datasets/gpqa/gpqa_openai_simple_evals_gen_5aeece.py
opencompass/configs/datasets/gpqa/gpqa_ppl_6bf57a.py
opencompass/configs/datasets/gsm8k/__init__.py
opencompass/configs/datasets/gsm8k/deprecated_gsm8k_agent_gen_be1606.py
opencompass/configs/datasets/gsm8k/gsm8k_0shot_gen_a58960.py
opencompass/configs/datasets/gsm8k/gsm8k_0shot_v2_gen_a58960.py
opencompass/configs/datasets/gsm8k/gsm8k_agent_gen_c3dff3.py
opencompass/configs/datasets/gsm8k/gsm8k_gen.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_17d0dc.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_1d7fe4.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_1dce88.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_3309bd.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_57b0b1.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_701491.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_a3e34a.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_d6de81.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_e9e91e.py
opencompass/configs/datasets/gsm8k/gsm8k_gen_ee684f.py
opencompass/configs/datasets/gsm8k/gsm8k_model_postprocess_gen_a58960.py
opencompass/configs/datasets/gsm8k/gsm8k_xfinder_gen_a58960.py
opencompass/configs/datasets/gsm8k_contamination/__init__.py
opencompass/configs/datasets/gsm8k_contamination/gsm8k_contamination_ppl_ecdd22.py
opencompass/configs/datasets/gsm_hard/__init__.py
opencompass/configs/datasets/gsm_hard/gsmhard_gen.py
opencompass/configs/datasets/gsm_hard/gsmhard_gen_8a1400.py
opencompass/configs/datasets/hellaswag/__init__.py
opencompass/configs/datasets/hellaswag/hellaswag_10shot_gen_e42710.py
opencompass/configs/datasets/hellaswag/hellaswag_10shot_ppl_59c85e.py
opencompass/configs/datasets/hellaswag/hellaswag_clean_ppl.py
opencompass/configs/datasets/hellaswag/hellaswag_gen.py
opencompass/configs/datasets/hellaswag/hellaswag_gen_6faab5.py
opencompass/configs/datasets/hellaswag/hellaswag_ppl.py
opencompass/configs/datasets/hellaswag/hellaswag_ppl_47bff9.py
opencompass/configs/datasets/hellaswag/hellaswag_ppl_7d7f2d.py
opencompass/configs/datasets/hellaswag/hellaswag_ppl_9dbb12.py
opencompass/configs/datasets/hellaswag/hellaswag_ppl_a6e128.py
opencompass/configs/datasets/humaneval/__init__.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_4a6eef.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_6d1cc2.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_a82cae.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_d2537e.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_fd5822.py
opencompass/configs/datasets/humaneval/deprecated_humaneval_gen_ff7054.py
opencompass/configs/datasets/humaneval/humaneval_gen.py
opencompass/configs/datasets/humaneval/humaneval_gen_66a7f4.py
opencompass/configs/datasets/humaneval/humaneval_gen_8e312c.py
opencompass/configs/datasets/humaneval/humaneval_openai_sample_evals_gen_159614.py
opencompass/configs/datasets/humaneval/humaneval_passk_gen_8e312c.py
opencompass/configs/datasets/humaneval/humaneval_repeat10_gen_8e312c.py
opencompass/configs/datasets/humaneval_cn/__init__.py
opencompass/configs/datasets/humaneval_cn/humaneval_cn_gen.py
opencompass/configs/datasets/humaneval_cn/humaneval_cn_gen_6313aa.py
opencompass/configs/datasets/humaneval_cn/humaneval_cn_passk_gen_6313aa.py
opencompass/configs/datasets/humaneval_cn/humaneval_cn_repeat10_gen_6313aa.py
opencompass/configs/datasets/humaneval_multi/__init__.py
opencompass/configs/datasets/humaneval_multi/humaneval_multi_gen.py
opencompass/configs/datasets/humaneval_multi/humaneval_multi_gen_82cf85.py
opencompass/configs/datasets/humaneval_plus/__init__.py
opencompass/configs/datasets/humaneval_plus/humaneval_plus_gen.py
opencompass/configs/datasets/humaneval_plus/humaneval_plus_gen_66a7f4.py
opencompass/configs/datasets/humaneval_plus/humaneval_plus_gen_8e312c.py
opencompass/configs/datasets/humaneval_plus/humaneval_plus_passk_gen_8e312c.py
opencompass/configs/datasets/humaneval_plus/humaneval_plus_repeat10_gen_8e312c.py
opencompass/configs/datasets/humanevalx/__init__.py
opencompass/configs/datasets/humanevalx/humanevalx_gen.py
opencompass/configs/datasets/humanevalx/humanevalx_gen_0af626.py
opencompass/configs/datasets/humanevalx/humanevalx_gen_620cfa.py
opencompass/configs/datasets/hungarian_exam/__init__.py
opencompass/configs/datasets/hungarian_exam/hungarian_exam_gen.py
opencompass/configs/datasets/hungarian_exam/hungarian_exam_gen_8a1435.py
opencompass/configs/datasets/infinitebench/__init__.py
opencompass/configs/datasets/infinitebench/infinitebench.py
opencompass/configs/datasets/infinitebench/infinitebenchcodedebug/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchcodedebug/infinitebench_codedebug_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchcodedebug/infinitebench_codedebug_gen_276a42.py
opencompass/configs/datasets/infinitebench/infinitebenchcoderun/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchcoderun/infinitebench_coderun_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchcoderun/infinitebench_coderun_gen_1a76bd.py
opencompass/configs/datasets/infinitebench/infinitebenchendia/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchendia/infinitebench_endia_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchendia/infinitebench_endia_gen_c96eb5.py
opencompass/configs/datasets/infinitebench/infinitebenchenmc/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchenmc/infinitebench_enmc_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchenmc/infinitebench_enmc_gen_3a4102.py
opencompass/configs/datasets/infinitebench/infinitebenchenqa/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchenqa/infinitebench_enqa_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchenqa/infinitebench_enqa_gen_a1640c.py
opencompass/configs/datasets/infinitebench/infinitebenchensum/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchensum/infinitebench_ensum_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchensum/infinitebench_ensum_gen_cfbc08.py
opencompass/configs/datasets/infinitebench/infinitebenchmathcalc/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchmathcalc/infinitebench_mathcalc_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchmathcalc/infinitebench_mathcalc_gen_78d17e.py
opencompass/configs/datasets/infinitebench/infinitebenchmathfind/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchmathfind/infinitebench_mathfind_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchmathfind/infinitebench_mathfind_gen_6d799e.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievekv/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievekv/infinitebench_retrievekv_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievekv/infinitebench_retrievekv_gen_06b3ac.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievenumber/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievenumber/infinitebench_retrievenumber_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievenumber/infinitebench_retrievenumber_gen_047436.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievepasskey/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievepasskey/infinitebench_retrievepasskey_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchretrievepasskey/infinitebench_retrievepasskey_gen_62ff68.py
opencompass/configs/datasets/infinitebench/infinitebenchzhqa/__init__.py
opencompass/configs/datasets/infinitebench/infinitebenchzhqa/infinitebench_zhqa_gen.py
opencompass/configs/datasets/infinitebench/infinitebenchzhqa/infinitebench_zhqa_gen_1e5293.py
opencompass/configs/datasets/iwslt2017/__init__.py
opencompass/configs/datasets/iwslt2017/iwslt2017_gen.py
opencompass/configs/datasets/iwslt2017/iwslt2017_gen_69ce16.py
opencompass/configs/datasets/iwslt2017/iwslt2017_gen_b4a814.py
opencompass/configs/datasets/iwslt2017/iwslt2017_gen_d0ebd1.py
opencompass/configs/datasets/jigsawmultilingual/__init__.py
opencompass/configs/datasets/jigsawmultilingual/jigsawmultilingual_clp.py
opencompass/configs/datasets/jigsawmultilingual/jigsawmultilingual_clp_1af0ae.py
opencompass/configs/datasets/jigsawmultilingual/jigsawmultilingual_clp_fe50d8.py
opencompass/configs/datasets/kaoshi/__init__.py
opencompass/configs/datasets/kaoshi/kaoshi_gen.py
opencompass/configs/datasets/kaoshi/kaoshi_gen_86aca2.py
opencompass/configs/datasets/lambada/__init__.py
opencompass/configs/datasets/lambada/lambada_gen.py
opencompass/configs/datasets/lambada/lambada_gen_217e11.py
opencompass/configs/datasets/lambada/lambada_gen_8b48a5.py
opencompass/configs/datasets/lawbench/__init__.py
opencompass/configs/datasets/lawbench/lawbench_one_shot_gen_002588.py
opencompass/configs/datasets/lawbench/lawbench_zero_shot_gen_002588.py
opencompass/configs/datasets/lcsts/__init__.py
opencompass/configs/datasets/lcsts/lcsts_gen.py
opencompass/configs/datasets/lcsts/lcsts_gen_8ee1fe.py
opencompass/configs/datasets/lcsts/lcsts_gen_9b0b89.py
opencompass/configs/datasets/leval/__init__.py
opencompass/configs/datasets/leval/leval.py
opencompass/configs/datasets/leval/levalcoursera/__init__.py
opencompass/configs/datasets/leval/levalcoursera/leval_coursera_gen.py
opencompass/configs/datasets/leval/levalcoursera/leval_coursera_gen_36a006.py
opencompass/configs/datasets/leval/levalfinancialqa/__init__.py
opencompass/configs/datasets/leval/levalfinancialqa/leval_financialqa_gen.py
opencompass/configs/datasets/leval/levalfinancialqa/leval_financialqa_gen_b03798.py
opencompass/configs/datasets/leval/levalgovreportsumm/__init__.py
opencompass/configs/datasets/leval/levalgovreportsumm/leval_gov_report_summ_gen.py
opencompass/configs/datasets/leval/levalgovreportsumm/leval_gov_report_summ_gen_b03798.py
opencompass/configs/datasets/leval/levalgsm100/__init__.py
opencompass/configs/datasets/leval/levalgsm100/leval_gsm100_gen.py
opencompass/configs/datasets/leval/levalgsm100/leval_gsm100_gen_77dd94.py
opencompass/configs/datasets/leval/levallegalcontractqa/__init__.py
opencompass/configs/datasets/leval/levallegalcontractqa/leval_legalcontractqa_gen.py
opencompass/configs/datasets/leval/levallegalcontractqa/leval_legalcontractqa_gen_68a2ac.py
opencompass/configs/datasets/leval/levalmeetingsumm/__init__.py
opencompass/configs/datasets/leval/levalmeetingsumm/leval_meetingsumm_gen.py
opencompass/configs/datasets/leval/levalmeetingsumm/leval_meetingsumm_gen_b03798.py
opencompass/configs/datasets/leval/levalmultidocqa/__init__.py
opencompass/configs/datasets/leval/levalmultidocqa/leval_multidocqa_gen.py
opencompass/configs/datasets/leval/levalmultidocqa/leval_multidocqa_gen_96bf3f.py
opencompass/configs/datasets/leval/levalnarrativeqa/__init__.py
opencompass/configs/datasets/leval/levalnarrativeqa/leval_narrativeqa_gen.py
opencompass/configs/datasets/leval/levalnarrativeqa/leval_narrativeqa_gen_766dd0.py
opencompass/configs/datasets/leval/levalnaturalquestion/__init__.py
opencompass/configs/datasets/leval/levalnaturalquestion/leval_naturalquestion_gen.py
opencompass/configs/datasets/leval/levalnaturalquestion/leval_naturalquestion_gen_52c33f.py
opencompass/configs/datasets/leval/levalnewssumm/__init__.py
opencompass/configs/datasets/leval/levalnewssumm/leval_newssumm_gen.py
opencompass/configs/datasets/leval/levalnewssumm/leval_newssumm_gen_b03798.py
opencompass/configs/datasets/leval/levalpaperassistant/__init__.py
opencompass/configs/datasets/leval/levalpaperassistant/leval_paper_assistant_gen.py
opencompass/configs/datasets/leval/levalpaperassistant/leval_paper_assistant_gen_b03798.py
opencompass/configs/datasets/leval/levalpatentsumm/__init__.py
opencompass/configs/datasets/leval/levalpatentsumm/leval_patent_summ_gen.py
opencompass/configs/datasets/leval/levalpatentsumm/leval_patent_summ_gen_b03798.py
opencompass/configs/datasets/leval/levalquality/__init__.py
opencompass/configs/datasets/leval/levalquality/leval_quality_gen.py
opencompass/configs/datasets/leval/levalquality/leval_quality_gen_36a006.py
opencompass/configs/datasets/leval/levalreviewsumm/__init__.py
opencompass/configs/datasets/leval/levalreviewsumm/leval_review_summ_gen.py
opencompass/configs/datasets/leval/levalreviewsumm/leval_review_summ_gen_b03798.py
opencompass/configs/datasets/leval/levalscientificqa/__init__.py
opencompass/configs/datasets/leval/levalscientificqa/leval_scientificqa_gen.py
opencompass/configs/datasets/leval/levalscientificqa/leval_scientificqa_gen_96bf3f.py
opencompass/configs/datasets/leval/levaltopicretrieval/__init__.py
opencompass/configs/datasets/leval/levaltopicretrieval/leval_topic_retrieval_gen.py
opencompass/configs/datasets/leval/levaltopicretrieval/leval_topic_retrieval_gen_bf433f.py
opencompass/configs/datasets/leval/levaltpo/__init__.py
opencompass/configs/datasets/leval/levaltpo/leval_tpo_gen.py
opencompass/configs/datasets/leval/levaltpo/leval_tpo_gen_36a006.py
opencompass/configs/datasets/leval/levaltvshowsumm/__init__.py
opencompass/configs/datasets/leval/levaltvshowsumm/leval_tvshow_summ_gen.py
opencompass/configs/datasets/leval/levaltvshowsumm/leval_tvshow_summ_gen_b03798.py
opencompass/configs/datasets/llm_compression/__init__.py
opencompass/configs/datasets/llm_compression/llm_compression.py
opencompass/configs/datasets/longbench/__init__.py
opencompass/configs/datasets/longbench/longbench.py
opencompass/configs/datasets/longbench/longbench2wikimqa/__init__.py
opencompass/configs/datasets/longbench/longbench2wikimqa/longbench_2wikimqa_gen.py
opencompass/configs/datasets/longbench/longbench2wikimqa/longbench_2wikimqa_gen_6b3efc.py
opencompass/configs/datasets/longbench/longbenchdureader/__init__.py
opencompass/configs/datasets/longbench/longbenchdureader/longbench_dureader_gen.py
opencompass/configs/datasets/longbench/longbenchdureader/longbench_dureader_gen_c6c7e4.py
opencompass/configs/datasets/longbench/longbenchgov_report/__init__.py
opencompass/configs/datasets/longbench/longbenchgov_report/longbench_gov_report_gen.py
opencompass/configs/datasets/longbench/longbenchgov_report/longbench_gov_report_gen_54c5b0.py
opencompass/configs/datasets/longbench/longbenchhotpotqa/__init__.py
opencompass/configs/datasets/longbench/longbenchhotpotqa/longbench_hotpotqa_gen.py
opencompass/configs/datasets/longbench/longbenchhotpotqa/longbench_hotpotqa_gen_6b3efc.py
opencompass/configs/datasets/longbench/longbenchlcc/__init__.py
opencompass/configs/datasets/longbench/longbenchlcc/longbench_lcc_gen.py
opencompass/configs/datasets/longbench/longbenchlcc/longbench_lcc_gen_6ba507.py
opencompass/configs/datasets/longbench/longbenchlsht/__init__.py
opencompass/configs/datasets/longbench/longbenchlsht/longbench_lsht_gen.py
opencompass/configs/datasets/longbench/longbenchlsht/longbench_lsht_gen_e8a339.py
opencompass/configs/datasets/longbench/longbenchmulti_news/__init__.py
opencompass/configs/datasets/longbench/longbenchmulti_news/longbench_multi_news_gen.py
opencompass/configs/datasets/longbench/longbenchmulti_news/longbench_multi_news_gen_6f9da9.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_en/__init__.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_en/longbench_multifieldqa_en_gen.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_en/longbench_multifieldqa_en_gen_d3838e.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_zh/__init__.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_zh/longbench_multifieldqa_zh_gen.py
opencompass/configs/datasets/longbench/longbenchmultifieldqa_zh/longbench_multifieldqa_zh_gen_e9a7ef.py
opencompass/configs/datasets/longbench/longbenchmusique/__init__.py
opencompass/configs/datasets/longbench/longbenchmusique/longbench_musique_gen.py
opencompass/configs/datasets/longbench/longbenchmusique/longbench_musique_gen_6b3efc.py
opencompass/configs/datasets/longbench/longbenchnarrativeqa/__init__.py
opencompass/configs/datasets/longbench/longbenchnarrativeqa/longbench_narrativeqa_gen.py
opencompass/configs/datasets/longbench/longbenchnarrativeqa/longbench_narrativeqa_gen_a68305.py
opencompass/configs/datasets/longbench/longbenchpassage_count/__init__.py
opencompass/configs/datasets/longbench/longbenchpassage_count/longbench_passage_count_gen.py
opencompass/configs/datasets/longbench/longbenchpassage_count/longbench_passage_count_gen_dcdaab.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_en/__init__.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_en/longbench_passage_retrieval_en_gen.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_en/longbench_passage_retrieval_en_gen_734db5.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_zh/__init__.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_zh/longbench_passage_retrieval_zh_gen.py
opencompass/configs/datasets/longbench/longbenchpassage_retrieval_zh/longbench_passage_retrieval_zh_gen_01cca2.py
opencompass/configs/datasets/longbench/longbenchqasper/__init__.py
opencompass/configs/datasets/longbench/longbenchqasper/longbench_qasper_gen.py
opencompass/configs/datasets/longbench/longbenchqasper/longbench_qasper_gen_6b3efc.py
opencompass/configs/datasets/longbench/longbenchqmsum/__init__.py
opencompass/configs/datasets/longbench/longbenchqmsum/longbench_qmsum_gen.py
opencompass/configs/datasets/longbench/longbenchqmsum/longbench_qmsum_gen_d33331.py
opencompass/configs/datasets/longbench/longbenchrepobench/__init__.py
opencompass/configs/datasets/longbench/longbenchrepobench/longbench_repobench_gen.py
opencompass/configs/datasets/longbench/longbenchrepobench/longbench_repobench_gen_6df953.py
opencompass/configs/datasets/longbench/longbenchsamsum/__init__.py
opencompass/configs/datasets/longbench/longbenchsamsum/longbench_samsum_gen.py
opencompass/configs/datasets/longbench/longbenchsamsum/longbench_samsum_gen_f4416d.py
opencompass/configs/datasets/longbench/longbenchtrec/__init__.py
opencompass/configs/datasets/longbench/longbenchtrec/longbench_trec_gen.py
opencompass/configs/datasets/longbench/longbenchtrec/longbench_trec_gen_824187.py
opencompass/configs/datasets/longbench/longbenchtriviaqa/__init__.py
opencompass/configs/datasets/longbench/longbenchtriviaqa/longbench_triviaqa_gen.py
opencompass/configs/datasets/longbench/longbenchtriviaqa/longbench_triviaqa_gen_d30cb9.py
opencompass/configs/datasets/longbench/longbenchvcsum/__init__.py
opencompass/configs/datasets/longbench/longbenchvcsum/longbench_vcsum_gen.py
opencompass/configs/datasets/longbench/longbenchvcsum/longbench_vcsum_gen_f7a8ac.py
opencompass/configs/datasets/lveval/__init__.py
opencompass/configs/datasets/lveval/lveval.py
opencompass/configs/datasets/lveval/lvevalcmrc_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalcmrc_mixup/lveval_cmrc_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalcmrc_mixup/lveval_cmrc_mixup_gen_465823.py
opencompass/configs/datasets/lveval/lvevaldureader_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevaldureader_mixup/lveval_dureader_mixup_gen.py
opencompass/configs/datasets/lveval/lvevaldureader_mixup/lveval_dureader_mixup_gen_465823.py
opencompass/configs/datasets/lveval/lvevalfactrecall_en/__init__.py
opencompass/configs/datasets/lveval/lvevalfactrecall_en/lveval_factrecall_en_gen.py
opencompass/configs/datasets/lveval/lvevalfactrecall_en/lveval_factrecall_en_gen_9a836f.py
opencompass/configs/datasets/lveval/lvevalfactrecall_zh/__init__.py
opencompass/configs/datasets/lveval/lvevalfactrecall_zh/lveval_factrecall_zh_gen.py
opencompass/configs/datasets/lveval/lvevalfactrecall_zh/lveval_factrecall_zh_gen_dbee70.py
opencompass/configs/datasets/lveval/lvevalhotpotwikiqa_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalhotpotwikiqa_mixup/lveval_hotpotwikiqa_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalhotpotwikiqa_mixup/lveval_hotpotwikiqa_mixup_gen_77ce82.py
opencompass/configs/datasets/lveval/lvevallic_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevallic_mixup/lveval_lic_mixup_gen.py
opencompass/configs/datasets/lveval/lvevallic_mixup/lveval_lic_mixup_gen_01eb0c.py
opencompass/configs/datasets/lveval/lvevalloogle_CR_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalloogle_CR_mixup/lveval_loogle_CR_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalloogle_CR_mixup/lveval_loogle_CR_mixup_gen_d7ea36.py
opencompass/configs/datasets/lveval/lvevalloogle_MIR_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalloogle_MIR_mixup/lveval_loogle_MIR_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalloogle_MIR_mixup/lveval_loogle_MIR_mixup_gen_d7ea36.py
opencompass/configs/datasets/lveval/lvevalloogle_SD_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalloogle_SD_mixup/lveval_loogle_SD_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalloogle_SD_mixup/lveval_loogle_SD_mixup_gen_d7ea36.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_en_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_en_mixup/lveval_multifieldqa_en_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_en_mixup/lveval_multifieldqa_en_mixup_gen_d7ea36.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_zh_mixup/__init__.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_zh_mixup/lveval_multifieldqa_zh_mixup_gen.py
opencompass/configs/datasets/lveval/lvevalmultifieldqa_zh_mixup/lveval_multifieldqa_zh_mixup_gen_0fbdad.py
opencompass/configs/datasets/mastermath2024v1/__init__.py
opencompass/configs/datasets/mastermath2024v1/mastermath2024v1_gen.py
opencompass/configs/datasets/mastermath2024v1/mastermath2024v1_gen_be6318.py
opencompass/configs/datasets/math/__init__.py
opencompass/configs/datasets/math/deprecated_math_agent_evaluatorv2_gen_861b4f.py
opencompass/configs/datasets/math/deprecated_math_evaluatorv2_gen_265cce.py
opencompass/configs/datasets/math/math_0shot_gen_393424.py
opencompass/configs/datasets/math/math_0shot_llm_judge_gen_393424.py
opencompass/configs/datasets/math/math_4shot_base_gen_43d5b6.py
opencompass/configs/datasets/math/math_4shot_base_gen_db136b.py
opencompass/configs/datasets/math/math_4shot_example_from_google_research.py
opencompass/configs/datasets/math/math_agent_evaluatorv2_gen_0c1b4e.py
opencompass/configs/datasets/math/math_agent_gen_0c1b4e.py
opencompass/configs/datasets/math/math_agent_gen_861b4f.py
opencompass/configs/datasets/math/math_agent_gen_af2293.py
opencompass/configs/datasets/math/math_evaluatorv2_gen_2f4a71.py
opencompass/configs/datasets/math/math_evaluatorv2_gen_cecb31.py
opencompass/configs/datasets/math/math_gen.py
opencompass/configs/datasets/math/math_gen_0957ff.py
opencompass/configs/datasets/math/math_gen_1ed9c2.py
opencompass/configs/datasets/math/math_gen_265cce.py
opencompass/configs/datasets/math/math_gen_559593.py
opencompass/configs/datasets/math/math_gen_5e8458.py
opencompass/configs/datasets/math/math_gen_736506.py
opencompass/configs/datasets/math/math_gen_78ced2.py
opencompass/configs/datasets/math/math_gen_943d32.py
opencompass/configs/datasets/math/math_intern_evaluator_gen_265cce.py
opencompass/configs/datasets/math/math_llm_judge.py
opencompass/configs/datasets/math401/__init__.py
opencompass/configs/datasets/math401/math401_gen.py
opencompass/configs/datasets/math401/math401_gen_ab5f39.py
opencompass/configs/datasets/mbpp/__init__.py
opencompass/configs/datasets/mbpp/deprecated_mbpp_gen_1e1056.py
opencompass/configs/datasets/mbpp/deprecated_mbpp_gen_6590b0.py
opencompass/configs/datasets/mbpp/deprecated_mbpp_gen_caa7ab.py
opencompass/configs/datasets/mbpp/deprecated_mbpp_passk_gen_1e1056.py
opencompass/configs/datasets/mbpp/deprecated_mbpp_repeat10_gen_1e1056.py
opencompass/configs/datasets/mbpp/deprecated_sanitized_mbpp_gen_1e1056.py
opencompass/configs/datasets/mbpp/deprecated_sanitized_mbpp_gen_cb43ef.py
opencompass/configs/datasets/mbpp/deprecated_sanitized_mbpp_passk_gen_1e1056.py
opencompass/configs/datasets/mbpp/deprecated_sanitized_mbpp_repeat10_gen_1e1056.py
opencompass/configs/datasets/mbpp/mbpp_gen.py
opencompass/configs/datasets/mbpp/mbpp_gen_830460.py
opencompass/configs/datasets/mbpp/mbpp_passk_gen_830460.py
opencompass/configs/datasets/mbpp/mbpp_repeat10_gen_830460.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_gen_742f0c.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_gen_830460.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_gen_a0fc46.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_mdblock_gen_a447ff.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_passk_gen_830460.py
opencompass/configs/datasets/mbpp/sanitized_mbpp_repeat10_gen_830460.py
opencompass/configs/datasets/mbpp_cn/__init__.py
opencompass/configs/datasets/mbpp_cn/deprecated_mbpp_cn_gen_1d1481.py
opencompass/configs/datasets/mbpp_cn/deprecated_mbpp_cn_passk_gen_1d1481.py
opencompass/configs/datasets/mbpp_cn/deprecated_mbpp_cn_repeat10_gen_1d1481.py
opencompass/configs/datasets/mbpp_cn/mbpp_cn_gen.py
opencompass/configs/datasets/mbpp_cn/mbpp_cn_gen_9114d5.py
opencompass/configs/datasets/mbpp_plus/__init__.py
opencompass/configs/datasets/mbpp_plus/deprecated_mbpp_plus_gen_94815c.py
opencompass/configs/datasets/mbpp_plus/mbpp_plus_gen.py
opencompass/configs/datasets/mbpp_plus/mbpp_plus_gen_0b836a.py
opencompass/configs/datasets/mgsm/__init__.py
opencompass/configs/datasets/mgsm/mgsm_gen.py
opencompass/configs/datasets/mgsm/mgsm_gen_d967bc.py
opencompass/configs/datasets/mmlu/__init__.py
opencompass/configs/datasets/mmlu/mmlu_all_sets.py
opencompass/configs/datasets/mmlu/mmlu_clean_ppl.py
opencompass/configs/datasets/mmlu/mmlu_gen.py
opencompass/configs/datasets/mmlu/mmlu_gen_23a9a9.py
opencompass/configs/datasets/mmlu/mmlu_gen_4d595a.py
opencompass/configs/datasets/mmlu/mmlu_gen_5d1409.py
opencompass/configs/datasets/mmlu/mmlu_gen_79e572.py
opencompass/configs/datasets/mmlu/mmlu_gen_a484b3.py
opencompass/configs/datasets/mmlu/mmlu_model_postprocess_gen_4d595a.py
opencompass/configs/datasets/mmlu/mmlu_openai_simple_evals_gen_b618ea.py
opencompass/configs/datasets/mmlu/mmlu_ppl.py
opencompass/configs/datasets/mmlu/mmlu_ppl_ac766d.py
opencompass/configs/datasets/mmlu/mmlu_xfinder_gen_4d595a.py
opencompass/configs/datasets/mmlu/mmlu_zero_shot_gen_47e2c0.py
opencompass/configs/datasets/narrativeqa/__init__.py
opencompass/configs/datasets/narrativeqa/narrativeqa_gen.py
opencompass/configs/datasets/narrativeqa/narrativeqa_gen_a2d88a.py
opencompass/configs/datasets/narrativeqa/narrativeqa_gen_db6413.py
opencompass/configs/datasets/needlebench/__init__.py
opencompass/configs/datasets/needlebench/atc/__init__.py
opencompass/configs/datasets/needlebench/atc/atc.py
opencompass/configs/datasets/needlebench/atc/atc_choice.py
opencompass/configs/datasets/needlebench/atc/atc_choice_20.py
opencompass/configs/datasets/needlebench/atc/atc_choice_50.py
opencompass/configs/datasets/needlebench/atc/atc_choice_50_en_reasoning.py
opencompass/configs/datasets/needlebench/atc/atc_choice_80.py
opencompass/configs/datasets/needlebench/atc/atc_choice_80_en_reasoning.py
opencompass/configs/datasets/needlebench/needlebench_1000k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_1000k/needlebench_1000k.py
opencompass/configs/datasets/needlebench/needlebench_1000k/needlebench_multi_reasoning_1000k.py
opencompass/configs/datasets/needlebench/needlebench_1000k/needlebench_multi_retrieval_1000k.py
opencompass/configs/datasets/needlebench/needlebench_1000k/needlebench_single_1000k.py
opencompass/configs/datasets/needlebench/needlebench_128k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_128k/needlebench_128k.py
opencompass/configs/datasets/needlebench/needlebench_128k/needlebench_multi_reasoning_128k.py
opencompass/configs/datasets/needlebench/needlebench_128k/needlebench_multi_retrieval_128k.py
opencompass/configs/datasets/needlebench/needlebench_128k/needlebench_single_128k.py
opencompass/configs/datasets/needlebench/needlebench_200k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_200k/needlebench_200k.py
opencompass/configs/datasets/needlebench/needlebench_200k/needlebench_multi_reasoning_200k.py
opencompass/configs/datasets/needlebench/needlebench_200k/needlebench_multi_retrieval_200k.py
opencompass/configs/datasets/needlebench/needlebench_200k/needlebench_single_200k.py
opencompass/configs/datasets/needlebench/needlebench_256k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_256k/needlebench_256k.py
opencompass/configs/datasets/needlebench/needlebench_256k/needlebench_multi_reasoning_256k.py
opencompass/configs/datasets/needlebench/needlebench_256k/needlebench_multi_retrieval_256k.py
opencompass/configs/datasets/needlebench/needlebench_256k/needlebench_single_256k.py
opencompass/configs/datasets/needlebench/needlebench_32k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_32k/needlebench_32k.py
opencompass/configs/datasets/needlebench/needlebench_32k/needlebench_multi_reasoning_32k.py
opencompass/configs/datasets/needlebench/needlebench_32k/needlebench_multi_retrieval_32k.py
opencompass/configs/datasets/needlebench/needlebench_32k/needlebench_single_32k.py
opencompass/configs/datasets/needlebench/needlebench_4k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_4k/needlebench_4k.py
opencompass/configs/datasets/needlebench/needlebench_4k/needlebench_multi_reasoning_4k.py
opencompass/configs/datasets/needlebench/needlebench_4k/needlebench_multi_retrieval_4k.py
opencompass/configs/datasets/needlebench/needlebench_4k/needlebench_single_4k.py
opencompass/configs/datasets/needlebench/needlebench_8k/__init__.py
opencompass/configs/datasets/needlebench/needlebench_8k/needlebench_8k.py
opencompass/configs/datasets/needlebench/needlebench_8k/needlebench_multi_reasoning_8k.py
opencompass/configs/datasets/needlebench/needlebench_8k/needlebench_multi_retrieval_8k.py
opencompass/configs/datasets/needlebench/needlebench_8k/needlebench_multi_retrieval_compare_batch_8k.py
opencompass/configs/datasets/needlebench/needlebench_8k/needlebench_single_8k.py
opencompass/configs/datasets/nq/__init__.py
opencompass/configs/datasets/nq/nq_gen.py
opencompass/configs/datasets/nq/nq_gen_0356ec.py
opencompass/configs/datasets/nq/nq_gen_2463e2.py
opencompass/configs/datasets/nq/nq_gen_3dcea1.py
opencompass/configs/datasets/nq/nq_gen_68c1c6.py
opencompass/configs/datasets/nq/nq_gen_c788f6.py
opencompass/configs/datasets/nq/nq_open_1shot_gen_01cf41.py
opencompass/configs/datasets/nq/nq_open_1shot_gen_20a989.py
opencompass/configs/datasets/nq/nq_open_1shot_gen_2e45e5.py
opencompass/configs/datasets/nq/nq_open_gen_e93f8a.py
opencompass/configs/datasets/nq/nq_xfinder_gen_3dcea1.py
opencompass/configs/datasets/nq_cn/__init__.py
opencompass/configs/datasets/nq_cn/nqcn_gen.py
opencompass/configs/datasets/nq_cn/nqcn_gen_141737.py
opencompass/configs/datasets/obqa/__init__.py
opencompass/configs/datasets/obqa/obqa_gen.py
opencompass/configs/datasets/obqa/obqa_gen_9069e4.py
opencompass/configs/datasets/obqa/obqa_ppl.py
opencompass/configs/datasets/obqa/obqa_ppl_1defe8.py
opencompass/configs/datasets/obqa/obqa_ppl_6aac9e.py
opencompass/configs/datasets/obqa/obqa_ppl_c7c154.py
opencompass/configs/datasets/piqa/__init__.py
opencompass/configs/datasets/piqa/piqa_gen.py
opencompass/configs/datasets/piqa/piqa_gen_1194eb.py
opencompass/configs/datasets/piqa/piqa_ppl.py
opencompass/configs/datasets/piqa/piqa_ppl_0cfff2.py
opencompass/configs/datasets/piqa/piqa_ppl_1cf9f0.py
opencompass/configs/datasets/piqa/piqa_ppl_3431ea.py
opencompass/configs/datasets/promptbench/__init__.py
opencompass/configs/datasets/promptbench/promptbench_iwslt2017_gen_cbb8c8.py
opencompass/configs/datasets/promptbench/promptbench_math_gen_abf776.py
opencompass/configs/datasets/promptbench/promptbench_squad20_gen_b15d1c.py
opencompass/configs/datasets/promptbench/promptbench_wnli_gen_50662f.py
opencompass/configs/datasets/py150/__init__.py
opencompass/configs/datasets/py150/py150_gen.py
opencompass/configs/datasets/py150/py150_gen_38b13d.py
opencompass/configs/datasets/qabench/__init__.py
opencompass/configs/datasets/qabench/qabench_gen.py
opencompass/configs/datasets/qabench/qabench_gen_353ae7.py
opencompass/configs/datasets/qasper/__init__.py
opencompass/configs/datasets/qasper/qasper_gen.py
opencompass/configs/datasets/qasper/qasper_gen_a2d88a.py
opencompass/configs/datasets/qasper/qasper_gen_db6413.py
opencompass/configs/datasets/qaspercut/__init__.py
opencompass/configs/datasets/qaspercut/qaspercut_gen.py
opencompass/configs/datasets/qaspercut/qaspercut_gen_a2d88a.py
opencompass/configs/datasets/qaspercut/qaspercut_gen_db6413.py
opencompass/configs/datasets/race/__init__.py
opencompass/configs/datasets/race/race_cot_gen_d95929.py
opencompass/configs/datasets/race/race_few_shot_gen_a498ed.py
opencompass/configs/datasets/race/race_few_shot_ppl.py
opencompass/configs/datasets/race/race_gen.py
opencompass/configs/datasets/race/race_gen_69ee4f.py
opencompass/configs/datasets/race/race_gen_9302a5.py
opencompass/configs/datasets/race/race_ppl.py
opencompass/configs/datasets/race/race_ppl_5831a0.py
opencompass/configs/datasets/race/race_ppl_a138cd.py
opencompass/configs/datasets/race/race_ppl_abed12.py
opencompass/configs/datasets/realtoxicprompts/__init__.py
opencompass/configs/datasets/realtoxicprompts/realtoxicprompts_gen.py
opencompass/configs/datasets/realtoxicprompts/realtoxicprompts_gen_7605e4.py
opencompass/configs/datasets/realtoxicprompts/realtoxicprompts_gen_ac723c.py
opencompass/configs/datasets/rolebench/__init__.py
opencompass/configs/datasets/rolebench/instruction_generalization_eng.py
opencompass/configs/datasets/rolebench/instruction_generalization_zh.py
opencompass/configs/datasets/rolebench/role_generalization_eng.py
opencompass/configs/datasets/s3eval/__init__.py
opencompass/configs/datasets/s3eval/s3eval_gen.py
opencompass/configs/datasets/s3eval/s3eval_gen_b8ac80.py
opencompass/configs/datasets/safety/__init__.py
opencompass/configs/datasets/safety/safety_gen.py
opencompass/configs/datasets/safety/safety_gen_7ce197.py
opencompass/configs/datasets/scibench/__init__.py
opencompass/configs/datasets/scibench/scibench_gen.py
opencompass/configs/datasets/scibench/scibench_gen_2b21f3.py
opencompass/configs/datasets/siqa/__init__.py
opencompass/configs/datasets/siqa/siqa_gen.py
opencompass/configs/datasets/siqa/siqa_gen_18632c.py
opencompass/configs/datasets/siqa/siqa_gen_e78df3.py
opencompass/configs/datasets/siqa/siqa_ppl.py
opencompass/configs/datasets/siqa/siqa_ppl_42bc6e.py
opencompass/configs/datasets/siqa/siqa_ppl_7845b0.py
opencompass/configs/datasets/siqa/siqa_ppl_ced5f6.py
opencompass/configs/datasets/siqa/siqa_ppl_e8d8c5.py
opencompass/configs/datasets/squad20/__init__.py
opencompass/configs/datasets/squad20/squad20_gen.py
opencompass/configs/datasets/squad20/squad20_gen_1710bc.py
opencompass/configs/datasets/storycloze/__init__.py
opencompass/configs/datasets/storycloze/storycloze_gen.py
opencompass/configs/datasets/storycloze/storycloze_gen_7f656a.py
opencompass/configs/datasets/storycloze/storycloze_ppl.py
opencompass/configs/datasets/storycloze/storycloze_ppl_496661.py
opencompass/configs/datasets/storycloze/storycloze_ppl_afd16f.py
opencompass/configs/datasets/strategyqa/__init__.py
opencompass/configs/datasets/strategyqa/strategyqa_gen.py
opencompass/configs/datasets/strategyqa/strategyqa_gen_1180a7.py
opencompass/configs/datasets/strategyqa/strategyqa_gen_934441.py
opencompass/configs/datasets/subjective/__init__.py
opencompass/configs/datasets/subjective/alignbench/__init__.py
opencompass/configs/datasets/subjective/alignbench/alignbench_judgeby_critiquellm.py
opencompass/configs/datasets/subjective/alignbench/alignbench_judgeby_critiquellm_new.py
opencompass/configs/datasets/subjective/alignbench/alignbench_v1_1_judgeby_critiquellm.py
opencompass/configs/datasets/subjective/alignbench/alignbench_v1_1_judgeby_critiquellm_new.py
opencompass/configs/datasets/subjective/alpaca_eval/__init__.py
opencompass/configs/datasets/subjective/alpaca_eval/alpacav2_judgeby_gpt4.py
opencompass/configs/datasets/subjective/alpaca_eval/alpacav2_judgeby_gpt4_new.py
opencompass/configs/datasets/subjective/arena_hard/__init__.py
opencompass/configs/datasets/subjective/arena_hard/arena_hard_compare.py
opencompass/configs/datasets/subjective/arena_hard/arena_hard_compare_new.py
opencompass/configs/datasets/subjective/compassarena/__init__.py
opencompass/configs/datasets/subjective/compassarena/compassarena_compare.py
opencompass/configs/datasets/subjective/compassarena/compassarena_compare_new.py
opencompass/configs/datasets/subjective/multiround/__init__.py
opencompass/configs/datasets/subjective/multiround/mtbench101_judge.py
opencompass/configs/datasets/subjective/multiround/mtbench101_judge_new.py
opencompass/configs/datasets/subjective/multiround/mtbench_single_judge_diff_temp.py
opencompass/configs/datasets/subjective/multiround/mtbench_single_judge_diff_temp_new.py
opencompass/configs/datasets/subjective/subjective_cmp/__init__.py
opencompass/configs/datasets/summedits/__init__.py
opencompass/configs/datasets/summedits/summedits_gen.py
opencompass/configs/datasets/summedits/summedits_gen_315438.py
opencompass/configs/datasets/summedits/summedits_gen_4fb38b.py
opencompass/configs/datasets/summedits/summedits_ppl.py
opencompass/configs/datasets/summedits/summedits_ppl_1fbeb6.py
opencompass/configs/datasets/summedits/summedits_ppl_3c30d0.py
opencompass/configs/datasets/summedits/summedits_ppl_fa58ba.py
opencompass/configs/datasets/summscreen/__init__.py
opencompass/configs/datasets/summscreen/summscreen_gen.py
opencompass/configs/datasets/summscreen/summscreen_gen_653185.py
opencompass/configs/datasets/summscreen/summscreen_gen_aa5eb3.py
opencompass/configs/datasets/taco/__init__.py
opencompass/configs/datasets/taco/taco_gen.py
opencompass/configs/datasets/taco/taco_gen_c7893a.py
opencompass/configs/datasets/taco/taco_levels_gen_411572.py
opencompass/configs/datasets/teval/__init__.py
opencompass/configs/datasets/teval/teval_en_gen.py
opencompass/configs/datasets/teval/teval_en_gen_1ac254.py
opencompass/configs/datasets/teval/teval_zh_gen.py
opencompass/configs/datasets/teval/teval_zh_gen_1ac254.py
opencompass/configs/datasets/teval_v2/__init__.py
opencompass/configs/datasets/teval_v2/teval_v2_en_gen.py
opencompass/configs/datasets/teval_v2/teval_v2_en_gen_1ac254.py
opencompass/configs/datasets/teval_v2/teval_v2_zh_gen.py
opencompass/configs/datasets/teval_v2/teval_v2_zh_gen_1ac254.py
opencompass/configs/datasets/triviaqa/__init__.py
opencompass/configs/datasets/triviaqa/triviaqa_gen.py
opencompass/configs/datasets/triviaqa/triviaqa_gen_0356ec.py
opencompass/configs/datasets/triviaqa/triviaqa_gen_2121ce.py
opencompass/configs/datasets/triviaqa/triviaqa_gen_3e39a5.py
opencompass/configs/datasets/triviaqa/triviaqa_gen_429db5.py
opencompass/configs/datasets/triviaqa/triviaqa_gen_d297bb.py
opencompass/configs/datasets/triviaqa/triviaqa_wiki_1shot_gen_20a989.py
opencompass/configs/datasets/triviaqa/triviaqa_wiki_1shot_gen_bc5f21.py
opencompass/configs/datasets/triviaqa/triviaqa_wiki_1shot_gen_eaf81e.py
opencompass/configs/datasets/triviaqa/triviaqa_wiki_gen_d18bf4.py
opencompass/configs/datasets/triviaqarc/__init__.py
opencompass/configs/datasets/triviaqarc/triviaqarc_gen.py
opencompass/configs/datasets/triviaqarc/triviaqarc_gen_a2d88a.py
opencompass/configs/datasets/triviaqarc/triviaqarc_gen_db6413.py
opencompass/configs/datasets/truthfulqa/__init__.py
opencompass/configs/datasets/truthfulqa/truthfulqa_gen.py
opencompass/configs/datasets/truthfulqa/truthfulqa_gen_1e7d8d.py
opencompass/configs/datasets/truthfulqa/truthfulqa_gen_5ddc62.py
opencompass/configs/datasets/tydiqa/__init__.py
opencompass/configs/datasets/tydiqa/tydiqa_gen.py
opencompass/configs/datasets/tydiqa/tydiqa_gen_978d2a.py
opencompass/configs/datasets/wikibench/__init__.py
opencompass/configs/datasets/wikibench/wikibench_few_shot_ppl_c23d79.py
opencompass/configs/datasets/wikibench/wikibench_gen.py
opencompass/configs/datasets/wikibench/wikibench_gen_0978ad.py
opencompass/configs/datasets/wikibench/wikibench_gen_f96ece.py
opencompass/configs/datasets/wikitext/__init__.py
opencompass/configs/datasets/wikitext/wikitext_103_raw_ppl.py
opencompass/configs/datasets/wikitext/wikitext_103_raw_ppl_752e2a.py
opencompass/configs/datasets/wikitext/wikitext_2_raw_ppl.py
opencompass/configs/datasets/wikitext/wikitext_2_raw_ppl_752e2a.py
opencompass/configs/datasets/winograd/__init__.py
opencompass/configs/datasets/winograd/winograd_ppl.py
opencompass/configs/datasets/winograd/winograd_ppl_8f3049.py
opencompass/configs/datasets/winograd/winograd_ppl_b6c7ed.py
opencompass/configs/datasets/winogrande/__init__.py
opencompass/configs/datasets/winogrande/deprecated_winogrande_gen_a9ede5.py
opencompass/configs/datasets/winogrande/winogrande_5shot_gen_6447e6.py
opencompass/configs/datasets/winogrande/winogrande_5shot_gen_b36770.py
opencompass/configs/datasets/winogrande/winogrande_5shot_ll_252f01.py
opencompass/configs/datasets/winogrande/winogrande_gen.py
opencompass/configs/datasets/winogrande/winogrande_gen_458220.py
opencompass/configs/datasets/winogrande/winogrande_gen_a027b6.py
opencompass/configs/datasets/winogrande/winogrande_ll.py
opencompass/configs/datasets/winogrande/winogrande_ll_c5cf57.py
opencompass/configs/datasets/winogrande/winogrande_ppl_55a66e.py
opencompass/configs/datasets/winogrande/winogrande_ppl_9307fd.py
opencompass/configs/datasets/xiezhi/__init__.py
opencompass/configs/datasets/xiezhi/xiezhi_gen.py
opencompass/configs/datasets/xiezhi/xiezhi_gen_b86cf5.py
opencompass/configs/datasets/xiezhi/xiezhi_ppl.py
opencompass/configs/datasets/xiezhi/xiezhi_ppl_ea6bd7.py
opencompass/configs/summarizers/PMMEval.py
opencompass/configs/summarizers/__init__.py
opencompass/configs/summarizers/agent_bench.py
opencompass/configs/summarizers/charm_reason.py
opencompass/configs/summarizers/chat_OC15.py
opencompass/configs/summarizers/chat_OC15_multi_faceted.py
opencompass/configs/summarizers/cibench.py
opencompass/configs/summarizers/code_passk.py
opencompass/configs/summarizers/compassbench_v1_1_objective.py
opencompass/configs/summarizers/compassbench_v1_1_objective_public.py
opencompass/configs/summarizers/compassbench_v1_3_objective.py
opencompass/configs/summarizers/compassbench_v1_objective.py
opencompass/configs/summarizers/contamination.py
opencompass/configs/summarizers/example.py
opencompass/configs/summarizers/infinitebench.py
opencompass/configs/summarizers/internlm2_keyset.py
opencompass/configs/summarizers/lawbench.py
opencompass/configs/summarizers/leaderboard.py
opencompass/configs/summarizers/leval.py
opencompass/configs/summarizers/longbench.py
opencompass/configs/summarizers/longeval_v2.py
opencompass/configs/summarizers/lveval.py
opencompass/configs/summarizers/math_agent.py
opencompass/configs/summarizers/math_baseline.py
opencompass/configs/summarizers/mathbench.py
opencompass/configs/summarizers/mathbench_v1.py
opencompass/configs/summarizers/medium.py
opencompass/configs/summarizers/mmlu_pro.py
opencompass/configs/summarizers/needlebench.py
opencompass/configs/summarizers/plugineval.py
opencompass/configs/summarizers/ruler.py
opencompass/configs/summarizers/scicode.py
opencompass/configs/summarizers/small.py
opencompass/configs/summarizers/subjective.py
opencompass/configs/summarizers/teval.py
opencompass/configs/summarizers/teval_v2.py
opencompass/configs/summarizers/tiny.py
opencompass/configs/summarizers/groups/GaokaoBench.py
opencompass/configs/summarizers/groups/MMLUArabic.py
opencompass/configs/summarizers/groups/PMMEval.py
opencompass/configs/summarizers/groups/__init__.py
opencompass/configs/summarizers/groups/agieval.py
opencompass/configs/summarizers/groups/bbh.py
opencompass/configs/summarizers/groups/calm.py
opencompass/configs/summarizers/groups/ceval.py
opencompass/configs/summarizers/groups/charm_reason.py
opencompass/configs/summarizers/groups/cibench.py
opencompass/configs/summarizers/groups/cmmlu.py
opencompass/configs/summarizers/groups/ds1000.py
opencompass/configs/summarizers/groups/flores.py
opencompass/configs/summarizers/groups/humanevalx.py
opencompass/configs/summarizers/groups/infinitebench.py
opencompass/configs/summarizers/groups/jigsaw_multilingual.py
opencompass/configs/summarizers/groups/lawbench.py
opencompass/configs/summarizers/groups/lcbench.py
opencompass/configs/summarizers/groups/leval.py
opencompass/configs/summarizers/groups/longbench.py
opencompass/configs/summarizers/groups/lveval.py
opencompass/configs/summarizers/groups/mathbench.py
opencompass/configs/summarizers/groups/mathbench_2024.py
opencompass/configs/summarizers/groups/mathbench_agent.py
opencompass/configs/summarizers/groups/mathbench_v1.py
opencompass/configs/summarizers/groups/mathbench_v1_2024.py
opencompass/configs/summarizers/groups/mathbench_v1_2024_lang.py
opencompass/configs/summarizers/groups/mgsm.py
opencompass/configs/summarizers/groups/mmlu.py
opencompass/configs/summarizers/groups/mmlu_pro.py
opencompass/configs/summarizers/groups/plugineval.py
opencompass/configs/summarizers/groups/ruler.py
opencompass/configs/summarizers/groups/scibench.py
opencompass/configs/summarizers/groups/scicode.py
opencompass/configs/summarizers/groups/teval.py
opencompass/configs/summarizers/groups/teval_v2.py
opencompass/configs/summarizers/groups/tydiqa.py
opencompass/configs/summarizers/groups/xiezhi.py
opencompass/configs/summarizers/groups/legacy/__init__.py
opencompass/configs/summarizers/groups/legacy/cibench.py
opencompass/datasets/FinanceIQ.py
opencompass/datasets/GaokaoBench.py
opencompass/datasets/LCBench.py
opencompass/datasets/MMLUArabic.py
opencompass/datasets/OpenFinData.py
opencompass/datasets/QuALITY.py
opencompass/datasets/__init__.py
opencompass/datasets/advglue.py
opencompass/datasets/afqmcd.py
opencompass/datasets/aime2024.py
opencompass/datasets/anli.py
opencompass/datasets/anthropics_evals.py
opencompass/datasets/apps.py
opencompass/datasets/arc.py
opencompass/datasets/arc_prize_public_evaluation.py
opencompass/datasets/ax.py
opencompass/datasets/base.py
opencompass/datasets/bbh.py
opencompass/datasets/benbench.py
opencompass/datasets/boolq.py
opencompass/datasets/bustum.py
opencompass/datasets/c3.py
opencompass/datasets/cb.py
opencompass/datasets/ceval.py
opencompass/datasets/charm.py
opencompass/datasets/chembench.py
opencompass/datasets/chid.py
opencompass/datasets/cibench.py
opencompass/datasets/circular.py
opencompass/datasets/civilcomments.py
opencompass/datasets/clozeTest_maxmin.py
opencompass/datasets/cluewsc.py
opencompass/datasets/cmb.py
opencompass/datasets/cmmlu.py
opencompass/datasets/cmnli.py
opencompass/datasets/cmo_fib.py
opencompass/datasets/cmrc.py
opencompass/datasets/commonsenseqa.py
opencompass/datasets/commonsenseqa_cn.py
opencompass/datasets/compassbench_obj.py
opencompass/datasets/copa.py
opencompass/datasets/crowspairs.py
opencompass/datasets/crowspairs_cn.py
opencompass/datasets/csl.py
opencompass/datasets/custom.py
opencompass/datasets/cvalues.py
opencompass/datasets/dingo.py
opencompass/datasets/drcd.py
opencompass/datasets/drop.py
opencompass/datasets/drop_simple_eval.py
opencompass/datasets/ds1000.py
opencompass/datasets/ds1000_interpreter.py
opencompass/datasets/eprstmt.py
opencompass/datasets/flores.py
opencompass/datasets/game24.py
opencompass/datasets/gaokao_math.py
opencompass/datasets/govrepcrs.py
opencompass/datasets/gpqa.py
opencompass/datasets/gsm8k.py
opencompass/datasets/gsm_hard.py
opencompass/datasets/hellaswag.py
opencompass/datasets/huggingface.py
opencompass/datasets/humaneval.py
opencompass/datasets/humaneval_multi.py
opencompass/datasets/humanevalx.py
opencompass/datasets/hungarian_math.py
opencompass/datasets/inference_ppl.py
opencompass/datasets/iwslt2017.py
opencompass/datasets/jigsawmultilingual.py
opencompass/datasets/jsonl.py
opencompass/datasets/kaoshi.py
opencompass/datasets/lambada.py
opencompass/datasets/lcsts.py
opencompass/datasets/llm_compression.py
opencompass/datasets/lmeval.py
opencompass/datasets/mastermath2024v1.py
opencompass/datasets/math.py
opencompass/datasets/math401.py
opencompass/datasets/math_intern.py
opencompass/datasets/mathbench.py
opencompass/datasets/mbpp.py
opencompass/datasets/mgsm.py
opencompass/datasets/mmlu.py
opencompass/datasets/mmlu_pro.py
opencompass/datasets/mmmlu.py
opencompass/datasets/multirc.py
opencompass/datasets/narrativeqa.py
opencompass/datasets/natural_question.py
opencompass/datasets/natural_question_cn.py
opencompass/datasets/obqa.py
opencompass/datasets/piqa.py
opencompass/datasets/py150.py
opencompass/datasets/qasper.py
opencompass/datasets/qaspercut.py
opencompass/datasets/race.py
opencompass/datasets/realtoxicprompts.py
opencompass/datasets/record.py
opencompass/datasets/rolebench.py
opencompass/datasets/s3eval.py
opencompass/datasets/safety.py
opencompass/datasets/scibench.py
opencompass/datasets/scicode.py
opencompass/datasets/simpleqa.py
opencompass/datasets/siqa.py
opencompass/datasets/squad20.py
opencompass/datasets/storycloze.py
opencompass/datasets/strategyqa.py
opencompass/datasets/summedits.py
opencompass/datasets/summscreen.py
opencompass/datasets/svamp.py
opencompass/datasets/tabmwp.py
opencompass/datasets/taco.py
opencompass/datasets/tnews.py
opencompass/datasets/triviaqa.py
opencompass/datasets/triviaqarc.py
opencompass/datasets/truthfulqa.py
opencompass/datasets/tydiqa.py
opencompass/datasets/wic.py
opencompass/datasets/wikibench.py
opencompass/datasets/winograd.py
opencompass/datasets/winogrande.py
opencompass/datasets/wnli.py
opencompass/datasets/wsc.py
opencompass/datasets/xcopa.py
opencompass/datasets/xiezhi.py
opencompass/datasets/xlsum.py
opencompass/datasets/xsum.py
opencompass/datasets/IFEval/__init__.py
opencompass/datasets/IFEval/evaluation_main.py
opencompass/datasets/IFEval/ifeval.py
opencompass/datasets/IFEval/instructions.py
opencompass/datasets/IFEval/instructions_registry.py
opencompass/datasets/IFEval/instructions_util.py
opencompass/datasets/NPHardEval/__init__.py
opencompass/datasets/NPHardEval/cmp_GCP_D.py
opencompass/datasets/NPHardEval/cmp_KSP.py
opencompass/datasets/NPHardEval/cmp_TSP_D.py
opencompass/datasets/NPHardEval/hard_GCP.py
opencompass/datasets/NPHardEval/hard_MSP.py
opencompass/datasets/NPHardEval/hard_TSP.py
opencompass/datasets/NPHardEval/p_BSP.py
opencompass/datasets/NPHardEval/p_EDP.py
opencompass/datasets/NPHardEval/p_SPP.py
opencompass/datasets/NPHardEval/prompts.py
opencompass/datasets/NPHardEval/utils.py
opencompass/datasets/PMMEval/__init__.py
opencompass/datasets/PMMEval/flores.py
opencompass/datasets/PMMEval/humanevalxl.py
opencompass/datasets/PMMEval/mgsm.py
opencompass/datasets/PMMEval/mhellaswag.py
opencompass/datasets/PMMEval/mifeval.py
opencompass/datasets/PMMEval/mlogiqa.py
opencompass/datasets/PMMEval/mmmlu.py
opencompass/datasets/PMMEval/xnli.py
opencompass/datasets/PMMEval/mifeval_utils/__init__.py
opencompass/datasets/PMMEval/mifeval_utils/combination_checker.py
opencompass/datasets/PMMEval/mifeval_utils/detectable_content_checker.py
opencompass/datasets/PMMEval/mifeval_utils/detectable_format_checker.py
opencompass/datasets/PMMEval/mifeval_utils/keywords_checker.py
opencompass/datasets/PMMEval/mifeval_utils/length_constraints_checker.py
opencompass/datasets/PMMEval/mifeval_utils/punctuation_checker.py
opencompass/datasets/PMMEval/mifeval_utils/startend_checker.py
opencompass/datasets/TheoremQA/__init__.py
opencompass/datasets/TheoremQA/legacy.py
opencompass/datasets/TheoremQA/main.py
opencompass/datasets/TheoremQA/number_utils.py
opencompass/datasets/TheoremQA/utils.py
opencompass/datasets/agieval/__init__.py
opencompass/datasets/agieval/agieval.py
opencompass/datasets/agieval/constructions.py
opencompass/datasets/agieval/dataset_loader.py
opencompass/datasets/agieval/evaluation.py
opencompass/datasets/agieval/math_equivalence.py
opencompass/datasets/agieval/post_process.py
opencompass/datasets/agieval/utils.py
opencompass/datasets/babilong/__init__.py
opencompass/datasets/babilong/babilong.py
opencompass/datasets/babilong/babilong_utils.py
opencompass/datasets/babilong/prompts.py
opencompass/datasets/calm/__init__.py
opencompass/datasets/calm/calm.py
opencompass/datasets/calm/data_processing/__init__.py
opencompass/datasets/calm/data_processing/generate_questions.py
opencompass/datasets/calm/data_processing/task_hiearchy.py
opencompass/datasets/calm/data_processing/prompt/AC-B_causal_judgement.py
opencompass/datasets/calm/data_processing/prompt/AR-B_CaLM-AR.py
opencompass/datasets/calm/data_processing/prompt/ATE.py
opencompass/datasets/calm/data_processing/prompt/BAS-B_backadj.py
opencompass/datasets/calm/data_processing/prompt/BAS-C_max-BAS.py
opencompass/datasets/calm/data_processing/prompt/BAS-C_min-BAS.py
opencompass/datasets/calm/data_processing/prompt/BAS-C_mix-BAS.py
opencompass/datasets/calm/data_processing/prompt/CA-B_FA.py
opencompass/datasets/calm/data_processing/prompt/CA-B_FP.py
opencompass/datasets/calm/data_processing/prompt/CB-B_collider-bias.py
opencompass/datasets/calm/data_processing/prompt/CDE.py
opencompass/datasets/calm/data_processing/prompt/CEG-O_E-CARE.py
opencompass/datasets/calm/data_processing/prompt/CEI-B.py
opencompass/datasets/calm/data_processing/prompt/CORR-B_correlation.py
opencompass/datasets/calm/data_processing/prompt/CR-B_det-counterfactual.py
opencompass/datasets/calm/data_processing/prompt/CR-C_CRASS.py
opencompass/datasets/calm/data_processing/prompt/EAE-B_exp-away.py
opencompass/datasets/calm/data_processing/prompt/ECI-B_CTB.py
opencompass/datasets/calm/data_processing/prompt/ECI-B_ESC.py
opencompass/datasets/calm/data_processing/prompt/ECI-B_MAVEN-ERE.py
opencompass/datasets/calm/data_processing/prompt/ETT.py
opencompass/datasets/calm/data_processing/prompt/FAS-C_FAS.py
opencompass/datasets/calm/data_processing/prompt/IV-C_CaLM-IV.py
opencompass/datasets/calm/data_processing/prompt/NDE.py
opencompass/datasets/calm/data_processing/prompt/NIE.py
opencompass/datasets/calm/data_processing/prompt/PCD-B_COPA.py
opencompass/datasets/calm/data_processing/prompt/PCD-B_E-CARE.py
opencompass/datasets/calm/data_processing/prompt/PCD-C_COPA.py
opencompass/datasets/calm/data_processing/prompt/PCD-C_E-CARE.py
opencompass/datasets/calm/data_processing/prompt/PN.py
opencompass/datasets/calm/data_processing/prompt/PS.py
opencompass/datasets/calm/data_processing/prompt/__init__.py
opencompass/datasets/calm/evaluation/__init__.py
opencompass/datasets/calm/evaluation/core_metrics.py
opencompass/datasets/calm/evaluation/errors.py
opencompass/datasets/calm/evaluation/accuracy/__init__.py
opencompass/datasets/calm/evaluation/accuracy/choice.py
opencompass/datasets/calm/evaluation/accuracy/open-ended.py
opencompass/datasets/calm/evaluation/accuracy/prob.py
opencompass/datasets/calm/evaluation/error/__init__.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/AC-B_causal_judgement.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/AR-B_CaLM-AR.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/AS.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/CA-B.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/CEI-B.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/CLADDER.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/CR-C_CRASS.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/ECI.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/Natural.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/PCD-B.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/PCD-C.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/Probability.py
opencompass/datasets/calm/evaluation/error/basic_adversarial/__init__.py
opencompass/datasets/calm/evaluation/labeling/AC-B_causal_judgement.py
opencompass/datasets/calm/evaluation/labeling/AR-B_CaLM-AR.py
opencompass/datasets/calm/evaluation/labeling/AS.py
opencompass/datasets/calm/evaluation/labeling/CA-B_FA.py
opencompass/datasets/calm/evaluation/labeling/CA-B_FP.py
opencompass/datasets/calm/evaluation/labeling/CEG-O_E-CARE.py
opencompass/datasets/calm/evaluation/labeling/CEI-B.py
opencompass/datasets/calm/evaluation/labeling/CLADDER.py
opencompass/datasets/calm/evaluation/labeling/CR-C_CRASS.py
opencompass/datasets/calm/evaluation/labeling/ECI.py
opencompass/datasets/calm/evaluation/labeling/Natural.py
opencompass/datasets/calm/evaluation/labeling/PCD-B.py
opencompass/datasets/calm/evaluation/labeling/PCD-C.py
opencompass/datasets/calm/evaluation/labeling/Probability.py
opencompass/datasets/calm/evaluation/labeling/__init__.py
opencompass/datasets/calm/evaluation/labeling/common_answers.py
opencompass/datasets/calm/utils/__init__.py
opencompass/datasets/calm/utils/load_items.py
opencompass/datasets/infinitebench/__init__.py
opencompass/datasets/infinitebench/infinitebench_codedebug.py
opencompass/datasets/infinitebench/infinitebench_coderun.py
opencompass/datasets/infinitebench/infinitebench_endia.py
opencompass/datasets/infinitebench/infinitebench_enmc.py
opencompass/datasets/infinitebench/infinitebench_enqa.py
opencompass/datasets/infinitebench/infinitebench_ensum.py
opencompass/datasets/infinitebench/infinitebench_mathcalc.py
opencompass/datasets/infinitebench/infinitebench_mathfind.py
opencompass/datasets/infinitebench/infinitebench_retrievekv.py
opencompass/datasets/infinitebench/infinitebench_retrievenumber.py
opencompass/datasets/infinitebench/infinitebench_retrievepasskey.py
opencompass/datasets/infinitebench/infinitebench_zhqa.py
opencompass/datasets/infinitebench/utils.py
opencompass/datasets/korbench/__init__.py
opencompass/datasets/korbench/korbench.py
opencompass/datasets/korbench/korbench_utils.py
opencompass/datasets/lawbench/__init__.py
opencompass/datasets/lawbench/lawbench.py
opencompass/datasets/lawbench/evaluation_functions/__init__.py
opencompass/datasets/lawbench/evaluation_functions/cjft.py
opencompass/datasets/lawbench/evaluation_functions/flzx.py
opencompass/datasets/lawbench/evaluation_functions/ftcs.py
opencompass/datasets/lawbench/evaluation_functions/jdzy.py
opencompass/datasets/lawbench/evaluation_functions/jec_ac.py
opencompass/datasets/lawbench/evaluation_functions/jec_kd.py
opencompass/datasets/lawbench/evaluation_functions/jetq.py
opencompass/datasets/lawbench/evaluation_functions/lblj.py
opencompass/datasets/lawbench/evaluation_functions/ljp_accusation.py
opencompass/datasets/lawbench/evaluation_functions/ljp_article.py
opencompass/datasets/lawbench/evaluation_functions/ljp_imprison.py
opencompass/datasets/lawbench/evaluation_functions/sjjc.py
opencompass/datasets/lawbench/evaluation_functions/wbfl.py
opencompass/datasets/lawbench/evaluation_functions/wsjd.py
opencompass/datasets/lawbench/evaluation_functions/xxcq.py
opencompass/datasets/lawbench/evaluation_functions/ydlj.py
opencompass/datasets/lawbench/evaluation_functions/yqzy.py
opencompass/datasets/lawbench/evaluation_functions/zxfl.py
opencompass/datasets/lawbench/utils/__init__.py
opencompass/datasets/lawbench/utils/char_smi.py
opencompass/datasets/lawbench/utils/compare_m2_for_evaluation.py
opencompass/datasets/lawbench/utils/comprehension_scores.py
opencompass/datasets/lawbench/utils/function_utils.py
opencompass/datasets/lawbench/utils/parallel_to_m2.py
opencompass/datasets/lawbench/utils/rc_f1.py
opencompass/datasets/lawbench/utils/modules/__init__.py
opencompass/datasets/lawbench/utils/modules/alignment.py
opencompass/datasets/lawbench/utils/modules/annotator.py
opencompass/datasets/lawbench/utils/modules/classifier.py
opencompass/datasets/lawbench/utils/modules/merger.py
opencompass/datasets/lawbench/utils/modules/tokenization.py
opencompass/datasets/lawbench/utils/modules/tokenizer.py
opencompass/datasets/leval/__init__.py
opencompass/datasets/leval/evaluators.py
opencompass/datasets/leval/leval_coursera.py
opencompass/datasets/leval/leval_financial_qa.py
opencompass/datasets/leval/leval_gov_report_summ.py
opencompass/datasets/leval/leval_gsm100.py
opencompass/datasets/leval/leval_legal_contract_qa.py
opencompass/datasets/leval/leval_meeting_summ.py
opencompass/datasets/leval/leval_multidoc_qa.py
opencompass/datasets/leval/leval_narrattive_qa.py
opencompass/datasets/leval/leval_natural_question.py
opencompass/datasets/leval/leval_news_summ.py
opencompass/datasets/leval/leval_paper_assistant.py
opencompass/datasets/leval/leval_patent_summ.py
opencompass/datasets/leval/leval_quality.py
opencompass/datasets/leval/leval_review_summ.py
opencompass/datasets/leval/leval_scientific_qa.py
opencompass/datasets/leval/leval_topic_retrieval.py
opencompass/datasets/leval/leval_tpo.py
opencompass/datasets/leval/leval_tvshow_summ.py
opencompass/datasets/livecodebench/__init__.py
opencompass/datasets/livecodebench/evaluator.py
opencompass/datasets/livecodebench/execute_utils.py
opencompass/datasets/livecodebench/extract_utils.py
opencompass/datasets/livecodebench/livecodebench.py
opencompass/datasets/livecodebench/pass_k_utils.py
opencompass/datasets/livecodebench/prompts.py
opencompass/datasets/livecodebench/testing_util.py
opencompass/datasets/longbench/__init__.py
opencompass/datasets/longbench/evaluators.py
opencompass/datasets/longbench/longbench_2wikim_qa.py
opencompass/datasets/longbench/longbench_dureader.py
opencompass/datasets/longbench/longbench_gov_report.py
opencompass/datasets/longbench/longbench_hotpot_qa.py
opencompass/datasets/longbench/longbench_lcc.py
opencompass/datasets/longbench/longbench_lsht.py
opencompass/datasets/longbench/longbench_multi_news.py
opencompass/datasets/longbench/longbench_multifieldqa_en.py
opencompass/datasets/longbench/longbench_multifieldqa_zh.py
opencompass/datasets/longbench/longbench_musique.py
opencompass/datasets/longbench/longbench_narrative_qa.py
opencompass/datasets/longbench/longbench_passage_count.py
opencompass/datasets/longbench/longbench_passage_retrieval_en.py
opencompass/datasets/longbench/longbench_passage_retrieval_zh.py
opencompass/datasets/longbench/longbench_qasper.py
opencompass/datasets/longbench/longbench_qmsum.py
opencompass/datasets/longbench/longbench_repobench.py
opencompass/datasets/longbench/longbench_samsum.py
opencompass/datasets/longbench/longbench_trec.py
opencompass/datasets/longbench/longbench_trivia_qa.py
opencompass/datasets/longbench/longbench_vcsum.py
opencompass/datasets/lveval/__init__.py
opencompass/datasets/lveval/evaluators.py
opencompass/datasets/lveval/lveval_cmrc_mixup.py
opencompass/datasets/lveval/lveval_dureader_mixup.py
opencompass/datasets/lveval/lveval_factrecall_en.py
opencompass/datasets/lveval/lveval_factrecall_zh.py
opencompass/datasets/lveval/lveval_hotpotwikiqa_mixup.py
opencompass/datasets/lveval/lveval_lic_mixup.py
opencompass/datasets/lveval/lveval_loogle_CR_mixup.py
opencompass/datasets/lveval/lveval_loogle_MIR_mixup.py
opencompass/datasets/lveval/lveval_loogle_SD_mixup.py
opencompass/datasets/lveval/lveval_multifieldqa_en_mixup.py
opencompass/datasets/lveval/lveval_multifieldqa_zh_mixup.py
opencompass/datasets/medbench/__init__.py
opencompass/datasets/medbench/constructions.py
opencompass/datasets/medbench/dataset_loader.py
opencompass/datasets/medbench/evaluation.py
opencompass/datasets/medbench/math_equivalence.py
opencompass/datasets/medbench/medbench.py
opencompass/datasets/medbench/post_process.py
opencompass/datasets/medbench/utils.py
opencompass/datasets/musr/__init__.py
opencompass/datasets/musr/murder_mystery_solved_ex.py
opencompass/datasets/musr/musr.py
opencompass/datasets/musr/object_placements_solved_ex.py
opencompass/datasets/musr/team_allocation_solved_ex.py
opencompass/datasets/musr/tree.py
opencompass/datasets/needlebench/__init__.py
opencompass/datasets/needlebench/atc.py
opencompass/datasets/needlebench/atc_choice.py
opencompass/datasets/needlebench/multi.py
opencompass/datasets/needlebench/origin.py
opencompass/datasets/needlebench/parallel.py
opencompass/datasets/reasonbench/ReasonBenchDataset.py
opencompass/datasets/reasonbench/__init__.py
opencompass/datasets/ruler/__init__.py
opencompass/datasets/ruler/ruler_cwe.py
opencompass/datasets/ruler/ruler_fwe.py
opencompass/datasets/ruler/ruler_niah.py
opencompass/datasets/ruler/ruler_qa.py
opencompass/datasets/ruler/ruler_vt.py
opencompass/datasets/subjective/__init__.py
opencompass/datasets/subjective/alignbench.py
opencompass/datasets/subjective/alpacaeval.py
opencompass/datasets/subjective/arena_hard.py
opencompass/datasets/subjective/compass_arena.py
opencompass/datasets/subjective/compass_arena_subjective_bench.py
opencompass/datasets/subjective/compassbench.py
opencompass/datasets/subjective/compassbench_checklist.py
opencompass/datasets/subjective/compassbench_control_length_bias.py
opencompass/datasets/subjective/corev2.py
opencompass/datasets/subjective/creationbench.py
opencompass/datasets/subjective/flames.py
opencompass/datasets/subjective/fofo.py
opencompass/datasets/subjective/followbench.py
opencompass/datasets/subjective/hellobench.py
opencompass/datasets/subjective/judgerbench.py
opencompass/datasets/subjective/mtbench.py
opencompass/datasets/subjective/mtbench101.py
opencompass/datasets/subjective/multiround.py
opencompass/datasets/subjective/subjective_cmp.py
opencompass/datasets/subjective/utils.py
opencompass/datasets/subjective/wildbench.py
opencompass/datasets/teval/__init__.py
opencompass/datasets/teval/schema.py
opencompass/datasets/teval/evaluators/__init__.py
opencompass/datasets/teval/evaluators/instruct_evaluator.py
opencompass/datasets/teval/evaluators/planning_evaluator.py
opencompass/datasets/teval/evaluators/reason_retrieve_understand_evaluator.py
opencompass/datasets/teval/evaluators/review_evaluator.py
opencompass/datasets/teval/utils/__init__.py
opencompass/datasets/teval/utils/convert_results.py
opencompass/datasets/teval/utils/format_load.py
opencompass/datasets/teval/utils/meta_template.py
opencompass/datasets/teval/utils/template.py
opencompass/metrics/__init__.py
opencompass/metrics/dump_results.py
opencompass/metrics/mme_score.py
opencompass/metrics/seedbench.py
opencompass/models/__init__.py
opencompass/models/accessory.py
opencompass/models/ai360_api.py
opencompass/models/alaya.py
opencompass/models/baichuan_api.py
opencompass/models/baidu_api.py
opencompass/models/bailing_api_oc.py
opencompass/models/base.py
opencompass/models/base_api.py
opencompass/models/bytedance_api.py
opencompass/models/claude_allesapin.py
opencompass/models/claude_sdk_api.py
opencompass/models/deepseek_api.py
opencompass/models/doubao.py
opencompass/models/doubao_api.py
opencompass/models/gemini_api.py
opencompass/models/glm.py
opencompass/models/huggingface.py
opencompass/models/huggingface_above_v4_33.py
opencompass/models/hunyuan_api.py
opencompass/models/intern_model.py
opencompass/models/interntrain.py
opencompass/models/krgpt_api.py
opencompass/models/lagent.py
opencompass/models/langchain.py
opencompass/models/lightllm_api.py
opencompass/models/llama2.py
opencompass/models/minimax_api.py
opencompass/models/mistral_api.py
opencompass/models/mixtral.py
opencompass/models/modelscope.py
opencompass/models/moonshot_api.py
opencompass/models/nanbeige_api.py
opencompass/models/openai_api.py
opencompass/models/pangu_api.py
opencompass/models/qwen_api.py
opencompass/models/rendu_api.py
opencompass/models/sensetime_api.py
opencompass/models/stepfun_api.py
opencompass/models/turbomind.py
opencompass/models/turbomind_api.py
opencompass/models/turbomind_with_tf_above_v4_33.py
opencompass/models/unigpt_api.py
opencompass/models/vllm.py
opencompass/models/vllm_with_tf_above_v4_33.py
opencompass/models/xunfei_api.py
opencompass/models/yayi_api.py
opencompass/models/yi_api.py
opencompass/models/zhipuai_api.py
opencompass/models/zhipuai_v2_api.py
opencompass/models/claude_api/__init__.py
opencompass/models/claude_api/claude_api.py
opencompass/models/claude_api/postprocessors.py
opencompass/openicl/__init__.py
opencompass/openicl/icl_dataset_reader.py
opencompass/openicl/icl_prompt_template.py
opencompass/openicl/icl_evaluator/__init__.py
opencompass/openicl/icl_evaluator/icl_agent_evaluator.py
opencompass/openicl/icl_evaluator/icl_aucroc_evaluator.py
opencompass/openicl/icl_evaluator/icl_base_evaluator.py
opencompass/openicl/icl_evaluator/icl_bpc_evaluator.py
opencompass/openicl/icl_evaluator/icl_circular_evaluator.py
opencompass/openicl/icl_evaluator/icl_em_evaluator.py
opencompass/openicl/icl_evaluator/icl_hf_evaluator.py
opencompass/openicl/icl_evaluator/icl_jieba_rouge_evaluator.py
opencompass/openicl/icl_evaluator/icl_korbench_evaluator.py
opencompass/openicl/icl_evaluator/icl_misc_evaluator.py
opencompass/openicl/icl_evaluator/icl_plugin_evaluator.py
opencompass/openicl/icl_evaluator/icl_toxic_evaluator.py
opencompass/openicl/icl_evaluator/lm_evaluator.py
opencompass/openicl/icl_evaluator/hf_metrics/__init__.py
opencompass/openicl/icl_evaluator/hf_metrics/accuracy.py
opencompass/openicl/icl_evaluator/hf_metrics/rouge.py
opencompass/openicl/icl_evaluator/hf_metrics/sacrebleu.py
opencompass/openicl/icl_evaluator/hf_metrics/squad.py
opencompass/openicl/icl_inferencer/__init__.py
opencompass/openicl/icl_inferencer/icl_agent_inferencer.py
opencompass/openicl/icl_inferencer/icl_attack_inferencer.py
opencompass/openicl/icl_inferencer/icl_base_inferencer.py
opencompass/openicl/icl_inferencer/icl_chat_inferencer.py
opencompass/openicl/icl_inferencer/icl_clp_inferencer.py
opencompass/openicl/icl_inferencer/icl_gen_inferencer.py
opencompass/openicl/icl_inferencer/icl_inference_ppl_only_inferencer.py
opencompass/openicl/icl_inferencer/icl_ll_inferencer.py
opencompass/openicl/icl_inferencer/icl_mink_percent_inferencer.py
opencompass/openicl/icl_inferencer/icl_ppl_inferencer.py
opencompass/openicl/icl_inferencer/icl_ppl_only_inferencer.py
opencompass/openicl/icl_inferencer/icl_sc_inferencer.py
opencompass/openicl/icl_inferencer/icl_sw_ce_loss_inferencer.py
opencompass/openicl/icl_inferencer/icl_tot_inferencer.py
opencompass/openicl/icl_retriever/__init__.py
opencompass/openicl/icl_retriever/icl_base_retriever.py
opencompass/openicl/icl_retriever/icl_bm25_retriever.py
opencompass/openicl/icl_retriever/icl_dpp_retriever.py
opencompass/openicl/icl_retriever/icl_fix_k_retriever.py
opencompass/openicl/icl_retriever/icl_mdl_retriever.py
opencompass/openicl/icl_retriever/icl_random_retriever.py
opencompass/openicl/icl_retriever/icl_sliding_k_retriever.py
opencompass/openicl/icl_retriever/icl_topk_retriever.py
opencompass/openicl/icl_retriever/icl_votek_retriever.py
opencompass/openicl/icl_retriever/icl_zero_retriever.py
opencompass/openicl/utils/__init__.py
opencompass/openicl/utils/logging.py
opencompass/partitioners/__init__.py
opencompass/partitioners/base.py
opencompass/partitioners/naive.py
opencompass/partitioners/num_worker.py
opencompass/partitioners/size.py
opencompass/partitioners/sub_naive.py
opencompass/partitioners/sub_num_worker.py
opencompass/partitioners/sub_size.py
opencompass/runners/__init__.py
opencompass/runners/base.py
opencompass/runners/dlc.py
opencompass/runners/local.py
opencompass/runners/local_api.py
opencompass/runners/slurm.py
opencompass/runners/slurm_sequential.py
opencompass/runners/volc.py
opencompass/summarizers/__init__.py
opencompass/summarizers/circular.py
opencompass/summarizers/default.py
opencompass/summarizers/default_subjective.py
opencompass/summarizers/llm_compression.py
opencompass/summarizers/multi_faceted.py
opencompass/summarizers/multi_model.py
opencompass/summarizers/needlebench.py
opencompass/summarizers/summarizer_pretrain.py
opencompass/summarizers/subjective/__init__.py
opencompass/summarizers/subjective/alignmentbench.py
opencompass/summarizers/subjective/all_obj.py
opencompass/summarizers/subjective/alpacaeval.py
opencompass/summarizers/subjective/arenahard.py
opencompass/summarizers/subjective/charm.py
opencompass/summarizers/subjective/common_summarizer.py
opencompass/summarizers/subjective/compass_arena.py
opencompass/summarizers/subjective/compassbench.py
opencompass/summarizers/subjective/compassbench_v13.py
opencompass/summarizers/subjective/corev2.py
opencompass/summarizers/subjective/creationbench.py
opencompass/summarizers/subjective/flames.py
opencompass/summarizers/subjective/fofo.py
opencompass/summarizers/subjective/followbench.py
opencompass/summarizers/subjective/mtbench.py
opencompass/summarizers/subjective/mtbench101.py
opencompass/summarizers/subjective/multiround.py
opencompass/summarizers/subjective/subjective.py
opencompass/summarizers/subjective/subjective_post_process.py
opencompass/summarizers/subjective/utils.py
opencompass/summarizers/subjective/wildbench.py
opencompass/tasks/__init__.py
opencompass/tasks/base.py
opencompass/tasks/llm_eval.py
opencompass/tasks/openicl_attack.py
opencompass/tasks/openicl_eval.py
opencompass/tasks/openicl_infer.py
opencompass/tasks/subjective_eval.py
opencompass/utils/__init__.py
opencompass/utils/abbr.py
opencompass/utils/auxiliary.py
opencompass/utils/build.py
opencompass/utils/clients.py
opencompass/utils/collect_env.py
opencompass/utils/datasets.py
opencompass/utils/datasets_info.py
opencompass/utils/dependency.py
opencompass/utils/dict_postprocessors.py
opencompass/utils/file.py
opencompass/utils/fileio.py
opencompass/utils/lark.py
opencompass/utils/logging.py
opencompass/utils/menu.py
opencompass/utils/model_postprocessors.py
opencompass/utils/prompt.py
opencompass/utils/run.py
opencompass/utils/text_postprocessors.py
opencompass/utils/types.py
opencompass/utils/postprocessors/__init__.py
opencompass/utils/postprocessors/naive/PROMPT_TEMPLATE.py
opencompass/utils/postprocessors/naive/__init__.py
opencompass/utils/postprocessors/naive/extractor.py
opencompass/utils/postprocessors/xfinder/__init__.py
opencompass/utils/postprocessors/xfinder/extractor.py
opencompass/utils/postprocessors/xfinder/xfinder_utils/PROMPT_TEMPLATE.py
opencompass/utils/postprocessors/xfinder/xfinder_utils/__init__.py
opencompass/utils/postprocessors/xfinder/xfinder_utils/convert_data.py
opencompass/utils/postprocessors/xfinder/xfinder_utils/data_process.py