# Subject name -> list of tags. The first tag is the subject's discipline;
# some subjects carry an additional "china specific" tag.
subcategories = {
    "agronomy": ["other"],
    "anatomy": ["biology"],
    "ancient_chinese": ["linguistics", "china specific"],
    "arts": ["arts"],
    "astronomy": ["physics"],
    "business_ethics": ["business"],
    "chinese_civil_service_exam": ["politics", "china specific"],
    "chinese_driving_rule": ["other", "china specific"],
    "chinese_food_culture": ["culture", "china specific"],
    "chinese_foreign_policy": ["politics", "china specific"],
    "chinese_history": ["history", "china specific"],
    "chinese_literature": ["literature", "china specific"],
    "chinese_teacher_qualification": ["education", "china specific"],
    "college_actuarial_science": ["math"],
    "college_education": ["education"],
    "college_engineering_hydrology": ["engineering"],
    "college_law": ["law"],
    "college_mathematics": ["math"],
    "college_medical_statistics": ["statistics"],
    "clinical_knowledge": ["other"],
    "college_medicine": ["other"],
    "computer_science": ["computer science"],
    "computer_security": ["other"],
    "conceptual_physics": ["physics"],
    "construction_project_management": ["other", "china specific"],
    "economics": ["economics"],
    "education": ["education"],
    "elementary_chinese": ["linguistics", "china specific"],
    "elementary_commonsense": ["other", "china specific"],
    "elementary_information_and_technology": ["other"],
    "electrical_engineering": ["engineering"],
    "elementary_mathematics": ["math"],
    "ethnology": ["culture", "china specific"],
    "food_science": ["other"],
    "genetics": ["biology"],
    "global_facts": ["global"],
    "high_school_biology": ["biology"],
    "high_school_chemistry": ["chemistry"],
    "high_school_geography": ["geography"],
    "high_school_mathematics": ["math"],
    "high_school_physics": ["physics"],
    "high_school_politics": ["politics", "china specific"],
    "human_sexuality": ["other"],
    "international_law": ["law"],
    "journalism": ["sociology"],
    "jurisprudence": ["law"],
    "legal_and_moral_basis": ["other"],
    "logical": ["philosophy"],
    "machine_learning": ["computer science"],
    "management": ["business"],
    "marketing": ["business"],
    "marxist_theory": ["philosophy"],
    "modern_chinese": ["linguistics", "china specific"],
    "nutrition": ["other"],
    "philosophy": ["philosophy"],
    "professional_accounting": ["business"],
    "professional_law": ["law"],
    "professional_medicine": ["other"],
    "professional_psychology": ["psychology"],
    "public_relations": ["politics"],
    "security_study": ["politics"],
    "sociology": ["culture"],
    "sports_science": ["other"],
    "traditional_chinese_medicine": ["other", "china specific"],
    "virology": ["biology"],
    "world_history": ["history"],
    "world_religions": ["global"],
}

# Top-level category -> the tags (as used in `subcategories`) that belong to it.
categories = {
    "STEM": [
        "physics",
        "chemistry",
        "biology",
        "computer science",
        "math",
        "engineering",
        "statistics",
    ],
    "Humanities": [
        "history",
        "philosophy",
        "law",
        "arts",
        "literature",
        "global",
    ],
    "Social Science": [
        "linguistics",
        "business",
        "politics",
        "culture",
        "economics",
        "geography",
        "psychology",
        "education",
        "sociology",
    ],
    "Other": ["other"],
    "China specific": ["china specific"],
}

# Invert the two tables above: top-level category -> subjects having at least
# one tag in that category. Subjects are appended once per matching tag, in
# `subcategories` order. The loop variable names are kept unchanged because,
# at module level, they remain visible as module globals after the loop ends.
category2subject = {}
for k, v in categories.items():
    for subject, subcat in subcategories.items():
        for c in subcat:
            if c not in v:
                continue
            if k not in category2subject:
                category2subject[k] = []
            category2subject[k].append(subject)

# Per-category subset names: every subject name prefixed with "cmmlu-".
_cmmlu_humanities = ["cmmlu-" + name for name in category2subject["Humanities"]]
_cmmlu_stem = ["cmmlu-" + name for name in category2subject["STEM"]]
_cmmlu_social_science = ["cmmlu-" + name for name in category2subject["Social Science"]]
_cmmlu_other = ["cmmlu-" + name for name in category2subject["Other"]]
_cmmlu_china_specific = ["cmmlu-" + name for name in category2subject["China specific"]]
# The overall group covers every subject, in `subcategories` order.
_cmmlu_all = ["cmmlu-" + name for name in subcategories]

# One entry per group: a group name plus the list of subset names it contains.
cmmlu_summary_groups = [
    {"name": "cmmlu-humanities", "subsets": _cmmlu_humanities},
    {"name": "cmmlu-stem", "subsets": _cmmlu_stem},
    {"name": "cmmlu-social-science", "subsets": _cmmlu_social_science},
    {"name": "cmmlu-other", "subsets": _cmmlu_other},
    {"name": "cmmlu-china-specific", "subsets": _cmmlu_china_specific},
    {"name": "cmmlu", "subsets": _cmmlu_all},
]