File size: 14,647 Bytes
256a159 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 |
20240305_153409 tabulate format ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ dataset version metric mode llama-7b-hf ------------------------------------------------- --------- -------- ------ ------------- ceval-computer_network - - - - ceval-operating_system - - - - ceval-computer_architecture - - - - ceval-college_programming - - - - ceval-college_physics - - - - ceval-college_chemistry - - - - ceval-advanced_mathematics - - - - ceval-probability_and_statistics - - - - ceval-discrete_mathematics - - - - ceval-electrical_engineer - - - - ceval-metrology_engineer - - - - ceval-high_school_mathematics - - - - ceval-high_school_physics - - - - ceval-high_school_chemistry - - - - ceval-high_school_biology - - - - ceval-middle_school_mathematics - - - - ceval-middle_school_biology - - - - ceval-middle_school_physics - - - - ceval-middle_school_chemistry - - - - ceval-veterinary_medicine - - - - ceval-college_economics - - - - ceval-business_administration - - - - ceval-marxism - - - - ceval-mao_zedong_thought - - - - ceval-education_science - - - - ceval-teacher_qualification - - - - ceval-high_school_politics - - - - ceval-high_school_geography - - - - ceval-middle_school_politics - - - - ceval-middle_school_geography - - - - ceval-modern_chinese_history - - - - ceval-ideological_and_moral_cultivation - - - - ceval-logic - - - - ceval-law - - - - ceval-chinese_language_and_literature - - - - ceval-art_studies - - - - ceval-professional_tour_guide - - - - ceval-legal_professional - - - - ceval-high_school_chinese - - - - ceval-high_school_history - - - - ceval-middle_school_history - - - - ceval-civil_servant - - - - ceval-sports_science - - - - ceval-plant_protection - - - - ceval-basic_medicine - - - - ceval-clinical_medicine - - - - ceval-urban_and_rural_planner - - - - ceval-accountant - - - - ceval-fire_engineer - - - - ceval-environmental_impact_assessment_engineer - - - - ceval-tax_accountant - - - - ceval-physician - - - - lukaemon_mmlu_college_biology - - - - lukaemon_mmlu_college_chemistry - - - - lukaemon_mmlu_college_computer_science - - - - lukaemon_mmlu_college_mathematics - - - - lukaemon_mmlu_college_physics - - - - lukaemon_mmlu_electrical_engineering - - - - lukaemon_mmlu_astronomy - - - - lukaemon_mmlu_anatomy - - - - lukaemon_mmlu_abstract_algebra - - - - lukaemon_mmlu_machine_learning - - - - lukaemon_mmlu_clinical_knowledge - - - - lukaemon_mmlu_global_facts - - - - lukaemon_mmlu_management - - - - lukaemon_mmlu_nutrition - - - - lukaemon_mmlu_marketing - - - - lukaemon_mmlu_professional_accounting - - - - lukaemon_mmlu_high_school_geography - - - - lukaemon_mmlu_international_law - - - - lukaemon_mmlu_moral_scenarios - - - - lukaemon_mmlu_computer_security - - - - lukaemon_mmlu_high_school_microeconomics - - - - lukaemon_mmlu_professional_law - - - - lukaemon_mmlu_medical_genetics - - - - lukaemon_mmlu_professional_psychology - - - - lukaemon_mmlu_jurisprudence - - - - lukaemon_mmlu_world_religions - - - - lukaemon_mmlu_philosophy - - - - lukaemon_mmlu_virology - - - - lukaemon_mmlu_high_school_chemistry - - - - lukaemon_mmlu_public_relations - - - - lukaemon_mmlu_high_school_macroeconomics - - - - lukaemon_mmlu_human_sexuality - - - - lukaemon_mmlu_elementary_mathematics - - - - lukaemon_mmlu_high_school_physics - - - - lukaemon_mmlu_high_school_computer_science - - - - lukaemon_mmlu_high_school_european_history - - - - lukaemon_mmlu_business_ethics - - - - lukaemon_mmlu_moral_disputes - - - - lukaemon_mmlu_high_school_statistics - - - - lukaemon_mmlu_miscellaneous - - - - lukaemon_mmlu_formal_logic - - - - lukaemon_mmlu_high_school_government_and_politics - - - - lukaemon_mmlu_prehistory - - - - lukaemon_mmlu_security_studies - - - - lukaemon_mmlu_high_school_biology - - - - lukaemon_mmlu_logical_fallacies - - - - lukaemon_mmlu_high_school_world_history - - - - lukaemon_mmlu_professional_medicine - - - - lukaemon_mmlu_high_school_mathematics - - - - lukaemon_mmlu_college_medicine - - - - lukaemon_mmlu_high_school_us_history - - - - lukaemon_mmlu_sociology - - - - lukaemon_mmlu_econometrics - - - - lukaemon_mmlu_high_school_psychology - - - - lukaemon_mmlu_human_aging - - - - lukaemon_mmlu_us_foreign_policy - - - - lukaemon_mmlu_conceptual_physics - - - - $$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$ -------------------------------------------------------------------------------------------------------------------------------- THIS IS A DIVIDER -------------------------------------------------------------------------------------------------------------------------------- csv format ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ dataset,version,metric,mode,llama-7b-hf ceval-computer_network,-,-,-,- ceval-operating_system,-,-,-,- ceval-computer_architecture,-,-,-,- ceval-college_programming,-,-,-,- ceval-college_physics,-,-,-,- ceval-college_chemistry,-,-,-,- ceval-advanced_mathematics,-,-,-,- ceval-probability_and_statistics,-,-,-,- ceval-discrete_mathematics,-,-,-,- ceval-electrical_engineer,-,-,-,- ceval-metrology_engineer,-,-,-,- ceval-high_school_mathematics,-,-,-,- ceval-high_school_physics,-,-,-,- ceval-high_school_chemistry,-,-,-,- ceval-high_school_biology,-,-,-,- ceval-middle_school_mathematics,-,-,-,- ceval-middle_school_biology,-,-,-,- ceval-middle_school_physics,-,-,-,- ceval-middle_school_chemistry,-,-,-,- ceval-veterinary_medicine,-,-,-,- ceval-college_economics,-,-,-,- ceval-business_administration,-,-,-,- ceval-marxism,-,-,-,- ceval-mao_zedong_thought,-,-,-,- ceval-education_science,-,-,-,- ceval-teacher_qualification,-,-,-,- ceval-high_school_politics,-,-,-,- ceval-high_school_geography,-,-,-,- ceval-middle_school_politics,-,-,-,- ceval-middle_school_geography,-,-,-,- ceval-modern_chinese_history,-,-,-,- ceval-ideological_and_moral_cultivation,-,-,-,- ceval-logic,-,-,-,- ceval-law,-,-,-,- ceval-chinese_language_and_literature,-,-,-,- ceval-art_studies,-,-,-,- ceval-professional_tour_guide,-,-,-,- ceval-legal_professional,-,-,-,- ceval-high_school_chinese,-,-,-,- ceval-high_school_history,-,-,-,- ceval-middle_school_history,-,-,-,- ceval-civil_servant,-,-,-,- ceval-sports_science,-,-,-,- ceval-plant_protection,-,-,-,- ceval-basic_medicine,-,-,-,- ceval-clinical_medicine,-,-,-,- ceval-urban_and_rural_planner,-,-,-,- ceval-accountant,-,-,-,- ceval-fire_engineer,-,-,-,- ceval-environmental_impact_assessment_engineer,-,-,-,- ceval-tax_accountant,-,-,-,- ceval-physician,-,-,-,- lukaemon_mmlu_college_biology,-,-,-,- lukaemon_mmlu_college_chemistry,-,-,-,- lukaemon_mmlu_college_computer_science,-,-,-,- lukaemon_mmlu_college_mathematics,-,-,-,- lukaemon_mmlu_college_physics,-,-,-,- lukaemon_mmlu_electrical_engineering,-,-,-,- lukaemon_mmlu_astronomy,-,-,-,- lukaemon_mmlu_anatomy,-,-,-,- lukaemon_mmlu_abstract_algebra,-,-,-,- lukaemon_mmlu_machine_learning,-,-,-,- lukaemon_mmlu_clinical_knowledge,-,-,-,- lukaemon_mmlu_global_facts,-,-,-,- lukaemon_mmlu_management,-,-,-,- lukaemon_mmlu_nutrition,-,-,-,- lukaemon_mmlu_marketing,-,-,-,- lukaemon_mmlu_professional_accounting,-,-,-,- lukaemon_mmlu_high_school_geography,-,-,-,- lukaemon_mmlu_international_law,-,-,-,- lukaemon_mmlu_moral_scenarios,-,-,-,- lukaemon_mmlu_computer_security,-,-,-,- lukaemon_mmlu_high_school_microeconomics,-,-,-,- lukaemon_mmlu_professional_law,-,-,-,- lukaemon_mmlu_medical_genetics,-,-,-,- lukaemon_mmlu_professional_psychology,-,-,-,- lukaemon_mmlu_jurisprudence,-,-,-,- lukaemon_mmlu_world_religions,-,-,-,- lukaemon_mmlu_philosophy,-,-,-,- lukaemon_mmlu_virology,-,-,-,- lukaemon_mmlu_high_school_chemistry,-,-,-,- lukaemon_mmlu_public_relations,-,-,-,- lukaemon_mmlu_high_school_macroeconomics,-,-,-,- lukaemon_mmlu_human_sexuality,-,-,-,- lukaemon_mmlu_elementary_mathematics,-,-,-,- lukaemon_mmlu_high_school_physics,-,-,-,- lukaemon_mmlu_high_school_computer_science,-,-,-,- lukaemon_mmlu_high_school_european_history,-,-,-,- lukaemon_mmlu_business_ethics,-,-,-,- lukaemon_mmlu_moral_disputes,-,-,-,- lukaemon_mmlu_high_school_statistics,-,-,-,- lukaemon_mmlu_miscellaneous,-,-,-,- lukaemon_mmlu_formal_logic,-,-,-,- lukaemon_mmlu_high_school_government_and_politics,-,-,-,- lukaemon_mmlu_prehistory,-,-,-,- lukaemon_mmlu_security_studies,-,-,-,- lukaemon_mmlu_high_school_biology,-,-,-,- lukaemon_mmlu_logical_fallacies,-,-,-,- lukaemon_mmlu_high_school_world_history,-,-,-,- lukaemon_mmlu_professional_medicine,-,-,-,- lukaemon_mmlu_high_school_mathematics,-,-,-,- lukaemon_mmlu_college_medicine,-,-,-,- lukaemon_mmlu_high_school_us_history,-,-,-,- lukaemon_mmlu_sociology,-,-,-,- lukaemon_mmlu_econometrics,-,-,-,- lukaemon_mmlu_high_school_psychology,-,-,-,- lukaemon_mmlu_human_aging,-,-,-,- lukaemon_mmlu_us_foreign_policy,-,-,-,- lukaemon_mmlu_conceptual_physics,-,-,-,- $$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$ -------------------------------------------------------------------------------------------------------------------------------- THIS IS A DIVIDER -------------------------------------------------------------------------------------------------------------------------------- raw format ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ ------------------------------- Model: llama-7b-hf $$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$$ |