Yeyito committed on
Commit
1eac270
•
1 Parent(s): e41a7dd

reverted again

Browse files
Files changed (1) hide show
  1. data/code_eval_board.csv +30 -30
data/code_eval_board.csv CHANGED
@@ -1,32 +1,32 @@
1
  T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
2
- 🟒,roneneldan/TinyStories-3M,0.06,0.1,0.13,0.2,NaN,0,huggyllama/llama-7b
3
- 🟒,roneneldan/TinyStories-1M,0.05,0.11,0.09,0.17,NaN,0,huggyllama/llama-7b
4
- πŸ”Ά,Fredithefish/ReasonixPajama-3B-HF,0.15,0.24,0.21,0.94,NaN,0.44,huggyllama/llama-7b
5
- 🟒,mistralai/Mistral-7B-v0.1,0.54,0.51,0.46,0.75,NaN,0.91,huggyllama/llama-7b
6
- πŸ”Ά,rishiraj/meow,0.11,0.49,0.28,0.36,NaN,0.95,huggyllama/llama-7b
7
- πŸ”Ά,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,NaN,0.99,huggyllama/llama-7b
8
- πŸ”Ά,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,NaN,0.96,huggyllama/llama-7b
9
- πŸ”Ά,AIDC-ai-business/Marcoroni-7B-v3,0.1,0.14,0.2,0.41,NaN,0.95,mistralai/Mistral-7B-v0.1
10
- πŸ”Ά,amazon/MistralLite,0.09,0.14,0.2,0.43,NaN,0.73,mistralai/Mistral-7B-v0.1
11
- πŸ”Ά,openchat/openchat_3.5,0.13,0.13,0.23,0.45,NaN,0.97,mistralai/Mistral-7B-v0.1
12
- πŸ”Ά,meta-math/MetaMath-Mistral-7B,0.08,0.1,0.17,0.42,NaN,0.97,mistralai/Mistral-7B-v0.1
13
- πŸ”Ά,teknium/OpenHermes-2.5-Mistral-7B,0.07,0.13,0.23,0.39,NaN,0.96,mistralai/Mistral-7B-v0.1
14
- πŸ”Ά,microsoft/Orca-2-7b,0.88,0.8,0.77,0.91,NaN,1.0,mistralai/Mistral-7B-v0.1
15
- πŸ”Ά,WizardLM/WizardMath-7B-V1.1,0.1,0.11,0.21,0.4,NaN,0.99,mistralai/Mistral-7B-v0.1
16
- πŸ”Ά,01-ai/Yi-6B-200K,0.19,0.3,0.3,0.6,NaN,0.93,mistralai/Mistral-7B-v0.1
17
- πŸ”Ά,Intel/neural-chat-7b-v3-3,0.06,0.15,0.18,0.47,NaN,0.98,mistralai/Mistral-7B-v0.1
18
- πŸ”Ά,mistralai/Mistral-7B-Instruct-v0.2,0.06,0.21,0.17,0.48,NaN,0.95,mistralai/Mistral-7B-v0.1
19
- πŸ”Ά,Yhyu13/LMCocktail-10.7B-v1,0.1,0.44,0.23,0.51,NaN,0.97,mistralai/Mistral-7B-v0.1
20
- πŸ”Ά,ehartford/dolphin-2.1-mistral-7b,0.08,0.1,0.2,0.4,NaN,0.92,mistralai/Mistral-7B-v0.1
21
- πŸ”Ά,openchat/openchat-3.5-1210,0.1,0.12,0.2,0.4,NaN,0.98,mistralai/Mistral-7B-v0.1
22
- πŸ”Ά,HuggingFaceH4/zephyr-7b-beta,0.06,0.15,0.18,0.37,NaN,0.82,mistralai/Mistral-7B-v0.1
23
- πŸ”Ά,berkeley-nest/Starling-LM-7B-alpha,0.1,0.13,0.19,0.39,NaN,0.97,mistralai/Mistral-7B-v0.1
24
- πŸ”Ά,Sao10K/Ana-v1-m7,0.11,0.12,0.19,0.41,NaN,0.84,mistralai/Mistral-7B-v0.1
25
- πŸ”Ά,Open-Orca/Mistral-7B-OpenOrca,0.08,0.14,0.17,0.36,NaN,0.92,mistralai/Mistral-7B-v0.1
26
- πŸ”Ά,jondurbin/bagel-dpo-7b-v0.1,0.12,0.14,0.21,0.47,NaN,0.91,mistralai/Mistral-7B-v0.1
27
- πŸ”Ά,rwitz/go-bruins-v2,0.09,0.13,0.18,0.4,NaN,0.95,mistralai/Mistral-7B-v0.1
28
- πŸ”Ά,EmbeddedLLM/Mistral-7B-Merge-14-v0.3,0.09,0.11,0.18,0.39,NaN,0.95,mistralai/Mistral-7B-v0.1
29
- πŸ”Ά,chargoddard/loyal-piano-m7,0.11,0.13,0.19,0.45,NaN,0.97,mistralai/Mistral-7B-v0.1
30
- πŸ”Ά,rishiraj/CatPPT,0.09,0.12,0.19,0.44,NaN,0.98,mistralai/Mistral-7B-v0.1
31
- πŸ”Ά,togethercomputer/RedPajama-INCITE-Instruct-3B-v1,0.08,0.12,0.19,0.43,NaN,0.77,mistralai/Mistral-7B-v0.1
32
 
 
1
  T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
2
+ 🟒,roneneldan/TinyStories-3M,0.06,0.1,0.13,0.2,0.01,0,huggyllama/llama-7b
3
+ 🟒,roneneldan/TinyStories-1M,0.05,0.11,0.09,0.17,0.01,0,huggyllama/llama-7b
4
+ πŸ”Ά,Fredithefish/ReasonixPajama-3B-HF,0.15,0.24,0.21,0.94,0.01,0.44,huggyllama/llama-7b
5
+ 🟒,mistralai/Mistral-7B-v0.1,0.54,0.51,0.46,0.75,0,0.91,huggyllama/llama-7b
6
+ πŸ”Ά,rishiraj/meow,0.11,0.49,0.28,0.36,0.02,0.95,huggyllama/llama-7b
7
+ πŸ”Ά,Q-bert/MetaMath-Cybertron-Starling,0.52,0.64,0.51,0.75,0.01,0.99,huggyllama/llama-7b
8
+ πŸ”Ά,upstage/SOLAR-10.7B-Instruct-v1.0,0.11,0.49,0.28,0.36,0.01,0.96,huggyllama/llama-7b
9
+ πŸ”Ά,AIDC-ai-business/Marcoroni-7B-v3,0.1,0.14,0.2,0.41,0.0,0.95,mistralai/Mistral-7B-v0.1
10
+ πŸ”Ά,amazon/MistralLite,0.09,0.14,0.2,0.43,0.0,0.73,mistralai/Mistral-7B-v0.1
11
+ πŸ”Ά,openchat/openchat_3.5,0.13,0.13,0.23,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
12
+ πŸ”Ά,meta-math/MetaMath-Mistral-7B,0.08,0.1,0.17,0.42,0.0,0.97,mistralai/Mistral-7B-v0.1
13
+ πŸ”Ά,teknium/OpenHermes-2.5-Mistral-7B,0.07,0.13,0.23,0.39,0.0,0.96,mistralai/Mistral-7B-v0.1
14
+ πŸ”Ά,microsoft/Orca-2-7b,0.88,0.8,0.77,0.91,0.0,1.0,mistralai/Mistral-7B-v0.1
15
+ πŸ”Ά,WizardLM/WizardMath-7B-V1.1,0.1,0.11,0.21,0.4,0.0,0.99,mistralai/Mistral-7B-v0.1
16
+ πŸ”Ά,01-ai/Yi-6B-200K,0.19,0.3,0.3,0.6,0.0,0.93,mistralai/Mistral-7B-v0.1
17
+ πŸ”Ά,Intel/neural-chat-7b-v3-3,0.06,0.15,0.18,0.47,0.0,0.98,mistralai/Mistral-7B-v0.1
18
+ πŸ”Ά,mistralai/Mistral-7B-Instruct-v0.2,0.06,0.21,0.17,0.48,0.0,0.95,mistralai/Mistral-7B-v0.1
19
+ πŸ”Ά,Yhyu13/LMCocktail-10.7B-v1,0.1,0.44,0.23,0.51,0.0,0.97,mistralai/Mistral-7B-v0.1
20
+ πŸ”Ά,ehartford/dolphin-2.1-mistral-7b,0.08,0.1,0.2,0.4,0.0,0.92,mistralai/Mistral-7B-v0.1
21
+ πŸ”Ά,openchat/openchat-3.5-1210,0.1,0.12,0.2,0.4,0.0,0.98,mistralai/Mistral-7B-v0.1
22
+ πŸ”Ά,HuggingFaceH4/zephyr-7b-beta,0.06,0.15,0.18,0.37,0.0,0.82,mistralai/Mistral-7B-v0.1
23
+ πŸ”Ά,berkeley-nest/Starling-LM-7B-alpha,0.1,0.13,0.19,0.39,0.0,0.97,mistralai/Mistral-7B-v0.1
24
+ πŸ”Ά,Sao10K/Ana-v1-m7,0.11,0.12,0.19,0.41,0.0,0.84,mistralai/Mistral-7B-v0.1
25
+ πŸ”Ά,Open-Orca/Mistral-7B-OpenOrca,0.08,0.14,0.17,0.36,0.0,0.92,mistralai/Mistral-7B-v0.1
26
+ πŸ”Ά,jondurbin/bagel-dpo-7b-v0.1,0.12,0.14,0.21,0.47,0.0,0.91,mistralai/Mistral-7B-v0.1
27
+ πŸ”Ά,rwitz/go-bruins-v2,0.09,0.13,0.18,0.4,0.0,0.95,mistralai/Mistral-7B-v0.1
28
+ πŸ”Ά,EmbeddedLLM/Mistral-7B-Merge-14-v0.3,0.09,0.11,0.18,0.39,0.0,0.95,mistralai/Mistral-7B-v0.1
29
+ πŸ”Ά,chargoddard/loyal-piano-m7,0.11,0.13,0.19,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
30
+ πŸ”Ά,rishiraj/CatPPT,0.09,0.12,0.19,0.44,0.0,0.98,mistralai/Mistral-7B-v0.1
31
+ πŸ”Ά,togethercomputer/RedPajama-INCITE-Instruct-3B-v1,0.08,0.12,0.19,0.43,0.0,0.77,mistralai/Mistral-7B-v0.1
32