Spaces:
Running
Running
Model,Validation Score | |
llama_avg (Baseline),38.4 | |
my_t5_avg,37.1 | |
flan_t5_weights,37.7 | |
shira_ft5_algo0,40.8 | |
shira_ft5xl_algo0,40.8 | |
shira_mtl7b_0_2_algo0,42.0 | |
shira_llama3_8b_it_algo0,44.9 | |
shira_qw2_7b_it_algo0,44.1 | |
cdutr_AqQ3,41.1 | |
cdutr_pi5c,37.2 | |
readapt_median,48.4 | |
lore_route,45.8 | |
basic_merge_00,44.7 | |
shira_algo_k00,29.5 | |
wcf_lar,52.2 | |
mistral_avg_exp_04,42.2 | |
llama_merge2,42.7 | |
mistral_avg_exp_06,41.2 | |
SLM,26.0 | |
mistral_avg_exp_05,41.4 | |
mistral_avg_exp_07,41.3 | |
llama_base_fc,44.2 | |
llama_base_qa,44.2 | |
llama_avg,18.8 | |
knovel_test,38.4 | |
flan_t5_avg,38 | |
abc,38.1 | |
deepseek_exp,36.5 | |
yi15_exp,40.7 | |
llama_optimized,38.0 | |
Fbaseline,38.0 | |
kobeni,46.7 | |
flan_t5_avg_lora,37.6 | |
BVD_Mega,54.5 | |
llama_avg,38.5 | |
yi15_exp,39.9 | |
mistral_exp,35,12.8 | |
gemma_exp,31.7,0 | |
deepseek_exp,33.0,0.0 | |
mistral_avg_exp_08,43.1,67.7 | |
mistral_grid_exp_01,40.7,67.6 | |
llama_avg,38.5,65.2 | |
mistral_ties_exp_05,40.1,66.0 | |
custom_flan_t5_2,, | |
blend_optimizer_00,40.7,68.2 | |
kobeni,46.7,67.2 | |
knovel_moe,39.2,63.9 | |
blend_optimizer_01,, | |
ties_llama2,32.0,61.0 | |
blend_optimizer_02,, | |
llama_single,44.9,67.7 | |
GemmaInstruct,38.7,65.2 | |
dga_avg,38.0,64.6 | |
llama_sel_lin_avg,, | |
llama_sel_lin_avg_2,, | |
huge_avg,38.2,28.2 | |
ArcLab_algorithm1,, | |
gemma_ties_exp_01,41.9,67.1 | |
gemma_ties_exp_02,, | |
flan_t5_avg,38.0,28.1 | |
llama_local,39.6,67.5 | |
F_or_t,37.9,28.1 | |
ArcLab_algorithm2,, | |
mistral_mc_ties_exp_01,40.4,66.4 | |
llama3_meta_mc_ties_exp_01,43.8,69.0 | |
F_or_t,38.0,28.2 | |
python llm_merging/main.py -m hj_qa,, | |
python llm_merging/main.py -m hj_fc,, | |
llama3_meta_mc_ties_exp_02,43.6,69.1 | |
llama_avg,38.5,65.3 | |
llama_avg8_21,38.5,65.2 |