mihaimasala
committed on
Commit
•
be4b547
1
Parent(s):
f4c53d2
Update README.md
Browse files
README.md
CHANGED
@@ -575,10 +575,16 @@ print(tokenizer.decode(outputs[0]))
|
|
575 |
<td><strong><center>TruthfulQA</center></strong></td>
|
576 |
</tr>
|
577 |
<tr>
|
578 |
-
<td>Llama-3-8B-Instruct</td><td><center
|
579 |
</tr>
|
580 |
<tr>
|
581 |
-
<td><em>RoLlama3-8b-Instruct</em></td><td><center><em>50.56</em></center></td><td><center><em
|
|
|
|
|
|
|
|
|
|
|
|
|
582 |
</tr>
|
583 |
</tbody>
|
584 |
</table>
|
@@ -614,7 +620,13 @@ print(tokenizer.decode(outputs[0]))
|
|
614 |
<td>Llama-3-8B-Instruct</td><td><center>95.88</center></td><td><center>56.21</center></td><td><center><strong>98.53</strong></center></td><td><center>86.19</center></td><td><center>18.88</center></td><td><center><strong>30.98</strong></center></td><td><center><strong>28.02</strong></center></td><td><center>40.28</center></td>
|
615 |
</tr>
|
616 |
<tr>
|
617 |
-
<td><em>RoLlama3-8b-Instruct</em></td><td><center><em><strong>97.52</strong></em></center></td><td><center><em><strong>67.41</strong></em></center></td><td><center><em>94.15</em></center></td><td><center><em
|
|
|
|
|
|
|
|
|
|
|
|
|
618 |
</tr>
|
619 |
</tbody>
|
620 |
</table>
|
@@ -649,7 +661,13 @@ print(tokenizer.decode(outputs[0]))
|
|
649 |
<td>Llama-3-8B-Instruct</td><td><center><strong>39.47</strong></center></td><td><center>58.67</center></td><td><center><strong>67.65</strong></center></td><td><center><strong>82.77</strong></center></td><td><center>73.04</center></td><td><center>72.36</center></td><td><center>83.49</center></td><td><center>84.06</center></td>
|
650 |
</tr>
|
651 |
<tr>
|
652 |
-
<td><em>RoLlama3-8b-Instruct</em></td><td><center><em>39.43</em></center></td><td><center><em><strong>59.50</strong></em></center></td><td><center><em>44.45</em></center></td><td><center><em>59.76</em></center></td><td><center><em
|
|
|
|
|
|
|
|
|
|
|
|
|
653 |
</tr>
|
654 |
</tbody>
|
655 |
</table>
|
@@ -667,10 +685,16 @@ print(tokenizer.decode(outputs[0]))
|
|
667 |
<td><strong><center>Answers in Ro</center></strong></td>
|
668 |
</tr>
|
669 |
<tr>
|
670 |
-
<td>Llama-3-8B-Instruct</td><td><center><strong>5.96</strong></center></td><td><center
|
|
|
|
|
|
|
|
|
|
|
|
|
671 |
</tr>
|
672 |
<tr>
|
673 |
-
<td
|
674 |
</tr>
|
675 |
</tbody>
|
676 |
</table>
|
@@ -689,17 +713,26 @@ print(tokenizer.decode(outputs[0]))
|
|
689 |
<td>Llama-3-8B-Instruct</td><td><center><strong>4.62</strong></center></td><td><center><strong>100/100</strong></center></td>
|
690 |
</tr>
|
691 |
<tr>
|
692 |
-
<td><em>RoLlama3-8b-Instruct</em></td><td><center><em>3.71</em></center></td><td><center><em><strong>100/100</strong></em></center></td>
|
|
|
|
|
|
|
|
|
|
|
|
|
693 |
</tr>
|
694 |
</tbody>
|
695 |
</table>
|
696 |
|
697 |
|
|
|
698 |
## RoLlama3 Model Family
|
699 |
|
700 |
| Model | Link |
|
701 |
|--------------------|:--------:|
|
702 |
-
|*RoLlama3-8b-Instruct*| [link](https://huggingface.co/OpenLLM-Ro/RoLlama3-8b-Instruct) |
|
|
|
|
|
703 |
|
704 |
|
705 |
## Citation
|
|
|
575 |
<td><strong><center>TruthfulQA</center></strong></td>
|
576 |
</tr>
|
577 |
<tr>
|
578 |
+
<td>Llama-3-8B-Instruct</td><td><center>50.62</center></td><td><center>43.69</center></td><td><center>52.04</center></td><td><center>59.33</center></td><td><center>53.19</center></td><td><center><strong>43.87</strong></center></td><td><center><strong>51.59</strong></center></td>
|
579 |
</tr>
|
580 |
<tr>
|
581 |
+
<td><em>RoLlama3-8b-Instruct-2024-06-28</em></td><td><center><em>50.56</em></center></td><td><center><em>44.70</em></center></td><td><center><em>52.19</em></center></td><td><center><em><strong>67.23</strong></em></center></td><td><center><em>57.69</em></center></td><td><center><em>30.23</em></center></td><td><center><em>51.34</em></center></td>
|
582 |
+
</tr>
|
583 |
+
<tr>
|
584 |
+
<td>RoLlama3-8b-Instruct-2024-10-09</td><td><center><strong>52.21</strong></center></td><td><center><strong>47.94</strong></center></td><td><center><strong>53.50</strong></center></td><td><center>66.06</center></td><td><center><strong>59.72</strong></center></td><td><center>40.16</center></td><td><center>45.90</center></td>
|
585 |
+
</tr>
|
586 |
+
<tr>
|
587 |
+
<td>RoLlama3-8b-Instruct-DPO-2024-10-09</td><td><center>49.96</center></td><td><center>46.29</center></td><td><center>53.29</center></td><td><center>65.57</center></td><td><center>58.15</center></td><td><center>34.77</center></td><td><center>41.70</center></td>
|
588 |
</tr>
|
589 |
</tbody>
|
590 |
</table>
|
|
|
620 |
<td>Llama-3-8B-Instruct</td><td><center>95.88</center></td><td><center>56.21</center></td><td><center><strong>98.53</strong></center></td><td><center>86.19</center></td><td><center>18.88</center></td><td><center><strong>30.98</strong></center></td><td><center><strong>28.02</strong></center></td><td><center>40.28</center></td>
|
621 |
</tr>
|
622 |
<tr>
|
623 |
+
<td><em>RoLlama3-8b-Instruct-2024-06-28</em></td><td><center><em><strong>97.52</strong></em></center></td><td><center><em><strong>67.41</strong></em></center></td><td><center><em>94.15</em></center></td><td><center><em>87.13</em></center></td><td><center><em><strong>24.01</strong></em></center></td><td><center><em>27.36</em></center></td><td><center><em>26.53</em></center></td><td><center><em>40.36</em></center></td>
|
624 |
+
</tr>
|
625 |
+
<tr>
|
626 |
+
<td>RoLlama3-8b-Instruct-2024-10-09</td><td><center>95.58</center></td><td><center>61.20</center></td><td><center>96.46</center></td><td><center><strong>87.26</strong></center></td><td><center>22.92</center></td><td><center>24.28</center></td><td><center>27.31</center></td><td><center><strong>40.52</strong></center></td>
|
627 |
+
</tr>
|
628 |
+
<tr>
|
629 |
+
<td>RoLlama3-8b-Instruct-DPO-2024-10-09</td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td>
|
630 |
</tr>
|
631 |
</tbody>
|
632 |
</table>
|
|
|
661 |
<td>Llama-3-8B-Instruct</td><td><center><strong>39.47</strong></center></td><td><center>58.67</center></td><td><center><strong>67.65</strong></center></td><td><center><strong>82.77</strong></center></td><td><center>73.04</center></td><td><center>72.36</center></td><td><center>83.49</center></td><td><center>84.06</center></td>
|
662 |
</tr>
|
663 |
<tr>
|
664 |
+
<td><em>RoLlama3-8b-Instruct-2024-06-28</em></td><td><center><em>39.43</em></center></td><td><center><em><strong>59.50</strong></em></center></td><td><center><em>44.45</em></center></td><td><center><em>59.76</em></center></td><td><center><em>77.20</em></center></td><td><center><em><strong>77.87</strong></em></center></td><td><center><em>85.80</em></center></td><td><center><em>86.05</em></center></td>
|
665 |
+
</tr>
|
666 |
+
<tr>
|
667 |
+
<td>RoLlama3-8b-Instruct-2024-10-09</td><td><center>18.89</center></td><td><center>31.79</center></td><td><center>50.84</center></td><td><center>65.18</center></td><td><center><strong>77.60</strong></center></td><td><center>76.86</center></td><td><center><strong>86.70</strong></center></td><td><center><strong>87.09</strong></center></td>
|
668 |
+
</tr>
|
669 |
+
<tr>
|
670 |
+
<td>RoLlama3-8b-Instruct-DPO-2024-10-09</td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td><td><center>-</center></td>
|
671 |
</tr>
|
672 |
</tbody>
|
673 |
</table>
|
|
|
685 |
<td><strong><center>Answers in Ro</center></strong></td>
|
686 |
</tr>
|
687 |
<tr>
|
688 |
+
<td>Llama-3-8B-Instruct</td><td><center><strong>5.96</strong></center></td><td><center>6.16</center></td><td><center><strong>5.76</strong></center></td><td><center>158/160</center></td>
|
689 |
+
</tr>
|
690 |
+
<tr>
|
691 |
+
<td><em>RoLlama3-8b-Instruct-2024-06-28</em></td><td><center><em>5.15</em></center></td><td><center><em>6.03</em></center></td><td><center><em>4.28</em></center></td><td><center><em><strong>160/160</strong></em></center></td>
|
692 |
+
</tr>
|
693 |
+
<tr>
|
694 |
+
<td>RoLlama3-8b-Instruct-2024-10-09</td><td><center>5.38</center></td><td><center>6.09</center></td><td><center>4.67</center></td><td><center><strong>160/160</strong></center></td>
|
695 |
</tr>
|
696 |
<tr>
|
697 |
+
<td>RoLlama3-8b-Instruct-DPO-2024-10-09</td><td><center>5.87</center></td><td><center><strong>6.22</strong></center></td><td><center>5.49</center></td><td><center><strong>160/160</strong></center></td>
|
698 |
</tr>
|
699 |
</tbody>
|
700 |
</table>
|
|
|
713 |
<td>Llama-3-8B-Instruct</td><td><center><strong>4.62</strong></center></td><td><center><strong>100/100</strong></center></td>
|
714 |
</tr>
|
715 |
<tr>
|
716 |
+
<td><em>RoLlama3-8b-Instruct-2024-06-28</em></td><td><center><em>3.71</em></center></td><td><center><em><strong>100/100</strong></em></center></td>
|
717 |
+
</tr>
|
718 |
+
<tr>
|
719 |
+
<td>RoLlama3-8b-Instruct-2024-10-09</td><td><center>3.81</center></td><td><center><strong>100/100</strong></center></td>
|
720 |
+
</tr>
|
721 |
+
<tr>
|
722 |
+
<td>RoLlama3-8b-Instruct-DPO-2024-10-09</td><td><center>4.40</center></td><td><center><strong>100/100</strong></center></td>
|
723 |
</tr>
|
724 |
</tbody>
|
725 |
</table>
|
726 |
|
727 |
|
728 |
+
|
729 |
## RoLlama3 Model Family
|
730 |
|
731 |
| Model | Link |
|
732 |
|--------------------|:--------:|
|
733 |
+
|*RoLlama3-8b-Instruct-2024-06-28*| [link](https://huggingface.co/OpenLLM-Ro/RoLlama3-8b-Instruct-2024-06-28) |
|
734 |
+
|RoLlama3-8b-Instruct-2024-10-09| [link](https://huggingface.co/OpenLLM-Ro/RoLlama3-8b-Instruct-2024-10-09) |
|
735 |
+
|RoLlama3-8b-Instruct-DPO-2024-10-09| [link](https://huggingface.co/OpenLLM-Ro/RoLlama3-8b-Instruct-DPO-2024-10-09) |
|
736 |
|
737 |
|
738 |
## Citation
|