Corey Morris
committed on
Commit
•
0c07f8b
1
Parent(s):
f1eba6e
updated date and model count
Browse files
app.py
CHANGED
@@ -123,8 +123,8 @@ def find_top_differences_table(df, target_model, closest_models, num_differences
|
|
123 |
data_provider = ResultDataProcessor()
|
124 |
|
125 |
# st.title('Model Evaluation Results including MMLU by task')
|
126 |
-
st.title('Exploring the Characteristics of Large Language Models: An Interactive Portal for Analyzing
|
127 |
-
st.markdown("""***Last updated
|
128 |
st.markdown("""**Models that are suspected to have training data contaminated with evaluation data have been removed.**""")
|
129 |
st.markdown("""
|
130 |
Hugging Face runs evaluations on open source models and provides results on a
|
|
|
123 |
data_provider = ResultDataProcessor()
|
124 |
|
125 |
# st.title('Model Evaluation Results including MMLU by task')
|
126 |
+
st.title('Exploring the Characteristics of Large Language Models: An Interactive Portal for Analyzing 1100+ Open Source Models Across 57 Diverse Evaluation Tasks')
|
127 |
+
st.markdown("""***Last updated September 1st***""")
|
128 |
st.markdown("""**Models that are suspected to have training data contaminated with evaluation data have been removed.**""")
|
129 |
st.markdown("""
|
130 |
Hugging Face runs evaluations on open source models and provides results on a
|