Spaces:

LLM360
/

de-arena

Running

yzabc007 committed on Oct 9

Commit

887dd92

•

1 Parent(s): 7467403

Update space

Files changed (2) hide show

app.py CHANGED Viewed

@@ -130,7 +130,7 @@ with demo:
     gr.HTML(SUB_TITLE)
     gr.HTML(EXTERNAL_LINKS)
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs(elem_classes="tab-buttons") as tabs:
         with gr.TabItem("🏅 Overview", elem_id="llm-benchmark-tab-table", id=0):
@@ -313,7 +313,7 @@ with demo:
             gr.Markdown(CURRENT_TEXT, elem_classes="markdown-text")
-        with gr.TabItem("</> Coding", elem_id="coding-tab-table", id=5):
             CURRENT_TEXT = """
             # Coming soon!
             We are working on adding more tasks in coding domains to the leaderboard.
@@ -332,7 +332,9 @@ with demo:
         with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=6):
-            gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
         '''

     gr.HTML(SUB_TITLE)
     gr.HTML(EXTERNAL_LINKS)
     gr.Markdown(INTRODUCTION_TEXT, elem_classes="markdown-text")
     with gr.Tabs(elem_classes="tab-buttons") as tabs:
         with gr.TabItem("🏅 Overview", elem_id="llm-benchmark-tab-table", id=0):
             gr.Markdown(CURRENT_TEXT, elem_classes="markdown-text")
+        with gr.TabItem("</> Coding", elem_id="coding-table", id=5):
             CURRENT_TEXT = """
             # Coming soon!
             We are working on adding more tasks in coding domains to the leaderboard.
         with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=6):
+            ABOUT_TEXT = """
+            """
+            gr.Markdown(ABOUT_TEXT, elem_classes="markdown-text")
         '''

src/about.py CHANGED Viewed

@@ -69,7 +69,7 @@ EXTERNAL_LINKS = """
 # What does your leaderboard evaluate?
 INTRODUCTION_TEXT = """
-Decentralized Arena automates and scales "Chatbot Arena" for LLM evaluation across various fine-grained dimensions
 (e.g., math – algebra, geometry, probability; logical reasoning, social reasoning, biology, chemistry, …).
 The evaluation is decentralized and democratic, with all LLMs participating in evaluating others.
 It achieves a 95\% correlation with Chatbot Arena's overall rankings, while being fully transparent and reproducible.

 # What does your leaderboard evaluate?
 INTRODUCTION_TEXT = """
+**Decentralized Arena** automates and scales "Chatbot Arena" for LLM evaluation across various fine-grained dimensions
 (e.g., math – algebra, geometry, probability; logical reasoning, social reasoning, biology, chemistry, …).
 The evaluation is decentralized and democratic, with all LLMs participating in evaluating others.
 It achieves a 95\% correlation with Chatbot Arena's overall rankings, while being fully transparent and reproducible.