Spaces:

ahmedheakl
/

CAMEL-Bench-leaderboard

Running

ahmedheakl committed on 14 days ago

Commit

20f0a61

•

1 Parent(s): aae65ae

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import pandas as pd
 import gradio as gr
-# Create the dataset based on the table you provided
 data = {
     "Method": ["GPT-4o", "GPT-4o-mini", "Gemini-1.5-Pro", "Gemini-1.5-Flash", "Qwen2-VL-2B"],
     "MM Understanding & Reasoning": [57.90, 48.82, 46.67, 45.58, 40.59],
@@ -14,20 +13,18 @@ data = {
     "Remote Sensing Understanding": [22.85, 16.93, 17.07, 14.95, 12.56]
 }
-# Convert the dataset into a DataFrame
 df = pd.DataFrame(data)
-# Calculate the average score for each model across the different tasks
 df['Average Score'] = df.iloc[:, 1:].mean(axis=1)
-# Function to display the data in a Gradio interface
 def display_data():
     return df
-# Create the Gradio interface
 with gr.Blocks() as demo:
-    gr.Markdown("# Model Performance Across Various Understanding Tasks")
-    gr.Markdown("This table shows the performance of different models across various tasks including OCR, chart understanding, video, medical imaging, and more. An average score is also calculated for each model.")
-    gr.Dataframe(value=df, label="Model Performance with Average Scores", interactive=False)
 demo.launch()

 import pandas as pd
 import gradio as gr
 data = {
     "Method": ["GPT-4o", "GPT-4o-mini", "Gemini-1.5-Pro", "Gemini-1.5-Flash", "Qwen2-VL-2B"],
     "MM Understanding & Reasoning": [57.90, 48.82, 46.67, 45.58, 40.59],
     "Remote Sensing Understanding": [22.85, 16.93, 17.07, 14.95, 12.56]
 }
 df = pd.DataFrame(data)
 df['Average Score'] = df.iloc[:, 1:].mean(axis=1)
 def display_data():
     return df
 with gr.Blocks() as demo:
+    gr.Markdown("![camel icon](https://cdn-uploads.huggingface.co/production/uploads/656864e12d73834278a8dea7/n-XfVKd1xVywH_vgPyJyQ.png)", elem_id="camel-icon")  # Replace with actual camel icon URL
+    gr.Markdown("# **CAMEL-Bench: Model Performance Across Vision Understanding Tasks**")
+    gr.Markdown("""
+    This table shows the performance of different models across various tasks including OCR, chart understanding, video, medical imaging, and more.
+    """)
+    gr.Dataframe(value=df, label="CAMEL-Bench Model Performance", interactive=False)
 demo.launch()