compassjudger_subj_eval_leaderboard

Running

linjunyao committed 10 days ago

Commit

6734e22

•

1 Parent(s): f1fda01

updated citation and intro

Files changed (2) hide show

app.py CHANGED Viewed

@@ -41,7 +41,7 @@ with gr.Blocks() as demo:
     # timestamp = struct['time']
     # EVAL_TIME = format_timestamp(timestamp)
-    EVAL_TIME = '20241015'
     # results = struct['results']
     # N_MODEL = len(results)
@@ -284,7 +284,7 @@ with gr.Blocks() as demo:
                 value=CITATION_BUTTON_TEXT,
                 label=CITATION_BUTTON_LABEL,
                 elem_id='citation-button',
-                lines=10,
             )

     # timestamp = struct['time']
     # EVAL_TIME = format_timestamp(timestamp)
+    EVAL_TIME = '20241022'
     # results = struct['results']
     # N_MODEL = len(results)
                 value=CITATION_BUTTON_TEXT,
                 label=CITATION_BUTTON_LABEL,
                 elem_id='citation-button',
+                lines=7,
             )

judgerbench/meta_data.py CHANGED Viewed

@@ -21,12 +21,13 @@ STYLE_CLASS_MAPPING = {
 URL = "http://opencompass.openxlab.space/assets/OpenVLM.json"
 VLMEVALKIT_README = 'https://raw.githubusercontent.com/open-compass/VLMEvalKit/main/README.md'
 # CONSTANTS-CITATION
-CITATION_BUTTON_TEXT = r"""@misc{2023opencompass,
-    title={OpenCompass: A Universal Evaluation Platform for Foundation Models},
-    author={OpenCompass Contributors},
-    howpublished = {\url{https://github.com/open-compass/opencompass}},
-    year={2023}
-}"""
 CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
 # CONSTANTS-TEXT
@@ -34,6 +35,12 @@ LEADERBORAD_INTRODUCTION = """# CompassJudger Subjective Evaluation Learderboard
 ### Welcome to the CompassJudger Subjective Evaluation Learderboard!
 This leaderboard was last updated: {}.
 *All results from the corresponding datasets have been normalized to percentages.

 URL = "http://opencompass.openxlab.space/assets/OpenVLM.json"
 VLMEVALKIT_README = 'https://raw.githubusercontent.com/open-compass/VLMEvalKit/main/README.md'
 # CONSTANTS-CITATION
+CITATION_BUTTON_TEXT = r"""@article{cao2024compass,
+  title={CompassJudger-1: All-in-one Judge Model Helps Model Evaluation and Evolution},
+  author={Maosong Cao, Alexander Lam, Haodong Duan, Hongwei Liu, Songyang Zhang, Kai Chen},
+  journal={arXiv preprint arXiv:2410.16256},
+  year={2024}
+}
+"""
 CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
 # CONSTANTS-TEXT
 ### Welcome to the CompassJudger Subjective Evaluation Learderboard!
+Model Link: https://huggingface.co/opencompass/CompassJudger-1-7B-Instruct
+Code Link: https://github.com/open-compass/CompassJudger
+Paper Link: https://arxiv.org/pdf/2410.16256
 This leaderboard was last updated: {}.
 *All results from the corresponding datasets have been normalized to percentages.