Gregor Betz committed on
Commit
e39b6d4
1 Parent(s): a6d8c19

just delta abs

Browse files
Files changed (3) hide show
  1. app.py +10 -12
  2. src/display/about.py +7 -7
  3. src/leaderboard/read_evals.py +1 -1
app.py CHANGED
@@ -147,18 +147,16 @@ with demo:
147
  show_label=False,
148
  elem_id="search-bar",
149
  )
150
- with gr.Row():
151
- shown_columns = gr.Radio(
152
- choices=[
153
- c for c in METRICS
154
- ],
155
- value=[
156
- c for c in METRICS
157
- ],
158
- label="Select metrics to show",
159
- elem_id="metrics-select",
160
- interactive=True,
161
- )
162
  with gr.Row():
163
  shown_columns = gr.CheckboxGroup(
164
  choices=[
 
147
  show_label=False,
148
  elem_id="search-bar",
149
  )
150
+ # with gr.Row():
151
+ # shown_columns = gr.Radio(
152
+ # choices=[
153
+ # c for c in METRICS
154
+ # ],
155
+ # value=METRICS[0],
156
+ # label="Select metrics to show",
157
+ # elem_id="metrics-select",
158
+ # interactive=True,
159
+ # )
 
 
160
  with gr.Row():
161
  shown_columns = gr.CheckboxGroup(
162
  choices=[
src/display/about.py CHANGED
@@ -12,15 +12,15 @@ class Task:
12
  class Tasks(Enum):
13
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
14
  task0 = Task("logiqa", "delta_abs", "LogiQA Δ")
15
- task1 = Task("logiqa", "delta_rel", "LogiQA Δ%")
16
- task2 = Task("logiqa", "acc_base", "LogiQA Acc")
17
- task3 = Task("logiqa", "acc_cot", "LogiQA AccCoT")
18
  task4 = Task("logiqa2", "delta_abs", "LogiQA2 Δ")
19
- task5 = Task("logiqa2", "delta_rel", "LogiQA2 Δ%")
20
- task6 = Task("logiqa2", "acc_base", "LogiQA2 Acc")
21
- task7 = Task("logiqa2", "acc_cot", "LogiQA2 AccCoT")
22
 
23
- METRICS = list(set([task.value.metric for task in Tasks]))
24
 
25
 
26
 
 
12
  class Tasks(Enum):
13
  # task_key in the json file, metric_key in the json file, name to display in the leaderboard
14
  task0 = Task("logiqa", "delta_abs", "LogiQA Δ")
15
+ #task1 = Task("logiqa", "delta_rel", "LogiQA Δ%")
16
+ #task2 = Task("logiqa", "acc_base", "LogiQA Acc")
17
+ #task3 = Task("logiqa", "acc_cot", "LogiQA AccCoT")
18
  task4 = Task("logiqa2", "delta_abs", "LogiQA2 Δ")
19
+ #task5 = Task("logiqa2", "delta_rel", "LogiQA2 Δ%")
20
+ #task6 = Task("logiqa2", "acc_base", "LogiQA2 Acc")
21
+ #task7 = Task("logiqa2", "acc_cot", "LogiQA2 AccCoT")
22
 
23
+ #METRICS = list(set([task.value.metric for task in Tasks]))
24
 
25
 
26
 
src/leaderboard/read_evals.py CHANGED
@@ -84,7 +84,7 @@ class EvalResult:
84
  model=model,
85
  results=results,
86
  precision=precision,
87
- revision= config.get("model_sha", ""),
88
  still_on_hub=still_on_hub,
89
  architecture=architecture
90
  )
 
84
  model=model,
85
  results=results,
86
  precision=precision,
87
+ revision=config.get("model_sha", ""),
88
  still_on_hub=still_on_hub,
89
  architecture=architecture
90
  )