lambdaofgod committed on
Commit
15fac57
1 Parent(s): 3e888ed
Files changed (1) hide show
  1. pages/2_Statistics.py +6 -7
pages/2_Statistics.py CHANGED
@@ -1,12 +1,10 @@
1
  import pandas as pd
2
  import streamlit as st
3
 
4
- best_results_df = pd.read_csv("output/best_tasks_with_hits.csv")
5
 
6
 
7
- worst_results_df = pd.read_csv(
8
- "output/worst_tasks_with_hits.csv"
9
- ) # , data_path="output/papers_with_dependencies.csv",
10
 
11
  show_worst_best_statistics = st.sidebar.checkbox(
12
  label="show worst/best statistics grouped by area"
@@ -16,11 +14,13 @@ show_area_aggregated_results = st.sidebar.checkbox(
16
  label="show results aggregated by area"
17
  )
18
  if show_worst_best_statistics:
19
- st.markdown("""
 
20
  ## Worst/best queries
21
  The following are top 10 worst/best queries per area by number of hits.
22
  There are at least 10 documents per query in the test set, so number of hits/10 is the accuracy.
23
- """)
 
24
  sort_key = st.selectbox("sort by", list(best_results_df.columns))
25
  st.markdown("## Queries with best results")
26
  st.table(best_results_df.sort_values(sort_key, ascending=False))
@@ -36,4 +36,3 @@ if show_area_aggregated_results:
36
  st.table(best_results_agg.sort_values(sort_key, ascending=False))
37
  st.markdown("Worst results")
38
  st.table(worst_results_agg.sort_values(sort_key, ascending=False))
39
-
 
1
  import pandas as pd
2
  import streamlit as st
3
 
4
+ best_results_df = pd.read_csv("assets/best_tasks_with_hits.csv")
5
 
6
 
7
+ worst_results_df = pd.read_csv("assets/worst_tasks_with_hits.csv")
 
 
8
 
9
  show_worst_best_statistics = st.sidebar.checkbox(
10
  label="show worst/best statistics grouped by area"
 
14
  label="show results aggregated by area"
15
  )
16
  if show_worst_best_statistics:
17
+ st.markdown(
18
+ """
19
  ## Worst/best queries
20
  The following are top 10 worst/best queries per area by number of hits.
21
  There are at least 10 documents per query in the test set, so number of hits/10 is the accuracy.
22
+ """
23
+ )
24
  sort_key = st.selectbox("sort by", list(best_results_df.columns))
25
  st.markdown("## Queries with best results")
26
  st.table(best_results_df.sort_values(sort_key, ascending=False))
 
36
  st.table(best_results_agg.sort_values(sort_key, ascending=False))
37
  st.markdown("Worst results")
38
  st.table(worst_results_agg.sort_values(sort_key, ascending=False))