lambdaofgod committed on
Commit
1ed024e
1 Parent(s): 6b3fd91

updated model config

Browse files
assets/best_tasks.csv ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ area,task,hits
2
+ adversarial,adversarial attack,9
3
+ adversarial,adversarial defense,4
4
+ adversarial,backdoor attack,1
5
+ adversarial,adversarial text,1
6
+ audio,sound event localization and detection,3
7
+ audio,environmental sound classification,1
8
+ audio,audio tagging,1
9
+ audio,voice anti spoofing,0
10
+ computer-code,program induction,0
11
+ computer-code,learning to execute,0
12
+ computer-code,type prediction,0
13
+ computer-vision,person retrieval,10
14
+ computer-vision,optical character recognition,10
15
+ computer-vision,style transfer,10
16
+ computer-vision,action recognition,10
17
+ computer-vision,denoising,10
18
+ computer-vision,depth estimation,10
19
+ computer-vision,human object interaction detection,10
20
+ computer-vision,semantic segmentation,9
21
+ computer-vision,monocular depth estimation,8
22
+ computer-vision,instance segmentation,8
23
+ graphs,semantic segmentation,9
24
+ graphs,link prediction,7
25
+ graphs,graph attention,4
26
+ graphs,graph clustering,3
27
+ graphs,video inpainting,1
28
+ graphs,graph partitioning,1
29
+ graphs,graph regression,1
30
+ graphs,graph reconstruction,0
31
+ graphs,graph property prediction,0
32
+ graphs,graph learning,0
33
+ knowledge-base,link prediction,7
34
+ knowledge-base,entity alignment,1
35
+ knowledge-base,breast cancer detection,1
36
+ medical,medical image segmentation,5
37
+ medical,breast cancer detection,1
38
+ medical,iris segmentation,1
39
+ medical,cell segmentation,0
40
+ medical,medical relation extraction,0
41
+ medical,pancreas segmentation,0
42
+ medical,liver segmentation,0
43
+ medical,lesion segmentation,0
44
+ medical,medical code prediction,0
45
+ medical,brain segmentation,0
46
+ methodology,gaussian processes,10
47
+ methodology,density estimation,9
48
+ methodology,network pruning,9
49
+ methodology,imitation learning,9
50
+ methodology,word embeddings,9
51
+ methodology,outlier detection,7
52
+ methodology,automl,6
53
+ methodology,data augmentation,5
54
+ methodology,stochastic optimization,5
55
+ methodology,network embedding,4
56
+ miscellaneous,click through rate prediction,9
57
+ miscellaneous,session based recommendations,9
58
+ miscellaneous,molecular property prediction,6
59
+ miscellaneous,cross modal retrieval,5
60
+ miscellaneous,causal inference,5
61
+ miscellaneous,variational monte carlo,2
62
+ miscellaneous,data visualization,0
63
+ miscellaneous,malware classification,0
64
+ miscellaneous,counterfactual inference,0
65
+ miscellaneous,misinformation,0
66
+ music,music source separation,3
67
+ natural-language-processing,relation extraction,10
68
+ natural-language-processing,sentiment analysis,9
69
+ natural-language-processing,text summarization,7
70
+ natural-language-processing,text generation,6
71
+ natural-language-processing,aspect based sentiment analysis,5
72
+ natural-language-processing,chinese word segmentation,4
73
+ natural-language-processing,discourse parsing,4
74
+ natural-language-processing,grammatical error correction,4
75
+ natural-language-processing,discourse segmentation,3
76
+ natural-language-processing,bilingual lexicon induction,3
77
+ playing-games,snes games,0
78
+ playing-games,dota 2,0
79
+ playing-games,real time strategy games,0
80
+ playing-games,smac,0
81
+ reasoning,visual commonsense reasoning,2
82
+ reasoning,model based reinforcement learning,1
83
+ reasoning,common sense reasoning,1
84
+ robots,semantic segmentation,9
85
+ robots,gesture generation,2
86
+ robots,safe exploration,0
87
+ robots,deformable object manipulation,0
88
+ speech,speech synthesis,10
89
+ speech,distant speech recognition,7
90
+ speech,speech recognition,7
91
+ speech,speech enhancement,6
92
+ speech,speaker diarization,3
93
+ speech,speaker recognition,2
94
+ speech,speaker separation,1
95
+ speech,robust speech recognition,0
96
+ speech,acoustic unit discovery,0
97
+ time-series,time series,8
98
+ time-series,dynamic time warping,6
99
+ time-series,time series clustering,2
100
+ time-series,stock price prediction,2
101
+ time-series,stock market prediction,2
102
+ time-series,video quality assessment,1
103
+ time-series,traffic prediction,0
104
+ time-series,time series analysis,0
105
+ time-series,data compression,0
assets/best_tasks_with_hits.csv DELETED
@@ -1,107 +0,0 @@
1
- area,task,hits
2
- adversarial,adversarial attack,8
3
- adversarial,adversarial defense,2
4
- adversarial,data poisoning,2
5
- adversarial,inference attack,0
6
- audio,audio generation,4
7
- audio,audio source separation,3
8
- audio,language identification,1
9
- audio,audio tagging,1
10
- computer-code,text to sql,9
11
- computer-code,program induction,1
12
- computer-code,code search,0
13
- computer-code,type prediction,0
14
- computer-vision,style transfer,10
15
- computer-vision,crowd counting,10
16
- computer-vision,depth estimation,10
17
- computer-vision,object detection,10
18
- computer-vision,person re identification,10
19
- computer-vision,text to image generation,9
20
- computer-vision,image inpainting,8
21
- computer-vision,image registration,7
22
- computer-vision,video captioning,7
23
- computer-vision,lane detection,7
24
- graphs,topological data analysis,8
25
- graphs,node classification,7
26
- graphs,learning to rank,5
27
- graphs,graph embedding,4
28
- graphs,knowledge graph embedding,3
29
- graphs,knowledge graph embeddings,2
30
- graphs,graph learning,1
31
- graphs,knowledge base completion,1
32
- graphs,image outpainting,0
33
- graphs,image relighting,0
34
- knowledge-base,knowledge base completion,1
35
- knowledge-base,video to video synthesis,0
36
- knowledge-base,breast cancer detection,0
37
- medical,synthetic data generation,5
38
- medical,medical image registration,2
39
- medical,cardiac segmentation,2
40
- medical,length of stay prediction,1
41
- medical,skin lesion segmentation,1
42
- medical,medical image segmentation,1
43
- medical,breast cancer detection,0
44
- medical,liver segmentation,0
45
- medical,seizure detection,0
46
- medical,brain decoding,0
47
- methodology,anomaly detection,10
48
- methodology,active learning,10
49
- methodology,domain adaptation,10
50
- methodology,disentanglement,9
51
- methodology,density estimation,9
52
- methodology,few shot learning,7
53
- methodology,imitation learning,6
54
- methodology,stochastic optimization,6
55
- methodology,transfer learning,5
56
- methodology,outlier detection,5
57
- miscellaneous,survival analysis,9
58
- miscellaneous,recommendation systems,7
59
- miscellaneous,sequential recommendation,5
60
- miscellaneous,learning to rank,5
61
- miscellaneous,malware detection,5
62
- miscellaneous,synthetic data generation,5
63
- miscellaneous,multi armed bandits,4
64
- miscellaneous,deep clustering,3
65
- miscellaneous,prediction intervals,2
66
- miscellaneous,model discovery,1
67
- music,music modeling,5
68
- natural-language-processing,relation extraction,10
69
- natural-language-processing,active learning,10
70
- natural-language-processing,coreference resolution,10
71
- natural-language-processing,natural language inference,9
72
- natural-language-processing,text generation,8
73
- natural-language-processing,text matching,5
74
- natural-language-processing,discourse parsing,5
75
- natural-language-processing,relational reasoning,5
76
- natural-language-processing,dialogue generation,4
77
- natural-language-processing,fact verification,4
78
- playing-games,game of chess,9
79
- playing-games,game of go,8
80
- playing-games,atari games,6
81
- playing-games,card games,1
82
- playing-games,real time strategy games,1
83
- playing-games,starcraft,0
84
- playing-games,acrobot,0
85
- reasoning,decision making,3
86
- reasoning,math word problem solving,0
87
- robots,vision and language navigation,4
88
- robots,visual odometry,3
89
- robots,motion planning,3
90
- robots,image outpainting,0
91
- robots,robotic grasping,0
92
- robots,trajectory planning,0
93
- speech,speaker verification,9
94
- speech,text to speech synthesis,5
95
- speech,dialogue generation,4
96
- speech,speech enhancement,4
97
- speech,speaker diarization,4
98
- time-series,time series,8
99
- time-series,time series classification,3
100
- time-series,time series prediction,2
101
- time-series,multivariate time series forecasting,1
102
- time-series,time series clustering,1
103
- time-series,portfolio optimization,1
104
- time-series,stock market prediction,1
105
- time-series,activity prediction,0
106
- time-series,math word problem solving,0
107
- time-series,stock trend prediction,0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
assets/worst_tasks.csv ADDED
@@ -0,0 +1,105 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ area,task,hits
2
+ adversarial,backdoor attack,1
3
+ adversarial,adversarial text,1
4
+ adversarial,adversarial defense,4
5
+ adversarial,adversarial attack,9
6
+ audio,voice anti spoofing,0
7
+ audio,environmental sound classification,1
8
+ audio,audio tagging,1
9
+ audio,sound event localization and detection,3
10
+ computer-code,program induction,0
11
+ computer-code,learning to execute,0
12
+ computer-code,type prediction,0
13
+ computer-vision,traffic sign recognition,0
14
+ computer-vision,object proposal generation,0
15
+ computer-vision,face parsing,0
16
+ computer-vision,stereo lidar fusion,0
17
+ computer-vision,electron microscopy image segmentation,0
18
+ computer-vision,surface normals estimation,0
19
+ computer-vision,salt and pepper noise removal,0
20
+ computer-vision,weakly supervised segmentation,0
21
+ computer-vision,camera calibration,0
22
+ computer-vision,genre classification,0
23
+ graphs,graph reconstruction,0
24
+ graphs,graph property prediction,0
25
+ graphs,graph learning,0
26
+ graphs,video inpainting,1
27
+ graphs,graph partitioning,1
28
+ graphs,graph regression,1
29
+ graphs,graph clustering,3
30
+ graphs,graph attention,4
31
+ graphs,link prediction,7
32
+ graphs,semantic segmentation,9
33
+ knowledge-base,entity alignment,1
34
+ knowledge-base,breast cancer detection,1
35
+ knowledge-base,link prediction,7
36
+ medical,cell segmentation,0
37
+ medical,medical relation extraction,0
38
+ medical,pancreas segmentation,0
39
+ medical,liver segmentation,0
40
+ medical,lesion segmentation,0
41
+ medical,medical code prediction,0
42
+ medical,brain segmentation,0
43
+ medical,skin cancer classification,0
44
+ medical,medical image registration,0
45
+ medical,breast cancer detection,1
46
+ methodology,multi label classification,0
47
+ methodology,unsupervised pre training,0
48
+ methodology,classification,0
49
+ methodology,multilingual word embeddings,0
50
+ methodology,one class classifier,0
51
+ methodology,data visualization,0
52
+ methodology,automatic machine learning model selection,0
53
+ methodology,l2 regularization,0
54
+ methodology,abnormal event detection in video,0
55
+ methodology,generalization bounds,0
56
+ miscellaneous,data visualization,0
57
+ miscellaneous,counterfactual inference,0
58
+ miscellaneous,misinformation,0
59
+ miscellaneous,physical simulations,0
60
+ miscellaneous,formation energy,0
61
+ miscellaneous,malware classification,0
62
+ miscellaneous,multi target regression,0
63
+ miscellaneous,open set learning,0
64
+ miscellaneous,model discovery,0
65
+ miscellaneous,cyber attack detection,0
66
+ music,music source separation,3
67
+ natural-language-processing,automatic post editing,0
68
+ natural-language-processing,text augmentation,0
69
+ natural-language-processing,part of speech tagging,0
70
+ natural-language-processing,sentence ordering,0
71
+ natural-language-processing,grammatical error detection,0
72
+ natural-language-processing,unsupervised extractive summarization,0
73
+ natural-language-processing,multilingual nlp,0
74
+ natural-language-processing,text categorization,0
75
+ natural-language-processing,twitter sentiment analysis,0
76
+ natural-language-processing,extract aspect,0
77
+ playing-games,snes games,0
78
+ playing-games,dota 2,0
79
+ playing-games,real time strategy games,0
80
+ playing-games,smac,0
81
+ reasoning,model based reinforcement learning,1
82
+ reasoning,common sense reasoning,1
83
+ reasoning,visual commonsense reasoning,2
84
+ robots,safe exploration,0
85
+ robots,deformable object manipulation,0
86
+ robots,gesture generation,2
87
+ robots,semantic segmentation,9
88
+ speech,robust speech recognition,0
89
+ speech,acoustic unit discovery,0
90
+ speech,speaker separation,1
91
+ speech,speaker recognition,2
92
+ speech,speaker diarization,3
93
+ speech,speech enhancement,6
94
+ speech,distant speech recognition,7
95
+ speech,speech recognition,7
96
+ speech,speech synthesis,10
97
+ time-series,traffic prediction,0
98
+ time-series,time series analysis,0
99
+ time-series,data compression,0
100
+ time-series,video quality assessment,1
101
+ time-series,time series clustering,2
102
+ time-series,stock price prediction,2
103
+ time-series,stock market prediction,2
104
+ time-series,dynamic time warping,6
105
+ time-series,time series,8
assets/worst_tasks_with_hits.csv DELETED
@@ -1,107 +0,0 @@
1
- area,task,hits
2
- adversarial,inference attack,0
3
- adversarial,adversarial defense,2
4
- adversarial,data poisoning,2
5
- adversarial,adversarial attack,8
6
- audio,language identification,1
7
- audio,audio tagging,1
8
- audio,audio source separation,3
9
- audio,audio generation,4
10
- computer-code,code search,0
11
- computer-code,type prediction,0
12
- computer-code,program induction,1
13
- computer-code,text to sql,9
14
- computer-vision,code search,0
15
- computer-vision,document layout analysis,0
16
- computer-vision,mixed reality,0
17
- computer-vision,stereo lidar fusion,0
18
- computer-vision,multi view subspace clustering,0
19
- computer-vision,anomaly detection in surveillance videos,0
20
- computer-vision,activity prediction,0
21
- computer-vision,superpixels,0
22
- computer-vision,image morphing,0
23
- computer-vision,hyperspectral image classification,0
24
- graphs,image outpainting,0
25
- graphs,image relighting,0
26
- graphs,graph reconstruction,0
27
- graphs,graph partitioning,0
28
- graphs,graph property prediction,0
29
- graphs,graph structure learning,0
30
- graphs,graph learning,1
31
- graphs,knowledge base completion,1
32
- graphs,knowledge graph embeddings,2
33
- graphs,knowledge graph embedding,3
34
- knowledge-base,video to video synthesis,0
35
- knowledge-base,breast cancer detection,0
36
- knowledge-base,knowledge base completion,1
37
- medical,breast cancer detection,0
38
- medical,liver segmentation,0
39
- medical,seizure detection,0
40
- medical,brain decoding,0
41
- medical,disease prediction,0
42
- medical,epidemiology,0
43
- medical,medical relation extraction,0
44
- medical,ecg classification,0
45
- medical,pancreas segmentation,0
46
- medical,length of stay prediction,1
47
- methodology,multi label classification,0
48
- methodology,distributed optimization,0
49
- methodology,dictionary learning,0
50
- methodology,multi label text classification,0
51
- methodology,generalization bounds,0
52
- methodology,one class classifier,0
53
- methodology,automatic machine learning model selection,0
54
- methodology,inductive logic programming,0
55
- methodology,bilevel optimization,0
56
- methodology,l2 regularization,0
57
- miscellaneous,fault detection,0
58
- miscellaneous,gpr,0
59
- miscellaneous,counterfactual inference,0
60
- miscellaneous,brain decoding,0
61
- miscellaneous,protein structure prediction,0
62
- miscellaneous,total energy,0
63
- miscellaneous,seismic imaging,0
64
- miscellaneous,vulnerability detection,0
65
- miscellaneous,model discovery,1
66
- miscellaneous,age estimation,1
67
- music,music modeling,5
68
- natural-language-processing,conversational search,0
69
- natural-language-processing,document ranking,0
70
- natural-language-processing,joint entity and relation extraction,0
71
- natural-language-processing,self learning,0
72
- natural-language-processing,intent detection,0
73
- natural-language-processing,text categorization,0
74
- natural-language-processing,opinion mining,0
75
- natural-language-processing,linguistic acceptability,0
76
- natural-language-processing,cloze test,0
77
- natural-language-processing,zero shot cross lingual transfer,0
78
- playing-games,starcraft,0
79
- playing-games,acrobot,0
80
- playing-games,card games,1
81
- playing-games,real time strategy games,1
82
- playing-games,atari games,6
83
- playing-games,game of go,8
84
- playing-games,game of chess,9
85
- reasoning,math word problem solving,0
86
- reasoning,decision making,3
87
- robots,image outpainting,0
88
- robots,robotic grasping,0
89
- robots,trajectory planning,0
90
- robots,visual odometry,3
91
- robots,motion planning,3
92
- robots,vision and language navigation,4
93
- speech,dialogue generation,4
94
- speech,speech enhancement,4
95
- speech,speaker diarization,4
96
- speech,text to speech synthesis,5
97
- speech,speaker verification,9
98
- time-series,activity prediction,0
99
- time-series,math word problem solving,0
100
- time-series,stock trend prediction,0
101
- time-series,change point detection,0
102
- time-series,spatio temporal forecasting,0
103
- time-series,stock price prediction,0
104
- time-series,multivariate time series forecasting,1
105
- time-series,time series clustering,1
106
- time-series,portfolio optimization,1
107
- time-series,stock market prediction,1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
config.py ADDED
@@ -0,0 +1,4 @@
 
 
 
 
 
1
+ query_encoder_model_name = "lambdaofgod/query_nbow_embedder"
2
+ document_encoder_model_name = "lambdaofgod/document_nbow_embedder"
3
+ best_tasks_path="assets/best_tasks.csv"
4
+ worst_tasks_path="assets/worst_tasks.csv"
model_config.py DELETED
@@ -1,2 +0,0 @@
1
- query_encoder_model_name = "lambdaofgod/query_nbow_10_5000-15"
2
- document_encoder_model_name = "lambdaofgod/document_nbow_10_5000-15"
 
 
 
pages/1_Retrieval_App.py CHANGED
@@ -7,7 +7,7 @@ import sentence_transformers
7
  import streamlit as st
8
  from findkit import feature_extractors, indexes, retrieval_pipeline
9
  from toolz import partial
10
- import model_config
11
 
12
 
13
  def truncate_description(description, length=50):
@@ -145,7 +145,7 @@ def app_main(
145
 
146
 
147
  app_main(
148
- query_encoder_path=model_config.query_encoder_model_name,
149
- document_encoder_path=model_config.document_encoder_model_name,
150
  data_path="lambdaofgod/pwc_repositories_with_dependencies",
151
  )
 
7
  import streamlit as st
8
  from findkit import feature_extractors, indexes, retrieval_pipeline
9
  from toolz import partial
10
+ import config
11
 
12
 
13
  def truncate_description(description, length=50):
 
145
 
146
 
147
  app_main(
148
+ query_encoder_path=config.query_encoder_model_name,
149
+ document_encoder_path=config.document_encoder_model_name,
150
  data_path="lambdaofgod/pwc_repositories_with_dependencies",
151
  )
pages/2_Statistics.py CHANGED
@@ -1,10 +1,11 @@
1
  import pandas as pd
2
  import streamlit as st
 
3
 
4
- best_results_df = pd.read_csv("assets/best_tasks_with_hits.csv")
5
 
6
 
7
- worst_results_df = pd.read_csv("assets/worst_tasks_with_hits.csv")
8
 
9
  show_worst_best_statistics = st.sidebar.checkbox(
10
  label="show worst/best statistics grouped by area"
 
1
  import pandas as pd
2
  import streamlit as st
3
+ import config
4
 
5
+ best_results_df = pd.read_csv(config.best_tasks_path)
6
 
7
 
8
+ worst_results_df = pd.read_csv(config.worst_tasks_path)
9
 
10
  show_worst_best_statistics = st.sidebar.checkbox(
11
  label="show worst/best statistics grouped by area"