jeongsk committed on
Commit
5480786
1 Parent(s): 74e9aa3

Add benchmark data and resources for evaluation

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. .gitattributes +1 -0
  2. evaluator/benchmark/0/config.yaml +22 -0
  3. evaluator/benchmark/0/retrieve_node_line/retrieval/0.parquet +3 -0
  4. evaluator/benchmark/0/retrieve_node_line/retrieval/1.parquet +3 -0
  5. evaluator/benchmark/0/retrieve_node_line/retrieval/10.parquet +3 -0
  6. evaluator/benchmark/0/retrieve_node_line/retrieval/11.parquet +3 -0
  7. evaluator/benchmark/0/retrieve_node_line/retrieval/12.parquet +3 -0
  8. evaluator/benchmark/0/retrieve_node_line/retrieval/13.parquet +3 -0
  9. evaluator/benchmark/0/retrieve_node_line/retrieval/14.parquet +3 -0
  10. evaluator/benchmark/0/retrieve_node_line/retrieval/15.parquet +3 -0
  11. evaluator/benchmark/0/retrieve_node_line/retrieval/16.parquet +3 -0
  12. evaluator/benchmark/0/retrieve_node_line/retrieval/17.parquet +3 -0
  13. evaluator/benchmark/0/retrieve_node_line/retrieval/18.parquet +3 -0
  14. evaluator/benchmark/0/retrieve_node_line/retrieval/19.parquet +3 -0
  15. evaluator/benchmark/0/retrieve_node_line/retrieval/2.parquet +3 -0
  16. evaluator/benchmark/0/retrieve_node_line/retrieval/20.parquet +3 -0
  17. evaluator/benchmark/0/retrieve_node_line/retrieval/21.parquet +3 -0
  18. evaluator/benchmark/0/retrieve_node_line/retrieval/22.parquet +3 -0
  19. evaluator/benchmark/0/retrieve_node_line/retrieval/23.parquet +3 -0
  20. evaluator/benchmark/0/retrieve_node_line/retrieval/24.parquet +3 -0
  21. evaluator/benchmark/0/retrieve_node_line/retrieval/25.parquet +3 -0
  22. evaluator/benchmark/0/retrieve_node_line/retrieval/26.parquet +3 -0
  23. evaluator/benchmark/0/retrieve_node_line/retrieval/27.parquet +3 -0
  24. evaluator/benchmark/0/retrieve_node_line/retrieval/28.parquet +3 -0
  25. evaluator/benchmark/0/retrieve_node_line/retrieval/29.parquet +3 -0
  26. evaluator/benchmark/0/retrieve_node_line/retrieval/3.parquet +3 -0
  27. evaluator/benchmark/0/retrieve_node_line/retrieval/30.parquet +3 -0
  28. evaluator/benchmark/0/retrieve_node_line/retrieval/31.parquet +3 -0
  29. evaluator/benchmark/0/retrieve_node_line/retrieval/32.parquet +3 -0
  30. evaluator/benchmark/0/retrieve_node_line/retrieval/33.parquet +3 -0
  31. evaluator/benchmark/0/retrieve_node_line/retrieval/4.parquet +3 -0
  32. evaluator/benchmark/0/retrieve_node_line/retrieval/5.parquet +3 -0
  33. evaluator/benchmark/0/retrieve_node_line/retrieval/6.parquet +3 -0
  34. evaluator/benchmark/0/retrieve_node_line/retrieval/7.parquet +3 -0
  35. evaluator/benchmark/0/retrieve_node_line/retrieval/8.parquet +3 -0
  36. evaluator/benchmark/0/retrieve_node_line/retrieval/9.parquet +3 -0
  37. evaluator/benchmark/0/retrieve_node_line/retrieval/best_20.parquet +3 -0
  38. evaluator/benchmark/0/retrieve_node_line/retrieval/summary.csv +35 -0
  39. evaluator/benchmark/0/retrieve_node_line/summary.csv +2 -0
  40. evaluator/benchmark/0/summary.csv +2 -0
  41. evaluator/benchmark/data/corpus.parquet +3 -0
  42. evaluator/benchmark/data/qa.parquet +3 -0
  43. evaluator/benchmark/resources/bm25_porter_stemmer.pkl +3 -0
  44. evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/data_level0.bin +3 -0
  45. evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/header.bin +3 -0
  46. evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/length.bin +3 -0
  47. evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/link_lists.bin +0 -0
  48. evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/data_level0.bin +3 -0
  49. evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/header.bin +3 -0
  50. evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/length.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.sqlite3 filter=lfs diff=lfs merge=lfs -text
evaluator/benchmark/0/config.yaml ADDED
@@ -0,0 +1,22 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ node_lines:
2
+ - node_line_name: retrieve_node_line
3
+ nodes:
4
+ - node_type: retrieval
5
+ strategy:
6
+ metrics: [ retrieval_f1, retrieval_recall, retrieval_precision, retrieval_ndcg, retrieval_map, retrieval_mrr ]
7
+ top_k: 4
8
+ modules:
9
+ - module_type: bm25
10
+ - module_type: vectordb
11
+ embedding_model: [ huggingface_baai_llm_embedder, huggingface_baai_bge_large_en, huggingface_baai_bge_small_en, huggingface_baai_bge_base_en ]
12
+ - module_type: hybrid_rrf
13
+ - module_type: hybrid_cc
14
+ normalize_method: [ mm, tmm, z, dbsf ]
15
+ weight_range:
16
+ - (0.0, 1.0)
17
+ - (0.3, 0.7)
18
+ - (0.4, 0.6)
19
+ - (0.5, 0.5)
20
+ - (0.6, 0.4)
21
+ - (0.7, 0.3)
22
+ - (1.0, 0.0)
evaluator/benchmark/0/retrieve_node_line/retrieval/0.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1dcc2aa9409c10cf86bc8640a53f60f025b8244ac0dc0ccb2cd470164c74fc0
3
+ size 154884
evaluator/benchmark/0/retrieve_node_line/retrieval/1.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa788938151f2cacc4744ff38f94918e41d50f72cee3c62dea241973d6a57ce6
3
+ size 185025
evaluator/benchmark/0/retrieve_node_line/retrieval/10.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd67333092309a8e451a835560b7658e358815761e5f1a4d8f86e1e24a201b4f
3
+ size 196661
evaluator/benchmark/0/retrieve_node_line/retrieval/11.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3399de5ad6d629bca3adf7bc896ff8cb96f365f304bf4399771560b4ef0dce0
3
+ size 196560
evaluator/benchmark/0/retrieve_node_line/retrieval/12.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a101ffce50e0cec9a95ce5bcea81aa1c622af85833d83d243c0de8d050f15f5b
3
+ size 203865
evaluator/benchmark/0/retrieve_node_line/retrieval/13.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bb30483713517a6e1172bc820dde30e8dbe026888240633309d94d0f2ac0f05
3
+ size 184139
evaluator/benchmark/0/retrieve_node_line/retrieval/14.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68691107ae8a83b6022d0f5cab704f9e46c0f8717251a0f83734fc86e269a1c0
3
+ size 195569
evaluator/benchmark/0/retrieve_node_line/retrieval/15.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f0c0d80671b841e6ff6e8d845b586adff5abc5825edb4b2f1389d505076bbca
3
+ size 193253
evaluator/benchmark/0/retrieve_node_line/retrieval/16.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21520619a480e02c71960302ee76821bdc2fe4a72be8beacb697002205e5092d
3
+ size 193201
evaluator/benchmark/0/retrieve_node_line/retrieval/17.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d630e5ff5b5185482724410537089f78ec7e1f3bf2e241a0ec15f1253e53793
3
+ size 184231
evaluator/benchmark/0/retrieve_node_line/retrieval/18.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fb562258f9d9c78524bf90b794ea2209781a84ede3932e0cfc2cc3e0f50a400
3
+ size 185386
evaluator/benchmark/0/retrieve_node_line/retrieval/19.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c18164fd827461cdbe6e6cdf8c6c5f150aa00fcec733f703aab4a03f07f95b95
3
+ size 185594
evaluator/benchmark/0/retrieve_node_line/retrieval/2.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a960852fce12c1ec989bf69c8d49d3084e678d3ab85184a48ea04250b7982e7
3
+ size 200433
evaluator/benchmark/0/retrieve_node_line/retrieval/20.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c88e47dcfe1670460e76cca3a44d375bb27f21521568b3dab51ef44fc793aed1
3
+ size 200974
evaluator/benchmark/0/retrieve_node_line/retrieval/21.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0248ddc7edc82fdaa01bec95926c78ee20e5ce91f8b29b46ad85ea2cbe1e8dd4
3
+ size 189141
evaluator/benchmark/0/retrieve_node_line/retrieval/22.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:551bb93fff3e78b5d4b87a243a6185eb57aa39d9b8306405a5176497de993ed6
3
+ size 191912
evaluator/benchmark/0/retrieve_node_line/retrieval/23.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3a88b00111b8b9979c5b200fceffd5dd51939b9dcabca663989f2b73b0a3a8
3
+ size 191838
evaluator/benchmark/0/retrieve_node_line/retrieval/24.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1db82fceda63866571614e4dc7268d4278752a4f5ef552ad0ccf9c6383a40f44
3
+ size 198913
evaluator/benchmark/0/retrieve_node_line/retrieval/25.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bec39ad8f10dbd0398277fe43f34f3ff5b40f600100dfca8eef4e78f9e9d0232
3
+ size 192550
evaluator/benchmark/0/retrieve_node_line/retrieval/26.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e9ede0b278f99d95da4d6674df50d4fa95deddab0571c826db01bdbdb4f43f2
3
+ size 192512
evaluator/benchmark/0/retrieve_node_line/retrieval/27.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26c1fdadb71467d2e2b3704dfc0f273767c6d2f0101d919996054d7ca6270ebc
3
+ size 196818
evaluator/benchmark/0/retrieve_node_line/retrieval/28.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6da9d46006f5f12aba49d9d3590c1f91c60308586268dcefa726dc064aa404f3
3
+ size 197812
evaluator/benchmark/0/retrieve_node_line/retrieval/29.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d452a46688c8f5d990826e13d50eede5214ee3959fd408cc4abccc52d6413a7
3
+ size 197442
evaluator/benchmark/0/retrieve_node_line/retrieval/3.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1486d5104d4452609935053fd1700cb53365dfbb45de942b569ba29a09c0e73
3
+ size 186242
evaluator/benchmark/0/retrieve_node_line/retrieval/30.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1d452a46688c8f5d990826e13d50eede5214ee3959fd408cc4abccc52d6413a7
3
+ size 197442
evaluator/benchmark/0/retrieve_node_line/retrieval/31.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ca7f7e5b93036f4386a6c9505f28dcad7e466f0eb1c291b1fb108e6ae222222
3
+ size 193507
evaluator/benchmark/0/retrieve_node_line/retrieval/32.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94cbf69631d25a975e9cc786f6a430f762ab710320004ad9a30693cc2a947eb0
3
+ size 193513
evaluator/benchmark/0/retrieve_node_line/retrieval/33.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6414740f884f8d8d58b55835bc47113616254523d374dca5dd39d8e81dfc031a
3
+ size 197743
evaluator/benchmark/0/retrieve_node_line/retrieval/4.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a2850bbc6f1aa63cf6117d6ea507e10c690652d3344bd12c7226c472b31d127
3
+ size 184065
evaluator/benchmark/0/retrieve_node_line/retrieval/5.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f325b0de2c7938d5dae6be278a8c0cc82c4ae579fc33642e0d3155872a26dea
3
+ size 192569
evaluator/benchmark/0/retrieve_node_line/retrieval/6.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ba75d44fad9a8635b93287f3a67b4f4edf4ec5de203521c030d64189db028f3
3
+ size 197404
evaluator/benchmark/0/retrieve_node_line/retrieval/7.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b616c6210ced6ef790b44de6e3cc2d36ea0029b291a7dea670cfc0808f97c7a0
3
+ size 195581
evaluator/benchmark/0/retrieve_node_line/retrieval/8.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae4da4e643df4d5eead4b39173f51b762ece7aeb19ffb867dd1aacc21a59b5bf
3
+ size 196574
evaluator/benchmark/0/retrieve_node_line/retrieval/9.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e940f028f64f11e8e88c30aeee00446bf364ef57dce2b2714d90e2489b2a15f
3
+ size 196593
evaluator/benchmark/0/retrieve_node_line/retrieval/best_20.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3400ba5791411c6966019e6d314d880a0c3c0a923794e20a9fa82ea462dc7f6f
3
+ size 224587
evaluator/benchmark/0/retrieve_node_line/retrieval/summary.csv ADDED
@@ -0,0 +1,35 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ filename,module_name,module_params,execution_time,retrieval_f1,retrieval_recall,retrieval_precision,retrieval_ndcg,retrieval_map,retrieval_mrr,is_best
2
+ 0.parquet,vectordb,"{'top_k': 4, 'embedding_model': 'huggingface_baai_llm_embedder'}",0.10266771121900908,0.33469387755102037,0.8367346938775511,0.20918367346938777,0.36869311025075513,0.2193877551020408,0.2193877551020408,False
3
+ 1.parquet,vectordb,"{'top_k': 4, 'embedding_model': 'huggingface_baai_bge_small_en'}",0.05651242878972268,0.3510204081632653,0.8775510204081632,0.2193877551020408,0.39380379111963937,0.23979591836734693,0.23979591836734693,False
4
+ 2.parquet,vectordb,"{'top_k': 4, 'embedding_model': 'huggingface_baai_bge_base_en'}",0.04421803902606575,0.35918367346938773,0.8979591836734694,0.22448979591836735,0.4134387442347614,0.2585034013605442,0.2585034013605442,False
5
+ 3.parquet,vectordb,"{'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}",0.06927850295086296,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.4241010511081391,0.2534013605442177,0.2534013605442177,False
6
+ 4.parquet,bm25,{'top_k': 4},0.0012699779199094189,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.949463653352772,0.9387755102040817,0.9387755102040817,False
7
+ 5.parquet,hybrid_rrf,"{'top_k': 4, 'weight': 4.0, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.8775884408353242,0.8418367346938775,0.8418367346938775,False
8
+ 6.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.0, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.949463653352772,0.9387755102040817,0.9387755102040817,False
9
+ 7.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.5, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3755102040816326,0.9387755102040817,0.23469387755102042,0.5996385342755705,0.4812925170068027,0.4812925170068027,False
10
+ 8.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.42000000000000004, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9174366443338617,0.9030612244897959,0.9030612244897959,False
11
+ 9.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.4, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9174366443338617,0.9030612244897959,0.9030612244897959,False
12
+ 10.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.3, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9365875359329464,0.9285714285714286,0.9285714285714286,False
13
+ 11.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.3559999999999999, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9365875359329464,0.9285714285714286,0.9285714285714286,False
14
+ 12.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'mm', 'weight': 0.09999999999999998, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.949463653352772,0.9387755102040817,0.9387755102040817,False
15
+ 13.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.14, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9543236634110799,0.945578231292517,0.945578231292517,False
16
+ 14.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.5, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.8639391132653145,0.8231292517006802,0.8231292517006802,False
17
+ 15.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.42200000000000004, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9317275258746386,0.9149659863945577,0.9149659863945577,False
18
+ 16.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.41800000000000004, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9317275258746386,0.9149659863945577,0.9149659863945577,False
19
+ 17.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.3, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9543236634110799,0.945578231292517,0.945578231292517,False
20
+ 18.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.33599999999999997, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9543236634110799,0.945578231292517,0.945578231292517,False
21
+ 19.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'dbsf', 'weight': 0.32999999999999996, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9543236634110799,0.945578231292517,0.945578231292517,False
22
+ 20.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.29, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9720597908892135,0.9693877551020408,0.9693877551020408,True
23
+ 21.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.5, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9453768534446483,0.9336734693877551,0.9336734693877551,False
24
+ 22.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.41600000000000004, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.949463653352772,0.9387755102040817,0.9387755102040817,False
25
+ 23.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.4, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.949463653352772,0.9387755102040817,0.9387755102040817,False
26
+ 24.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.3, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9720597908892135,0.9693877551020408,0.9693877551020408,False
27
+ 25.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.36799999999999994, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9720597908892135,0.9693877551020408,0.9693877551020408,False
28
+ 26.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.36, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9720597908892135,0.9693877551020408,0.9693877551020408,False
29
+ 27.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.0, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9453768534446483,0.9336734693877551,0.9336734693877551,False
30
+ 28.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.5, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3591836734693878,0.8979591836734694,0.22448979591836735,0.49794101393666546,0.3673469387755102,0.3673469387755102,False
31
+ 29.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.4, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.8080328587684287,0.7568027210884353,0.7568027210884353,False
32
+ 30.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.4, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.8080328587684287,0.7568027210884353,0.7568027210884353,False
33
+ 31.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.3, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9182098544840458,0.9047619047619047,0.9047619047619047,False
34
+ 32.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.33999999999999997, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.38367346938775504,0.9591836734693877,0.23979591836734693,0.9182098544840458,0.9047619047619047,0.9047619047619047,False
35
+ 33.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'z', 'weight': 0.08999999999999997, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.07054848087077238,0.3918367346938775,0.9795918367346939,0.24489795918367346,0.9453768534446483,0.9336734693877551,0.9336734693877551,False
evaluator/benchmark/0/retrieve_node_line/summary.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ node_type,best_module_filename,best_module_name,best_module_params,best_execution_time
2
+ retrieval,20.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.29, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.0705484808707723
evaluator/benchmark/0/summary.csv ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ node_line_name,node_type,best_module_filename,best_module_name,best_module_params,best_execution_time
2
+ retrieve_node_line,retrieval,20.parquet,hybrid_cc,"{'top_k': 4, 'normalize_method': 'tmm', 'weight': 0.29, 'target_modules': ('vectordb', 'bm25'), 'target_module_params': ({'top_k': 4, 'embedding_model': 'huggingface_baai_bge_large_en'}, {'top_k': 4})}",0.0705484808707723
evaluator/benchmark/data/corpus.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:886c49f338b3f80e49b45d0a73402fc50692eb715f4b8ecf630e5cf42c55b4f7
3
+ size 264035
evaluator/benchmark/data/qa.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:606e9857fa2cb540426286434460231a20f938651b98c552efe7c349c8f1fcd1
3
+ size 20147
evaluator/benchmark/resources/bm25_porter_stemmer.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d49edb8f5b6c8e51e018c101628409abe2c82d2b976a0e973fe2aaa637a01f3d
3
+ size 215345
evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/data_level0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a13e72541800c513c73dccea69f79e39cf4baef4fa23f7e117c0d6b0f5f99670
3
+ size 3212000
evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/header.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec6df10978b056a10062ed99efeef2702fa4a1301fad702b53dd2517103c746
3
+ size 100
evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/length.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc19b1997119425765295aeab72d76faa6927d4f83985d328c26f20468d6cc76
3
+ size 4000
evaluator/benchmark/resources/chroma/50ae74e0-6e8d-43bd-af92-fbefa828e7c1/link_lists.bin ADDED
File without changes
evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/data_level0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a13e72541800c513c73dccea69f79e39cf4baef4fa23f7e117c0d6b0f5f99670
3
+ size 3212000
evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/header.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ec6df10978b056a10062ed99efeef2702fa4a1301fad702b53dd2517103c746
3
+ size 100
evaluator/benchmark/resources/chroma/5cdc4426-9cf3-4176-aa91-2f9940af5fa7/length.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc19b1997119425765295aeab72d76faa6927d4f83985d328c26f20468d6cc76
3
+ size 4000