96abhishekarora
committed on
Commit
•
79be72d
1
Parent(s):
910707d
Updated model with better training and evaluation. Test and val data included as pickle files. Older Legacy files were removed to avoid confusion.
Browse files- .gitattributes +3 -41
- Information-Retrieval_evaluation_eval_results.csv +10 -0
- Information-Retrieval_evaluation_test_results.csv +6 -0
- README.md +1 -1
- config.json +1 -1
- eval/Information-Retrieval_evaluation_eval_results.csv +0 -0
- special_tokens_map.json +2 -2
- pytorch_model.bin → test_data.pickle +2 -2
- val_data.pickle +3 -0
.gitattributes
CHANGED
@@ -1,43 +1,5 @@
|
|
1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
-
pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
|
37 |
-
.git/lfs/objects/50/3c/503cf29c02ef5e01d945058baabbeba308c59511cca769786fda5a6ee595a66c filter=lfs diff=lfs merge=lfs -text
|
38 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
39 |
.git/lfs/objects/bd/17/bd176b01380930c75109b551bb5b5e3635b0a881683fc9be2cd1f0b1fb7da29c filter=lfs diff=lfs merge=lfs -text
|
40 |
-
.git/lfs/objects/
|
41 |
-
.
|
42 |
-
.
|
43 |
-
.git/lfs/objects/26/89/2689c2c4bb9f0ae4eed9047269fc0c28ce91c50f3e91e29c8932c4a8b765af72 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
2 |
.git/lfs/objects/bd/17/bd176b01380930c75109b551bb5b5e3635b0a881683fc9be2cd1f0b1fb7da29c filter=lfs diff=lfs merge=lfs -text
|
3 |
+
.git/lfs/objects/2a/12/2a1218c92154f764953c79f05c215b2b64682364ba9882d3bb51edabf3a1b827 filter=lfs diff=lfs merge=lfs -text
|
4 |
+
test_data.pickle filter=lfs diff=lfs merge=lfs -text
|
5 |
+
val_data.pickle filter=lfs diff=lfs merge=lfs -text
|
|
Information-Retrieval_evaluation_eval_results.csv
ADDED
@@ -0,0 +1,10 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.5724381625441696,0.8303886925795053,0.872791519434629,0.911660777385159,0.5724381625441696,0.5724381625441696,0.27679623085983507,0.8303886925795053,0.17455830388692575,0.872791519434629,0.09116607773851589,0.911660777385159,0.7069998317348142,0.757919293262377,0.7114810136344818
|
3 |
+
0,0,0.5724381625441696,0.8303886925795053,0.872791519434629,0.911660777385159,0.5724381625441696,0.5724381625441696,0.27679623085983507,0.8303886925795053,0.17455830388692575,0.872791519434629,0.09116607773851589,0.911660777385159,0.7069998317348142,0.757919293262377,0.7114810136344818
|
4 |
+
0,0,0.45889921372408865,0.629735525375268,0.6912080057183703,0.7919942816297355,0.45889921372408865,0.45889921372408865,0.20991184179175598,0.629735525375268,0.13824160114367404,0.6912080057183703,0.07919942816297354,0.7919942816297355,0.561284137195503,0.6163014164506035,0.5699982588123317
|
5 |
+
0,0,0.45889921372408865,0.629735525375268,0.6912080057183703,0.7919942816297355,0.45889921372408865,0.45889921372408865,0.20991184179175598,0.629735525375268,0.13824160114367404,0.6912080057183703,0.07919942816297354,0.7919942816297355,0.561284137195503,0.6163014164506035,0.5699982588123317
|
6 |
+
0,0,0.45889921372408865,0.629735525375268,0.6912080057183703,0.7919942816297355,0.45889921372408865,0.45889921372408865,0.20991184179175598,0.629735525375268,0.13824160114367404,0.6912080057183703,0.07919942816297354,0.7919942816297355,0.561284137195503,0.6163014164506035,0.5699982588123317
|
7 |
+
0,0,0.45889921372408865,0.629735525375268,0.6912080057183703,0.7919942816297355,0.45889921372408865,0.45889921372408865,0.20991184179175598,0.629735525375268,0.13824160114367404,0.6912080057183703,0.07919942816297354,0.7919942816297355,0.561284137195503,0.6163014164506035,0.5699982588123317
|
8 |
+
0,0,0.4753395282344532,0.6540385989992852,0.7326661901358112,0.8070050035739814,0.4753395282344532,0.4753395282344532,0.21801286633309508,0.6540385989992852,0.14653323802716223,0.7326661901358112,0.08070050035739812,0.8070050035739814,0.5827291602845585,0.6368435630051191,0.5905098783240487
|
9 |
+
0,0,0.4753395282344532,0.6540385989992852,0.7326661901358112,0.8070050035739814,0.4753395282344532,0.4753395282344532,0.21801286633309508,0.6540385989992852,0.14653323802716223,0.7326661901358112,0.08070050035739812,0.8070050035739814,0.5827291602845585,0.6368435630051191,0.5905098783240487
|
10 |
+
0,0,0.45889921372408865,0.629735525375268,0.6912080057183703,0.7919942816297355,0.45889921372408865,0.45889921372408865,0.20991184179175598,0.629735525375268,0.13824160114367404,0.6912080057183703,0.07919942816297354,0.7919942816297355,0.561284137195503,0.6163014164506035,0.5699982588123317
|
Information-Retrieval_evaluation_test_results.csv
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.9573333333333334,0.9866666666666667,0.9973333333333333,1.0,0.9573333333333334,0.9573333333333334,0.3288888888888889,0.9866666666666667,0.19946666666666663,0.9973333333333333,0.09999999999999998,1.0,0.9745555555555556,0.9809265830527836,0.9745555555555555
|
3 |
+
0,0,0.9546666666666667,0.9893333333333333,0.9973333333333333,1.0,0.9546666666666667,0.9546666666666667,0.32977777777777784,0.9893333333333333,0.19946666666666663,0.9973333333333333,0.09999999999999998,1.0,0.9734444444444444,0.9801272582407785,0.9734444444444443
|
4 |
+
0,0,0.8289902280130294,0.9543973941368078,0.9788273615635179,0.990228013029316,0.8289902280130294,0.8289902280130294,0.3181324647122693,0.9543973941368078,0.19576547231270355,0.9788273615635179,0.09902280130293159,0.990228013029316,0.8929153094462541,0.9172870124572965,0.8936588316677894
|
5 |
+
0,0,0.8289902280130294,0.9560260586319218,0.9771986970684039,0.99185667752443,0.8289902280130294,0.8289902280130294,0.3186753528773073,0.9560260586319218,0.19543973941368073,0.9771986970684039,0.09918566775244299,0.99185667752443,0.8928293521534562,0.9174937140784137,0.8935326390945282
|
6 |
+
0,0,0.8485342019543974,0.9560260586319218,0.9788273615635179,0.99185667752443,0.8485342019543974,0.8485342019543974,0.3186753528773073,0.9560260586319218,0.19576547231270355,0.9788273615635179,0.09918566775244299,0.99185667752443,0.9050533840028954,0.9266706066970336,0.9057234522625403
|
README.md
CHANGED
@@ -10,7 +10,7 @@ tags:
|
|
10 |
|
11 |
---
|
12 |
|
13 |
-
#
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model; it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
|
|
10 |
|
11 |
---
|
12 |
|
13 |
+
# {MODEL_NAME}
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model; it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "sentence-transformers/multi-qa-mpnet-base-dot-v1",
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
eval/Information-Retrieval_evaluation_eval_results.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
CHANGED
@@ -9,7 +9,7 @@
|
|
9 |
"cls_token": {
|
10 |
"content": "<s>",
|
11 |
"lstrip": false,
|
12 |
-
"normalized":
|
13 |
"rstrip": false,
|
14 |
"single_word": false
|
15 |
},
|
@@ -37,7 +37,7 @@
|
|
37 |
"sep_token": {
|
38 |
"content": "</s>",
|
39 |
"lstrip": false,
|
40 |
-
"normalized":
|
41 |
"rstrip": false,
|
42 |
"single_word": false
|
43 |
},
|
|
|
9 |
"cls_token": {
|
10 |
"content": "<s>",
|
11 |
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
"rstrip": false,
|
14 |
"single_word": false
|
15 |
},
|
|
|
37 |
"sep_token": {
|
38 |
"content": "</s>",
|
39 |
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
"rstrip": false,
|
42 |
"single_word": false
|
43 |
},
|
pytorch_model.bin → test_data.pickle
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01ca36406ff9a66f7eb69641c5ff9bc16adb0f521bdd43510fc8971821846980
|
3 |
+
size 71802
|
val_data.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:201eeb8bf97f7d77ce923b8cfccd5bad6023d15532393c3fc315de2a764f2766
|
3 |
+
size 443286
|