96abhishekarora
committed on
Commit
·
d7282fd
1
Parent(s):
fa6fe3c
Updated model with better training and evaluation. Test and val data included as pickle files. Older Legacy files were removed to avoid confusion.
Browse files- .gitattributes +3 -41
- Information-Retrieval_evaluation_eval_results.csv +12 -0
- Information-Retrieval_evaluation_test_results.csv +6 -0
- README.md +1 -1
- config.json +1 -1
- eval/Information-Retrieval_evaluation_eval_results.csv +0 -0
- special_tokens_map.json +2 -2
- pytorch_model.bin → test_data.pickle +2 -2
- val_data.pickle +3 -0
.gitattributes
CHANGED
@@ -1,43 +1,5 @@
|
|
1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
-
pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
|
37 |
-
.git/lfs/objects/b9/11/b911c3e2edc66fc22baf3a41faa6ecd12dd7a79455502a652e5001a279b7f15f filter=lfs diff=lfs merge=lfs -text
|
38 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
|
39 |
.git/lfs/objects/36/ca/36caa36e14df19a70caed556f433229d251ce8402b77e85b5147c3188d23de80 filter=lfs diff=lfs merge=lfs -text
|
40 |
-
.
|
41 |
-
.
|
42 |
-
.git/lfs/objects/33/3c/333cf8c7c098370c3631b0b33ba6d007a4b89e5b5f0e4b01d75bb5a200fecd27 filter=lfs diff=lfs merge=lfs -text
|
43 |
-
.git/lfs/objects/f8/dd/f8ddd74f6db9899ea59ba31258f3d1ef2bc610c289a535c6f2a3d1a204065faa filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
2 |
+
.git/lfs/objects/c2/28/c2283afe3337976a32efe44a79e065aa6f81371ef9d77ee94f0ba681bb40bc05 filter=lfs diff=lfs merge=lfs -text
|
3 |
.git/lfs/objects/36/ca/36caa36e14df19a70caed556f433229d251ce8402b77e85b5147c3188d23de80 filter=lfs diff=lfs merge=lfs -text
|
4 |
+
test_data.pickle filter=lfs diff=lfs merge=lfs -text
|
5 |
+
val_data.pickle filter=lfs diff=lfs merge=lfs -text
|
|
|
|
Information-Retrieval_evaluation_eval_results.csv
ADDED
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.7430910951893551,0.8863868986693961,0.9150460593654043,0.9713408393039918,0.7430910951893551,0.7430910951893551,0.29546229955646536,0.8863868986693961,0.18300921187308086,0.9150460593654043,0.09713408393039918,0.9713408393039918,0.8213185001056036,0.8575851944745084,0.8233771807496896
|
3 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
4 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
5 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
6 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
7 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
8 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
9 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
10 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
11 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
12 |
+
0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
|
Information-Retrieval_evaluation_test_results.csv
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.8670886075949367,0.9746835443037974,0.9810126582278481,0.9978902953586498,0.8670886075949367,0.8670886075949367,0.32489451476793246,0.9746835443037974,0.19620253164556964,0.9810126582278481,0.09978902953586499,0.9978902953586498,0.9227923447860157,0.9416311386929686,0.922909550599424
|
3 |
+
0,0,0.7953586497890295,0.9725738396624473,0.9873417721518988,1.0,0.7953586497890295,0.7953586497890295,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8854606188466945,0.9144827706487932,0.8854606188466949
|
4 |
+
0,0,0.7890295358649789,0.9725738396624473,0.9873417721518988,1.0,0.7890295358649789,0.7890295358649789,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8824777308954521,0.9123013400185618,0.8824777308954525
|
5 |
+
0,0,0.7953586497890295,0.9725738396624473,0.9873417721518988,1.0,0.7953586497890295,0.7953586497890295,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8854313173933424,0.9144523173130932,0.8854313173933427
|
6 |
+
0,0,0.8037974683544303,0.9662447257383966,0.9810126582278481,1.0,0.8037974683544303,0.8037974683544303,0.3220815752461321,0.9662447257383966,0.19620253164556964,0.9810126582278481,0.1,1.0,0.8887616368629027,0.9167893473515547,0.8887616368629027
|
README.md
CHANGED
@@ -10,7 +10,7 @@ tags:
|
|
10 |
|
11 |
---
|
12 |
|
13 |
-
#
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a sentence transformer ([sentence-transformers](https://www.SBERT.net)) model - it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
|
|
10 |
|
11 |
---
|
12 |
|
13 |
+
# {MODEL_NAME}
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a sentence transformer ([sentence-transformers](https://www.SBERT.net)) model - it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "sentence-transformers/multi-qa-mpnet-base-dot-v1",
|
3 |
"architectures": [
|
4 |
"MPNetModel"
|
5 |
],
|
eval/Information-Retrieval_evaluation_eval_results.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
CHANGED
@@ -9,7 +9,7 @@
|
|
9 |
"cls_token": {
|
10 |
"content": "<s>",
|
11 |
"lstrip": false,
|
12 |
-
"normalized":
|
13 |
"rstrip": false,
|
14 |
"single_word": false
|
15 |
},
|
@@ -37,7 +37,7 @@
|
|
37 |
"sep_token": {
|
38 |
"content": "</s>",
|
39 |
"lstrip": false,
|
40 |
-
"normalized":
|
41 |
"rstrip": false,
|
42 |
"single_word": false
|
43 |
},
|
|
|
9 |
"cls_token": {
|
10 |
"content": "<s>",
|
11 |
"lstrip": false,
|
12 |
+
"normalized": true,
|
13 |
"rstrip": false,
|
14 |
"single_word": false
|
15 |
},
|
|
|
37 |
"sep_token": {
|
38 |
"content": "</s>",
|
39 |
"lstrip": false,
|
40 |
+
"normalized": true,
|
41 |
"rstrip": false,
|
42 |
"single_word": false
|
43 |
},
|
pytorch_model.bin → test_data.pickle
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:695abd81d511020f8ee47022621c797f0b3823e61666d2374a3a50be7783bc64
|
3 |
+
size 53221
|
val_data.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51f67c116c521e3cf6e91c654a1b5ab34d9db1aba72360aef8f8f487448ed98e
|
3 |
+
size 400808
|