96abhishekarora commited on
Commit
d7282fd
·
1 Parent(s): fa6fe3c

Updated model with better training and evaluation. Test and validation data are included as pickle files. Older legacy files were removed to avoid confusion.

Browse files
.gitattributes CHANGED
@@ -1,43 +1,5 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
36
- pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
37
- .git/lfs/objects/b9/11/b911c3e2edc66fc22baf3a41faa6ecd12dd7a79455502a652e5001a279b7f15f filter=lfs diff=lfs merge=lfs -text
38
  model.safetensors filter=lfs diff=lfs merge=lfs -text
 
39
  .git/lfs/objects/36/ca/36caa36e14df19a70caed556f433229d251ce8402b77e85b5147c3188d23de80 filter=lfs diff=lfs merge=lfs -text
40
- .git/lfs/objects/b9/59/b95969fa605d6c02eb71edd39b5268279900f24fbe5de0f2f35dafc5774c42a6 filter=lfs diff=lfs merge=lfs -text
41
- .git/lfs/objects/6d/b2/6db2a87329f5e868fe4b536e2cb9bc2aa144ce11680bfd0a7d30b97f5205911d filter=lfs diff=lfs merge=lfs -text
42
- .git/lfs/objects/33/3c/333cf8c7c098370c3631b0b33ba6d007a4b89e5b5f0e4b01d75bb5a200fecd27 filter=lfs diff=lfs merge=lfs -text
43
- .git/lfs/objects/f8/dd/f8ddd74f6db9899ea59ba31258f3d1ef2bc610c289a535c6f2a3d1a204065faa filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  model.safetensors filter=lfs diff=lfs merge=lfs -text
2
+ .git/lfs/objects/c2/28/c2283afe3337976a32efe44a79e065aa6f81371ef9d77ee94f0ba681bb40bc05 filter=lfs diff=lfs merge=lfs -text
3
  .git/lfs/objects/36/ca/36caa36e14df19a70caed556f433229d251ce8402b77e85b5147c3188d23de80 filter=lfs diff=lfs merge=lfs -text
4
+ test_data.pickle filter=lfs diff=lfs merge=lfs -text
5
+ val_data.pickle filter=lfs diff=lfs merge=lfs -text
 
 
Information-Retrieval_evaluation_eval_results.csv ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,0,0.7430910951893551,0.8863868986693961,0.9150460593654043,0.9713408393039918,0.7430910951893551,0.7430910951893551,0.29546229955646536,0.8863868986693961,0.18300921187308086,0.9150460593654043,0.09713408393039918,0.9713408393039918,0.8213185001056036,0.8575851944745084,0.8233771807496896
3
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
4
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
5
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
6
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
7
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
8
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
9
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
10
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
11
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
12
+ 0,0,0.44319344933469806,0.6427840327533265,0.7236438075742068,0.827021494370522,0.44319344933469806,0.44319344933469806,0.21426134425110882,0.6427840327533265,0.14472876151484132,0.7236438075742068,0.0827021494370522,0.827021494370522,0.5663721954151841,0.628987972602642,0.5723712607178909
Information-Retrieval_evaluation_test_results.csv ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,0,0.8670886075949367,0.9746835443037974,0.9810126582278481,0.9978902953586498,0.8670886075949367,0.8670886075949367,0.32489451476793246,0.9746835443037974,0.19620253164556964,0.9810126582278481,0.09978902953586499,0.9978902953586498,0.9227923447860157,0.9416311386929686,0.922909550599424
3
+ 0,0,0.7953586497890295,0.9725738396624473,0.9873417721518988,1.0,0.7953586497890295,0.7953586497890295,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8854606188466945,0.9144827706487932,0.8854606188466949
4
+ 0,0,0.7890295358649789,0.9725738396624473,0.9873417721518988,1.0,0.7890295358649789,0.7890295358649789,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8824777308954521,0.9123013400185618,0.8824777308954525
5
+ 0,0,0.7953586497890295,0.9725738396624473,0.9873417721518988,1.0,0.7953586497890295,0.7953586497890295,0.32419127988748236,0.9725738396624473,0.1974683544303798,0.9873417721518988,0.1,1.0,0.8854313173933424,0.9144523173130932,0.8854313173933427
6
+ 0,0,0.8037974683544303,0.9662447257383966,0.9810126582278481,1.0,0.8037974683544303,0.8037974683544303,0.3220815752461321,0.9662447257383966,0.19620253164556964,0.9810126582278481,0.1,1.0,0.8887616368629027,0.9167893473515547,0.8887616368629027
README.md CHANGED
@@ -10,7 +10,7 @@ tags:
10
 
11
  ---
12
 
13
- # dell-research-harvard/lt-un-data-fine-industry-en
14
 
15
  This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this is a [sentence-transformers](https://www.SBERT.net) model; LinkTransformer just wraps around that class.
16
  It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
 
10
 
11
  ---
12
 
13
+ # dell-research-harvard/lt-un-data-fine-industry-en
14
 
15
  This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this is a [sentence-transformers](https://www.SBERT.net) model; LinkTransformer just wraps around that class.
16
  It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "models/linkage_un_data_en_fine_industry",
3
  "architectures": [
4
  "MPNetModel"
5
  ],
 
1
  {
2
+ "_name_or_path": "sentence-transformers/multi-qa-mpnet-base-dot-v1",
3
  "architectures": [
4
  "MPNetModel"
5
  ],
eval/Information-Retrieval_evaluation_eval_results.csv ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json CHANGED
@@ -9,7 +9,7 @@
9
  "cls_token": {
10
  "content": "<s>",
11
  "lstrip": false,
12
- "normalized": false,
13
  "rstrip": false,
14
  "single_word": false
15
  },
@@ -37,7 +37,7 @@
37
  "sep_token": {
38
  "content": "</s>",
39
  "lstrip": false,
40
- "normalized": false,
41
  "rstrip": false,
42
  "single_word": false
43
  },
 
9
  "cls_token": {
10
  "content": "<s>",
11
  "lstrip": false,
12
+ "normalized": true,
13
  "rstrip": false,
14
  "single_word": false
15
  },
 
37
  "sep_token": {
38
  "content": "</s>",
39
  "lstrip": false,
40
+ "normalized": true,
41
  "rstrip": false,
42
  "single_word": false
43
  },
pytorch_model.bin → test_data.pickle RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36caa36e14df19a70caed556f433229d251ce8402b77e85b5147c3188d23de80
3
- size 438009257
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:695abd81d511020f8ee47022621c797f0b3823e61666d2374a3a50be7783bc64
3
+ size 53221
val_data.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51f67c116c521e3cf6e91c654a1b5ab34d9db1aba72360aef8f8f487448ed98e
3
+ size 400808