96abhishekarora committed on
Commit
c262a06
1 Parent(s): bb9f12f

Updated model with better training and evaluation. Test and val data included as pickle files. Older Legacy files were removed to avoid confusion.

Browse files
.gitattributes CHANGED
@@ -1,42 +1,5 @@
1
- *.7z filter=lfs diff=lfs merge=lfs -text
2
- *.arrow filter=lfs diff=lfs merge=lfs -text
3
- *.bin filter=lfs diff=lfs merge=lfs -text
4
- *.bz2 filter=lfs diff=lfs merge=lfs -text
5
- *.ckpt filter=lfs diff=lfs merge=lfs -text
6
- *.ftz filter=lfs diff=lfs merge=lfs -text
7
- *.gz filter=lfs diff=lfs merge=lfs -text
8
- *.h5 filter=lfs diff=lfs merge=lfs -text
9
- *.joblib filter=lfs diff=lfs merge=lfs -text
10
- *.lfs.* filter=lfs diff=lfs merge=lfs -text
11
- *.mlmodel filter=lfs diff=lfs merge=lfs -text
12
- *.model filter=lfs diff=lfs merge=lfs -text
13
- *.msgpack filter=lfs diff=lfs merge=lfs -text
14
- *.npy filter=lfs diff=lfs merge=lfs -text
15
- *.npz filter=lfs diff=lfs merge=lfs -text
16
- *.onnx filter=lfs diff=lfs merge=lfs -text
17
- *.ot filter=lfs diff=lfs merge=lfs -text
18
- *.parquet filter=lfs diff=lfs merge=lfs -text
19
- *.pb filter=lfs diff=lfs merge=lfs -text
20
- *.pickle filter=lfs diff=lfs merge=lfs -text
21
- *.pkl filter=lfs diff=lfs merge=lfs -text
22
- *.pt filter=lfs diff=lfs merge=lfs -text
23
- *.pth filter=lfs diff=lfs merge=lfs -text
24
- *.rar filter=lfs diff=lfs merge=lfs -text
25
- *.safetensors filter=lfs diff=lfs merge=lfs -text
26
- saved_model/**/* filter=lfs diff=lfs merge=lfs -text
27
- *.tar.* filter=lfs diff=lfs merge=lfs -text
28
- *.tar filter=lfs diff=lfs merge=lfs -text
29
- *.tflite filter=lfs diff=lfs merge=lfs -text
30
- *.tgz filter=lfs diff=lfs merge=lfs -text
31
- *.wasm filter=lfs diff=lfs merge=lfs -text
32
- *.xz filter=lfs diff=lfs merge=lfs -text
33
- *.zip filter=lfs diff=lfs merge=lfs -text
34
- *.zst filter=lfs diff=lfs merge=lfs -text
35
- *tfevents* filter=lfs diff=lfs merge=lfs -text
36
- pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
37
- .git/lfs/objects/3e/02/3e02186ca2008bfd4ebb104de46ce9beba276ae45c453fedfaeda087cc99f02e filter=lfs diff=lfs merge=lfs -text
38
  model.safetensors filter=lfs diff=lfs merge=lfs -text
 
39
  .git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
40
- .git/lfs/objects/3f/07/3f07f428adbf03a3e7902665664f5dd6f342a6b6c7a2a47a7026772c48cb0e73 filter=lfs diff=lfs merge=lfs -text
41
- .git/lfs/objects/3d/42/3d42ebe4f358451d3fde5790fe6516dcd94dc0e5c0159c25ebfe679e11eab41d filter=lfs diff=lfs merge=lfs -text
42
- .git/lfs/objects/82/e8/82e8a4b706199c597b03c69c5184163d6bded50042bbb9e85f3928b2f5be3818 filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  model.safetensors filter=lfs diff=lfs merge=lfs -text
2
+ .git/lfs/objects/3e/6b/3e6bdbead621753c09514da26bdf850f9758533dfd9d599e6ee947c8daea59e4 filter=lfs diff=lfs merge=lfs -text
3
  .git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
4
+ test_data.pickle filter=lfs diff=lfs merge=lfs -text
5
+ val_data.pickle filter=lfs diff=lfs merge=lfs -text
 
Information-Retrieval_evaluation_eval_results.csv ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,0,0.7225806451612903,0.8580645161290322,0.9096774193548387,0.9419354838709677,0.7225806451612903,0.7161290322580646,0.2860215053763441,0.8516129032258064,0.18193548387096772,0.9032258064516129,0.09419354838709676,0.9354838709677419,0.7968433179723501,0.8271966295960388,0.7941603020635278
3
+ 0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
4
+ 0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
5
+ 0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
6
+ 0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
Information-Retrieval_evaluation_test_results.csv ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
2
+ 0,0,0.43214556482183475,0.654030831437958,0.7556229466767753,0.8660601465756886,0.43214556482183475,0.3960224195819343,0.22778198972285402,0.6125801773830585,0.16254738438210767,0.7189633801460943,0.0964619661359616,0.8379727908348076,0.5708841273852633,0.6230490170650043,0.5550214647187748
3
+ 0,0,0.7132075471698113,0.9075471698113208,0.9641509433962264,0.9943396226415094,0.7132075471698113,0.7132075471698113,0.30251572327044024,0.9075471698113208,0.19283018867924526,0.9641509433962264,0.09943396226415095,0.9943396226415094,0.8202126385145252,0.863367502871466,0.8205632189982911
4
+ 0,0,0.7056603773584905,0.9037735849056604,0.9547169811320755,0.9943396226415094,0.7056603773584905,0.7056603773584905,0.3012578616352201,0.9037735849056604,0.1909433962264151,0.9547169811320755,0.09943396226415095,0.9943396226415094,0.8155480682839175,0.8597937744367032,0.8159563688254032
5
+ 0,0,0.7188679245283018,0.9150943396226415,0.9641509433962264,0.9943396226415094,0.7188679245283018,0.7188679245283018,0.30503144654088044,0.9150943396226415,0.19283018867924526,0.9641509433962264,0.09943396226415095,0.9943396226415094,0.8241719077568133,0.8663694271169878,0.8245394331184973
README.md CHANGED
@@ -10,7 +10,7 @@ tags:
10
 
11
  ---
12
 
13
- # dell-research-harvard/lt-un-data-fine-industry-es
14
 
15
  This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model; it just wraps around the class.
16
  It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
 
10
 
11
  ---
12
 
13
+ # {MODEL_NAME}
14
 
15
  This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model; it just wraps around the class.
16
  It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "models/linkage_un_data_es_fine_industry",
3
  "architectures": [
4
  "BertModel"
5
  ],
 
1
  {
2
+ "_name_or_path": "hiiamsid/sentence_similarity_spanish_es",
3
  "architectures": [
4
  "BertModel"
5
  ],
eval/Information-Retrieval_evaluation_eval_results.csv ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json CHANGED
@@ -1,37 +1,7 @@
1
  {
2
- "cls_token": {
3
- "content": "[CLS]",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "mask_token": {
10
- "content": "[MASK]",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "sep_token": {
24
- "content": "[SEP]",
25
- "lstrip": false,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- },
30
- "unk_token": {
31
- "content": "[UNK]",
32
- "lstrip": false,
33
- "normalized": false,
34
- "rstrip": false,
35
- "single_word": false
36
- }
37
  }
 
1
  {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
pytorch_model.bin → test_data.pickle RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f
3
- size 439467497
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:258a6afd4ec0a61ce7ba4d9c64eaacba49cc242d396981ac6224dd00efc5c5e6
3
+ size 68516
val_data.pickle ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e1fb31aaa096101bf8cb0a320022e521d1d021cae177a11ea143ff78ecfaf71
3
+ size 228390