96abhishekarora
committed on
Commit
•
c262a06
1
Parent(s):
bb9f12f
Updated model with better training and evaluation. Test and val data included as pickle files. Older Legacy files were removed to avoid confusion.
Browse files- .gitattributes +3 -40
- Information-Retrieval_evaluation_eval_results.csv +6 -0
- Information-Retrieval_evaluation_test_results.csv +5 -0
- README.md +1 -1
- config.json +1 -1
- eval/Information-Retrieval_evaluation_eval_results.csv +0 -0
- special_tokens_map.json +5 -35
- pytorch_model.bin → test_data.pickle +2 -2
- val_data.pickle +3 -0
.gitattributes
CHANGED
@@ -1,42 +1,5 @@
|
|
1 |
-
*.7z filter=lfs diff=lfs merge=lfs -text
|
2 |
-
*.arrow filter=lfs diff=lfs merge=lfs -text
|
3 |
-
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
-
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
29 |
-
*.tflite filter=lfs diff=lfs merge=lfs -text
|
30 |
-
*.tgz filter=lfs diff=lfs merge=lfs -text
|
31 |
-
*.wasm filter=lfs diff=lfs merge=lfs -text
|
32 |
-
*.xz filter=lfs diff=lfs merge=lfs -text
|
33 |
-
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
-
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
-
pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
|
37 |
-
.git/lfs/objects/3e/02/3e02186ca2008bfd4ebb104de46ce9beba276ae45c453fedfaeda087cc99f02e filter=lfs diff=lfs merge=lfs -text
|
38 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
|
39 |
.git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
|
40 |
-
.
|
41 |
-
.
|
42 |
-
.git/lfs/objects/82/e8/82e8a4b706199c597b03c69c5184163d6bded50042bbb9e85f3928b2f5be3818 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
2 |
+
.git/lfs/objects/3e/6b/3e6bdbead621753c09514da26bdf850f9758533dfd9d599e6ee947c8daea59e4 filter=lfs diff=lfs merge=lfs -text
|
3 |
.git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
|
4 |
+
test_data.pickle filter=lfs diff=lfs merge=lfs -text
|
5 |
+
val_data.pickle filter=lfs diff=lfs merge=lfs -text
|
|
Information-Retrieval_evaluation_eval_results.csv
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.7225806451612903,0.8580645161290322,0.9096774193548387,0.9419354838709677,0.7225806451612903,0.7161290322580646,0.2860215053763441,0.8516129032258064,0.18193548387096772,0.9032258064516129,0.09419354838709676,0.9354838709677419,0.7968433179723501,0.8271966295960388,0.7941603020635278
|
3 |
+
0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
|
4 |
+
0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
|
5 |
+
0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
|
6 |
+
0,0,0.40836012861736337,0.6334405144694534,0.7218649517684887,0.7958199356913184,0.40836012861736337,0.40836012861736337,0.21114683815648444,0.6334405144694534,0.14437299035369774,0.7218649517684887,0.07958199356913183,0.7958199356913184,0.5376760832950542,0.6002459895262535,0.5464104053868796
|
Information-Retrieval_evaluation_test_results.csv
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
epoch,steps,cos_sim-Accuracy@1,cos_sim-Accuracy@3,cos_sim-Accuracy@5,cos_sim-Accuracy@10,cos_sim-Precision@1,cos_sim-Recall@1,cos_sim-Precision@3,cos_sim-Recall@3,cos_sim-Precision@5,cos_sim-Recall@5,cos_sim-Precision@10,cos_sim-Recall@10,cos_sim-MRR@10,cos_sim-NDCG@10,cos_sim-MAP@100
|
2 |
+
0,0,0.43214556482183475,0.654030831437958,0.7556229466767753,0.8660601465756886,0.43214556482183475,0.3960224195819343,0.22778198972285402,0.6125801773830585,0.16254738438210767,0.7189633801460943,0.0964619661359616,0.8379727908348076,0.5708841273852633,0.6230490170650043,0.5550214647187748
|
3 |
+
0,0,0.7132075471698113,0.9075471698113208,0.9641509433962264,0.9943396226415094,0.7132075471698113,0.7132075471698113,0.30251572327044024,0.9075471698113208,0.19283018867924526,0.9641509433962264,0.09943396226415095,0.9943396226415094,0.8202126385145252,0.863367502871466,0.8205632189982911
|
4 |
+
0,0,0.7056603773584905,0.9037735849056604,0.9547169811320755,0.9943396226415094,0.7056603773584905,0.7056603773584905,0.3012578616352201,0.9037735849056604,0.1909433962264151,0.9547169811320755,0.09943396226415095,0.9943396226415094,0.8155480682839175,0.8597937744367032,0.8159563688254032
|
5 |
+
0,0,0.7188679245283018,0.9150943396226415,0.9641509433962264,0.9943396226415094,0.7188679245283018,0.7188679245283018,0.30503144654088044,0.9150943396226415,0.19283018867924526,0.9641509433962264,0.09943396226415095,0.9943396226415094,0.8241719077568133,0.8663694271169878,0.8245394331184973
|
README.md
CHANGED
@@ -10,7 +10,7 @@ tags:
|
|
10 |
|
11 |
---
|
12 |
|
13 |
-
#
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model - it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
|
|
10 |
|
11 |
---
|
12 |
|
13 |
+
# {MODEL_NAME}
|
14 |
|
15 |
This is a [LinkTransformer](https://linktransformer.github.io/) model. At its core, this model is a [sentence-transformers](https://www.SBERT.net) model - it just wraps around the class.
|
16 |
It is designed for quick and easy record linkage (entity-matching) through the LinkTransformer package. The tasks include clustering, deduplication, linking, aggregation and more.
|
config.json
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
{
|
2 |
-
"_name_or_path": "
|
3 |
"architectures": [
|
4 |
"BertModel"
|
5 |
],
|
|
|
1 |
{
|
2 |
+
"_name_or_path": "hiiamsid/sentence_similarity_spanish_es",
|
3 |
"architectures": [
|
4 |
"BertModel"
|
5 |
],
|
eval/Information-Retrieval_evaluation_eval_results.csv
ADDED
The diff for this file is too large to render.
See raw diff
|
|
special_tokens_map.json
CHANGED
@@ -1,37 +1,7 @@
|
|
1 |
{
|
2 |
-
"cls_token":
|
3 |
-
|
4 |
-
|
5 |
-
|
6 |
-
|
7 |
-
"single_word": false
|
8 |
-
},
|
9 |
-
"mask_token": {
|
10 |
-
"content": "[MASK]",
|
11 |
-
"lstrip": false,
|
12 |
-
"normalized": false,
|
13 |
-
"rstrip": false,
|
14 |
-
"single_word": false
|
15 |
-
},
|
16 |
-
"pad_token": {
|
17 |
-
"content": "[PAD]",
|
18 |
-
"lstrip": false,
|
19 |
-
"normalized": false,
|
20 |
-
"rstrip": false,
|
21 |
-
"single_word": false
|
22 |
-
},
|
23 |
-
"sep_token": {
|
24 |
-
"content": "[SEP]",
|
25 |
-
"lstrip": false,
|
26 |
-
"normalized": false,
|
27 |
-
"rstrip": false,
|
28 |
-
"single_word": false
|
29 |
-
},
|
30 |
-
"unk_token": {
|
31 |
-
"content": "[UNK]",
|
32 |
-
"lstrip": false,
|
33 |
-
"normalized": false,
|
34 |
-
"rstrip": false,
|
35 |
-
"single_word": false
|
36 |
-
}
|
37 |
}
|
|
|
1 |
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7 |
}
|
pytorch_model.bin → test_data.pickle
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:258a6afd4ec0a61ce7ba4d9c64eaacba49cc242d396981ac6224dd00efc5c5e6
|
3 |
+
size 68516
|
val_data.pickle
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e1fb31aaa096101bf8cb0a320022e521d1d021cae177a11ea143ff78ecfaf71
|
3 |
+
size 228390
|