Commit
·
7827ffb
1
Parent(s):
13e9978
Modified validation and training for linktransformer model
Browse files
- .gitattributes +1 -0
- LT_training_config.json +5 -3
- README.md +3 -3
- model.safetensors +1 -1
.gitattributes
CHANGED
@@ -38,3 +38,4 @@ pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
|
|
38 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
39 |
.git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
|
40 |
.git/lfs/objects/3f/07/3f07f428adbf03a3e7902665664f5dd6f342a6b6c7a2a47a7026772c48cb0e73 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
38 |
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
39 |
.git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
|
40 |
.git/lfs/objects/3f/07/3f07f428adbf03a3e7902665664f5dd6f342a6b6c7a2a47a7026772c48cb0e73 filter=lfs diff=lfs merge=lfs -text
|
41 |
+
.git/lfs/objects/3d/42/3d42ebe4f358451d3fde5790fe6516dcd94dc0e5c0159c25ebfe679e11eab41d filter=lfs diff=lfs merge=lfs -text
|
LT_training_config.json
CHANGED
@@ -1,10 +1,10 @@
|
|
1 |
{
|
2 |
"model_save_dir": "models",
|
3 |
"model_save_name": "linkage_un_data_es_fine_industry",
|
4 |
-
"opt_model_description": "This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ). \n This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondance. It was trained for
|
5 |
"opt_model_lang": "es",
|
6 |
"train_batch_size": 64,
|
7 |
-
"num_epochs":
|
8 |
"warm_up_perc": 1,
|
9 |
"learning_rate": 2e-05,
|
10 |
"loss_type": "supcon",
|
@@ -20,8 +20,10 @@
|
|
20 |
"eval_steps_perc": 0.5,
|
21 |
"test_at_end": true,
|
22 |
"save_val_test_pickles": true,
|
23 |
-
"val_query_prop": 0.
|
24 |
"loss_params": {},
|
|
|
|
|
25 |
"eval_type": "retrieval",
|
26 |
"training_dataset": "dataframe",
|
27 |
"base_model_path": "hiiamsid/sentence_similarity_spanish_es",
|
|
|
1 |
{
|
2 |
"model_save_dir": "models",
|
3 |
"model_save_name": "linkage_un_data_es_fine_industry",
|
4 |
+
"opt_model_description": "This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ). \n This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondance. It was trained for 30 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json \n ",
|
5 |
"opt_model_lang": "es",
|
6 |
"train_batch_size": 64,
|
7 |
+
"num_epochs": 30,
|
8 |
"warm_up_perc": 1,
|
9 |
"learning_rate": 2e-05,
|
10 |
"loss_type": "supcon",
|
|
|
20 |
"eval_steps_perc": 0.5,
|
21 |
"test_at_end": true,
|
22 |
"save_val_test_pickles": true,
|
23 |
+
"val_query_prop": 0.2,
|
24 |
"loss_params": {},
|
25 |
+
"lr": 2e-06,
|
26 |
+
"warmup_perc": 0.5,
|
27 |
"eval_type": "retrieval",
|
28 |
"training_dataset": "dataframe",
|
29 |
"base_model_path": "hiiamsid/sentence_similarity_spanish_es",
|
README.md
CHANGED
@@ -23,7 +23,7 @@ This model has been fine-tuned on the model : hiiamsid/sentence_similarity_spani
|
|
23 |
|
24 |
|
25 |
This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ).
|
26 |
-
This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondance. It was trained for
|
27 |
|
28 |
|
29 |
## Usage (LinkTransformer)
|
@@ -109,7 +109,7 @@ The model was trained with the parameters:
|
|
109 |
Parameters of the fit()-Method:
|
110 |
```
|
111 |
{
|
112 |
-
"epochs":
|
113 |
"evaluation_steps": 33,
|
114 |
"evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
|
115 |
"max_grad_norm": 1,
|
@@ -119,7 +119,7 @@ Parameters of the fit()-Method:
|
|
119 |
},
|
120 |
"scheduler": "WarmupLinear",
|
121 |
"steps_per_epoch": null,
|
122 |
-
"warmup_steps":
|
123 |
"weight_decay": 0.01
|
124 |
}
|
125 |
```
|
|
|
23 |
|
24 |
|
25 |
This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ).
|
26 |
+
This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product-level correspondence. It was trained for 30 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json
|
27 |
|
28 |
|
29 |
## Usage (LinkTransformer)
|
|
|
109 |
Parameters of the fit()-Method:
|
110 |
```
|
111 |
{
|
112 |
+
"epochs": 30,
|
113 |
"evaluation_steps": 33,
|
114 |
"evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
|
115 |
"max_grad_norm": 1,
|
|
|
119 |
},
|
120 |
"scheduler": "WarmupLinear",
|
121 |
"steps_per_epoch": null,
|
122 |
+
"warmup_steps": 1950,
|
123 |
"weight_decay": 0.01
|
124 |
}
|
125 |
```
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 439425888
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e8a4b706199c597b03c69c5184163d6bded50042bbb9e85f3928b2f5be3818
|
3 |
size 439425888
|