96abhishekarora committed on
Commit
7827ffb
·
1 Parent(s): 13e9978

Modified validation and training for linktransformer model

Browse files
Files changed (4) hide show
  1. .gitattributes +1 -0
  2. LT_training_config.json +5 -3
  3. README.md +3 -3
  4. model.safetensors +1 -1
.gitattributes CHANGED
@@ -38,3 +38,4 @@ pytorch_model.bin filter=lfs diff=lfs merge=lfs -text
38
  model.safetensors filter=lfs diff=lfs merge=lfs -text
39
  .git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
40
  .git/lfs/objects/3f/07/3f07f428adbf03a3e7902665664f5dd6f342a6b6c7a2a47a7026772c48cb0e73 filter=lfs diff=lfs merge=lfs -text
 
 
38
  model.safetensors filter=lfs diff=lfs merge=lfs -text
39
  .git/lfs/objects/21/3e/213e31b950d84bee8f77e75c3cd557932d9bc7dc76dcd03aba223c2e4f841a0f filter=lfs diff=lfs merge=lfs -text
40
  .git/lfs/objects/3f/07/3f07f428adbf03a3e7902665664f5dd6f342a6b6c7a2a47a7026772c48cb0e73 filter=lfs diff=lfs merge=lfs -text
41
+ .git/lfs/objects/3d/42/3d42ebe4f358451d3fde5790fe6516dcd94dc0e5c0159c25ebfe679e11eab41d filter=lfs diff=lfs merge=lfs -text
LT_training_config.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
  "model_save_dir": "models",
3
  "model_save_name": "linkage_un_data_es_fine_industry",
4
- "opt_model_description": "This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ). \n This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondance. It was trained for 70 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json \n ",
5
  "opt_model_lang": "es",
6
  "train_batch_size": 64,
7
- "num_epochs": 70,
8
  "warm_up_perc": 1,
9
  "learning_rate": 2e-05,
10
  "loss_type": "supcon",
@@ -20,8 +20,10 @@
20
  "eval_steps_perc": 0.5,
21
  "test_at_end": true,
22
  "save_val_test_pickles": true,
23
- "val_query_prop": 0.5,
24
  "loss_params": {},
 
 
25
  "eval_type": "retrieval",
26
  "training_dataset": "dataframe",
27
  "base_model_path": "hiiamsid/sentence_similarity_spanish_es",
 
1
  {
2
  "model_save_dir": "models",
3
  "model_save_name": "linkage_un_data_es_fine_industry",
4
+ "opt_model_description": "This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ). \n This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondence. It was trained for 30 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json \n ",
5
  "opt_model_lang": "es",
6
  "train_batch_size": 64,
7
+ "num_epochs": 30,
8
  "warm_up_perc": 1,
9
  "learning_rate": 2e-05,
10
  "loss_type": "supcon",
 
20
  "eval_steps_perc": 0.5,
21
  "test_at_end": true,
22
  "save_val_test_pickles": true,
23
+ "val_query_prop": 0.2,
24
  "loss_params": {},
25
+ "lr": 2e-06,
26
+ "warmup_perc": 0.5,
27
  "eval_type": "retrieval",
28
  "training_dataset": "dataframe",
29
  "base_model_path": "hiiamsid/sentence_similarity_spanish_es",
README.md CHANGED
@@ -23,7 +23,7 @@ This model has been fine-tuned on the model : hiiamsid/sentence_similarity_spani
23
 
24
 
25
  This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ).
26
- This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondance. It was trained for 70 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json
27
 
28
 
29
  ## Usage (LinkTransformer)
@@ -109,7 +109,7 @@ The model was trained with the parameters:
109
  Parameters of the fit()-Method:
110
  ```
111
  {
112
- "epochs": 70,
113
  "evaluation_steps": 33,
114
  "evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
115
  "max_grad_norm": 1,
@@ -119,7 +119,7 @@ Parameters of the fit()-Method:
119
  },
120
  "scheduler": "WarmupLinear",
121
  "steps_per_epoch": null,
122
- "warmup_steps": 4550,
123
  "weight_decay": 0.01
124
  }
125
  ```
 
23
 
24
 
25
  This model was trained on a dataset prepared by linking product classifications from [UN stats](https://unstats.un.org/unsd/classifications/Econ).
26
+ This model is designed to link different products to their industrial classification (ISIC) - trained on variation brought on by product level correspondence. It was trained for 30 epochs using other defaults that can be found in the repo's LinkTransformer config file - LT_training_config.json
27
 
28
 
29
  ## Usage (LinkTransformer)
 
109
  Parameters of the fit()-Method:
110
  ```
111
  {
112
+ "epochs": 30,
113
  "evaluation_steps": 33,
114
  "evaluator": "sentence_transformers.evaluation.SequentialEvaluator.SequentialEvaluator",
115
  "max_grad_norm": 1,
 
119
  },
120
  "scheduler": "WarmupLinear",
121
  "steps_per_epoch": null,
122
+ "warmup_steps": 1950,
123
  "weight_decay": 0.01
124
  }
125
  ```
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d42ebe4f358451d3fde5790fe6516dcd94dc0e5c0159c25ebfe679e11eab41d
3
  size 439425888
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e8a4b706199c597b03c69c5184163d6bded50042bbb9e85f3928b2f5be3818
3
  size 439425888