s3766882 committed on
Commit
b09b21e
·
1 Parent(s): 21aaa3a

update models

Browse files
Files changed (4) hide show
  1. config.json +2 -86
  2. model_args.json +1 -1
  3. pytorch_model.bin +2 -2
  4. training_args.bin +1 -1
config.json CHANGED
@@ -94,49 +94,7 @@
94
  "80": "LABEL_80",
95
  "81": "LABEL_81",
96
  "82": "LABEL_82",
97
- "83": "LABEL_83",
98
- "84": "LABEL_84",
99
- "85": "LABEL_85",
100
- "86": "LABEL_86",
101
- "87": "LABEL_87",
102
- "88": "LABEL_88",
103
- "89": "LABEL_89",
104
- "90": "LABEL_90",
105
- "91": "LABEL_91",
106
- "92": "LABEL_92",
107
- "93": "LABEL_93",
108
- "94": "LABEL_94",
109
- "95": "LABEL_95",
110
- "96": "LABEL_96",
111
- "97": "LABEL_97",
112
- "98": "LABEL_98",
113
- "99": "LABEL_99",
114
- "100": "LABEL_100",
115
- "101": "LABEL_101",
116
- "102": "LABEL_102",
117
- "103": "LABEL_103",
118
- "104": "LABEL_104",
119
- "105": "LABEL_105",
120
- "106": "LABEL_106",
121
- "107": "LABEL_107",
122
- "108": "LABEL_108",
123
- "109": "LABEL_109",
124
- "110": "LABEL_110",
125
- "111": "LABEL_111",
126
- "112": "LABEL_112",
127
- "113": "LABEL_113",
128
- "114": "LABEL_114",
129
- "115": "LABEL_115",
130
- "116": "LABEL_116",
131
- "117": "LABEL_117",
132
- "118": "LABEL_118",
133
- "119": "LABEL_119",
134
- "120": "LABEL_120",
135
- "121": "LABEL_121",
136
- "122": "LABEL_122",
137
- "123": "LABEL_123",
138
- "124": "LABEL_124",
139
- "125": "LABEL_125"
140
  },
141
  "initializer_range": 0.02,
142
  "intermediate_size": 3072,
@@ -144,34 +102,8 @@
144
  "LABEL_0": 0,
145
  "LABEL_1": 1,
146
  "LABEL_10": 10,
147
- "LABEL_100": 100,
148
- "LABEL_101": 101,
149
- "LABEL_102": 102,
150
- "LABEL_103": 103,
151
- "LABEL_104": 104,
152
- "LABEL_105": 105,
153
- "LABEL_106": 106,
154
- "LABEL_107": 107,
155
- "LABEL_108": 108,
156
- "LABEL_109": 109,
157
  "LABEL_11": 11,
158
- "LABEL_110": 110,
159
- "LABEL_111": 111,
160
- "LABEL_112": 112,
161
- "LABEL_113": 113,
162
- "LABEL_114": 114,
163
- "LABEL_115": 115,
164
- "LABEL_116": 116,
165
- "LABEL_117": 117,
166
- "LABEL_118": 118,
167
- "LABEL_119": 119,
168
  "LABEL_12": 12,
169
- "LABEL_120": 120,
170
- "LABEL_121": 121,
171
- "LABEL_122": 122,
172
- "LABEL_123": 123,
173
- "LABEL_124": 124,
174
- "LABEL_125": 125,
175
  "LABEL_13": 13,
176
  "LABEL_14": 14,
177
  "LABEL_15": 15,
@@ -250,23 +182,7 @@
250
  "LABEL_81": 81,
251
  "LABEL_82": 82,
252
  "LABEL_83": 83,
253
- "LABEL_84": 84,
254
- "LABEL_85": 85,
255
- "LABEL_86": 86,
256
- "LABEL_87": 87,
257
- "LABEL_88": 88,
258
- "LABEL_89": 89,
259
- "LABEL_9": 9,
260
- "LABEL_90": 90,
261
- "LABEL_91": 91,
262
- "LABEL_92": 92,
263
- "LABEL_93": 93,
264
- "LABEL_94": 94,
265
- "LABEL_95": 95,
266
- "LABEL_96": 96,
267
- "LABEL_97": 97,
268
- "LABEL_98": 98,
269
- "LABEL_99": 99
270
  },
271
  "layer_norm_eps": 1e-05,
272
  "max_position_embeddings": 514,
 
94
  "80": "LABEL_80",
95
  "81": "LABEL_81",
96
  "82": "LABEL_82",
97
+ "83": "LABEL_83"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
  },
99
  "initializer_range": 0.02,
100
  "intermediate_size": 3072,
 
102
  "LABEL_0": 0,
103
  "LABEL_1": 1,
104
  "LABEL_10": 10,
 
 
 
 
 
 
 
 
 
 
105
  "LABEL_11": 11,
 
 
 
 
 
 
 
 
 
 
106
  "LABEL_12": 12,
 
 
 
 
 
 
107
  "LABEL_13": 13,
108
  "LABEL_14": 14,
109
  "LABEL_15": 15,
 
182
  "LABEL_81": 81,
183
  "LABEL_82": 82,
184
  "LABEL_83": 83,
185
+ "LABEL_9": 9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
186
  },
187
  "layer_norm_eps": 1e-05,
188
  "max_position_embeddings": 514,
model_args.json CHANGED
@@ -1 +1 @@
1
- {"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16": false, "gradient_accumulation_steps": 1, "learning_rate": 4e-05, "local_rank": -1, "logging_steps": 50, "loss_type": null, "loss_args": {}, "manual_seed": null, "max_grad_norm": 1.0, "max_seq_length": 128, "model_name": "roberta-base", "model_type": "roberta", "multiprocessing_chunksize": -1, "n_gpu": 1, "no_cache": false, "no_save": false, "not_saved_args": [], "num_train_epochs": 5, "optimizer": "AdamW", "output_dir": "outputs/", "overwrite_output_dir": true, "polynomial_decay_schedule_lr_end": 1e-07, "polynomial_decay_schedule_power": 1.0, "process_count": 1, "quantized_model": false, "reprocess_input_data": true, "save_best_model": true, "save_eval_checkpoints": true, "save_model_every_epoch": true, "save_optimizer_and_scheduler": true, "save_steps": 2000, "scheduler": "linear_schedule_with_warmup", "silent": false, "skip_special_tokens": true, "tensorboard_dir": null, "thread_count": null, "tokenizer_name": null, "tokenizer_type": null, "train_batch_size": 8, "train_custom_parameters_only": false, "use_cached_eval_features": false, "use_early_stopping": false, 
"use_hf_datasets": false, "use_multiprocessing": true, "use_multiprocessing_for_evaluation": true, "wandb_kwargs": {}, "wandb_project": null, "warmup_ratio": 0.06, "warmup_steps": 4, "weight_decay": 0.0, "model_class": "MultiLabelClassificationModel", "sliding_window": false, "stride": 0.8, "threshold": 0.5, "tie_value": 1, "labels_list": [], "labels_map": {}, "lazy_loading": false, "special_tokens_list": []}
 
1
+ {"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16": true, "gradient_accumulation_steps": 1, "learning_rate": 1e-05, "local_rank": -1, "logging_steps": 50, "loss_type": null, "loss_args": {}, "manual_seed": null, "max_grad_norm": 1.0, "max_seq_length": 128, "model_name": "roberta-base", "model_type": "roberta", "multiprocessing_chunksize": -1, "n_gpu": 1, "no_cache": false, "no_save": false, "not_saved_args": [], "num_train_epochs": 6, "optimizer": "AdamW", "output_dir": "outputs/", "overwrite_output_dir": true, "polynomial_decay_schedule_lr_end": 1e-07, "polynomial_decay_schedule_power": 1.0, "process_count": 1, "quantized_model": false, "reprocess_input_data": true, "save_best_model": true, "save_eval_checkpoints": true, "save_model_every_epoch": false, "save_optimizer_and_scheduler": true, "save_steps": 2000, "scheduler": "linear_schedule_with_warmup", "silent": false, "skip_special_tokens": true, "tensorboard_dir": null, "thread_count": null, "tokenizer_name": null, "tokenizer_type": null, "train_batch_size": 8, "train_custom_parameters_only": false, "use_cached_eval_features": false, "use_early_stopping": false, 
"use_hf_datasets": false, "use_multiprocessing": true, "use_multiprocessing_for_evaluation": true, "wandb_kwargs": {}, "wandb_project": null, "warmup_ratio": 0.06, "warmup_steps": 3, "weight_decay": 0.0, "model_class": "MultiLabelClassificationModel", "sliding_window": false, "stride": 0.8, "threshold": 0.5, "tie_value": 1, "labels_list": [], "labels_map": {}, "lazy_loading": false, "special_tokens_list": []}
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:960f1151ad13b50357396d7ae2a5726bb8befbac3c0c5b0e076a24e70530f360
3
- size 501418601
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7359a64f7ac60b11e4347b3abdd42df81ae484eafb169932fb8d8078dcceebe
3
+ size 501289449
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e3b3a2da7d9bd8647168d70d64cc07829d39d3f896e827082dfd311213eeebf
3
  size 2991
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ce85e0f40402828049238da313ad4b732e6efa682dca78dfe6fed583681441e
3
  size 2991