s3766882
committed on
Commit
·
b09b21e
1
Parent(s):
21aaa3a
update models
Browse files- config.json +2 -86
- model_args.json +1 -1
- pytorch_model.bin +2 -2
- training_args.bin +1 -1
config.json
CHANGED
@@ -94,49 +94,7 @@
|
|
94 |
"80": "LABEL_80",
|
95 |
"81": "LABEL_81",
|
96 |
"82": "LABEL_82",
|
97 |
-
"83": "LABEL_83",
|
98 |
-
"84": "LABEL_84",
|
99 |
-
"85": "LABEL_85",
|
100 |
-
"86": "LABEL_86",
|
101 |
-
"87": "LABEL_87",
|
102 |
-
"88": "LABEL_88",
|
103 |
-
"89": "LABEL_89",
|
104 |
-
"90": "LABEL_90",
|
105 |
-
"91": "LABEL_91",
|
106 |
-
"92": "LABEL_92",
|
107 |
-
"93": "LABEL_93",
|
108 |
-
"94": "LABEL_94",
|
109 |
-
"95": "LABEL_95",
|
110 |
-
"96": "LABEL_96",
|
111 |
-
"97": "LABEL_97",
|
112 |
-
"98": "LABEL_98",
|
113 |
-
"99": "LABEL_99",
|
114 |
-
"100": "LABEL_100",
|
115 |
-
"101": "LABEL_101",
|
116 |
-
"102": "LABEL_102",
|
117 |
-
"103": "LABEL_103",
|
118 |
-
"104": "LABEL_104",
|
119 |
-
"105": "LABEL_105",
|
120 |
-
"106": "LABEL_106",
|
121 |
-
"107": "LABEL_107",
|
122 |
-
"108": "LABEL_108",
|
123 |
-
"109": "LABEL_109",
|
124 |
-
"110": "LABEL_110",
|
125 |
-
"111": "LABEL_111",
|
126 |
-
"112": "LABEL_112",
|
127 |
-
"113": "LABEL_113",
|
128 |
-
"114": "LABEL_114",
|
129 |
-
"115": "LABEL_115",
|
130 |
-
"116": "LABEL_116",
|
131 |
-
"117": "LABEL_117",
|
132 |
-
"118": "LABEL_118",
|
133 |
-
"119": "LABEL_119",
|
134 |
-
"120": "LABEL_120",
|
135 |
-
"121": "LABEL_121",
|
136 |
-
"122": "LABEL_122",
|
137 |
-
"123": "LABEL_123",
|
138 |
-
"124": "LABEL_124",
|
139 |
-
"125": "LABEL_125"
|
140 |
},
|
141 |
"initializer_range": 0.02,
|
142 |
"intermediate_size": 3072,
|
@@ -144,34 +102,8 @@
|
|
144 |
"LABEL_0": 0,
|
145 |
"LABEL_1": 1,
|
146 |
"LABEL_10": 10,
|
147 |
-
"LABEL_100": 100,
|
148 |
-
"LABEL_101": 101,
|
149 |
-
"LABEL_102": 102,
|
150 |
-
"LABEL_103": 103,
|
151 |
-
"LABEL_104": 104,
|
152 |
-
"LABEL_105": 105,
|
153 |
-
"LABEL_106": 106,
|
154 |
-
"LABEL_107": 107,
|
155 |
-
"LABEL_108": 108,
|
156 |
-
"LABEL_109": 109,
|
157 |
"LABEL_11": 11,
|
158 |
-
"LABEL_110": 110,
|
159 |
-
"LABEL_111": 111,
|
160 |
-
"LABEL_112": 112,
|
161 |
-
"LABEL_113": 113,
|
162 |
-
"LABEL_114": 114,
|
163 |
-
"LABEL_115": 115,
|
164 |
-
"LABEL_116": 116,
|
165 |
-
"LABEL_117": 117,
|
166 |
-
"LABEL_118": 118,
|
167 |
-
"LABEL_119": 119,
|
168 |
"LABEL_12": 12,
|
169 |
-
"LABEL_120": 120,
|
170 |
-
"LABEL_121": 121,
|
171 |
-
"LABEL_122": 122,
|
172 |
-
"LABEL_123": 123,
|
173 |
-
"LABEL_124": 124,
|
174 |
-
"LABEL_125": 125,
|
175 |
"LABEL_13": 13,
|
176 |
"LABEL_14": 14,
|
177 |
"LABEL_15": 15,
|
@@ -250,23 +182,7 @@
|
|
250 |
"LABEL_81": 81,
|
251 |
"LABEL_82": 82,
|
252 |
"LABEL_83": 83,
|
253 |
-
"LABEL_84": 84,
|
254 |
-
"LABEL_85": 85,
|
255 |
-
"LABEL_86": 86,
|
256 |
-
"LABEL_87": 87,
|
257 |
-
"LABEL_88": 88,
|
258 |
-
"LABEL_89": 89,
|
259 |
-
"LABEL_9": 9,
|
260 |
-
"LABEL_90": 90,
|
261 |
-
"LABEL_91": 91,
|
262 |
-
"LABEL_92": 92,
|
263 |
-
"LABEL_93": 93,
|
264 |
-
"LABEL_94": 94,
|
265 |
-
"LABEL_95": 95,
|
266 |
-
"LABEL_96": 96,
|
267 |
-
"LABEL_97": 97,
|
268 |
-
"LABEL_98": 98,
|
269 |
-
"LABEL_99": 99
|
270 |
},
|
271 |
"layer_norm_eps": 1e-05,
|
272 |
"max_position_embeddings": 514,
|
|
|
94 |
"80": "LABEL_80",
|
95 |
"81": "LABEL_81",
|
96 |
"82": "LABEL_82",
|
97 |
+
"83": "LABEL_83"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
98 |
},
|
99 |
"initializer_range": 0.02,
|
100 |
"intermediate_size": 3072,
|
|
|
102 |
"LABEL_0": 0,
|
103 |
"LABEL_1": 1,
|
104 |
"LABEL_10": 10,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
105 |
"LABEL_11": 11,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
106 |
"LABEL_12": 12,
|
|
|
|
|
|
|
|
|
|
|
|
|
107 |
"LABEL_13": 13,
|
108 |
"LABEL_14": 14,
|
109 |
"LABEL_15": 15,
|
|
|
182 |
"LABEL_81": 81,
|
183 |
"LABEL_82": 82,
|
184 |
"LABEL_83": 83,
|
185 |
+
"LABEL_9": 9
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
186 |
},
|
187 |
"layer_norm_eps": 1e-05,
|
188 |
"max_position_embeddings": 514,
|
model_args.json
CHANGED
@@ -1 +1 @@
|
|
1 |
-
{"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16":
|
|
|
1 |
+
{"adafactor_beta1": null, "adafactor_clip_threshold": 1.0, "adafactor_decay_rate": -0.8, "adafactor_eps": [1e-30, 0.001], "adafactor_relative_step": true, "adafactor_scale_parameter": true, "adafactor_warmup_init": true, "adam_epsilon": 1e-08, "best_model_dir": "outputs/best_model", "cache_dir": "cache_dir/", "config": {}, "cosine_schedule_num_cycles": 0.5, "custom_layer_parameters": [], "custom_parameter_groups": [], "dataloader_num_workers": 0, "do_lower_case": false, "dynamic_quantize": false, "early_stopping_consider_epochs": false, "early_stopping_delta": 0, "early_stopping_metric": "eval_loss", "early_stopping_metric_minimize": true, "early_stopping_patience": 3, "encoding": null, "eval_batch_size": 8, "evaluate_during_training": false, "evaluate_during_training_silent": true, "evaluate_during_training_steps": 2000, "evaluate_during_training_verbose": false, "evaluate_each_epoch": true, "fp16": true, "gradient_accumulation_steps": 1, "learning_rate": 1e-05, "local_rank": -1, "logging_steps": 50, "loss_type": null, "loss_args": {}, "manual_seed": null, "max_grad_norm": 1.0, "max_seq_length": 128, "model_name": "roberta-base", "model_type": "roberta", "multiprocessing_chunksize": -1, "n_gpu": 1, "no_cache": false, "no_save": false, "not_saved_args": [], "num_train_epochs": 6, "optimizer": "AdamW", "output_dir": "outputs/", "overwrite_output_dir": true, "polynomial_decay_schedule_lr_end": 1e-07, "polynomial_decay_schedule_power": 1.0, "process_count": 1, "quantized_model": false, "reprocess_input_data": true, "save_best_model": true, "save_eval_checkpoints": true, "save_model_every_epoch": false, "save_optimizer_and_scheduler": true, "save_steps": 2000, "scheduler": "linear_schedule_with_warmup", "silent": false, "skip_special_tokens": true, "tensorboard_dir": null, "thread_count": null, "tokenizer_name": null, "tokenizer_type": null, "train_batch_size": 8, "train_custom_parameters_only": false, "use_cached_eval_features": false, "use_early_stopping": false, 
"use_hf_datasets": false, "use_multiprocessing": true, "use_multiprocessing_for_evaluation": true, "wandb_kwargs": {}, "wandb_project": null, "warmup_ratio": 0.06, "warmup_steps": 3, "weight_decay": 0.0, "model_class": "MultiLabelClassificationModel", "sliding_window": false, "stride": 0.8, "threshold": 0.5, "tie_value": 1, "labels_list": [], "labels_map": {}, "lazy_loading": false, "special_tokens_list": []}
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7359a64f7ac60b11e4347b3abdd42df81ae484eafb169932fb8d8078dcceebe
|
3 |
+
size 501289449
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2991
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ce85e0f40402828049238da313ad4b732e6efa682dca78dfe6fed583681441e
|
3 |
size 2991
|