Ubuntu committed on
Commit
2e0c701
1 Parent(s): 7bd8341

added finetuned categorical classification model + more evaluated dataset modifications

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. data_categories/Computers_and_Electronics.csv +2 -2
  2. data_categories/Final_Category_Data_With_Labels.csv +2 -2
  3. data_categories/Food_and_Drink.csv +2 -2
  4. data_categories/Online Communities.csv +2 -2
  5. finetuned_entity_categorical_classification/checkpoint-11032/added_tokens.json +7 -0
  6. finetuned_entity_categorical_classification/checkpoint-11032/config.json +83 -0
  7. finetuned_entity_categorical_classification/checkpoint-11032/optimizer.pt +3 -0
  8. finetuned_entity_categorical_classification/checkpoint-11032/pytorch_model.bin +3 -0
  9. finetuned_entity_categorical_classification/checkpoint-11032/rng_state.pth +0 -0
  10. finetuned_entity_categorical_classification/checkpoint-11032/scheduler.pt +3 -0
  11. finetuned_entity_categorical_classification/checkpoint-11032/special_tokens_map.json +7 -0
  12. finetuned_entity_categorical_classification/checkpoint-11032/tokenizer.json +0 -0
  13. finetuned_entity_categorical_classification/checkpoint-11032/tokenizer_config.json +56 -0
  14. finetuned_entity_categorical_classification/checkpoint-11032/trainer_state.json +214 -0
  15. finetuned_entity_categorical_classification/checkpoint-11032/training_args.bin +3 -0
  16. finetuned_entity_categorical_classification/checkpoint-11032/vocab.txt +0 -0
  17. finetuned_entity_categorical_classification/checkpoint-12608/added_tokens.json +7 -0
  18. finetuned_entity_categorical_classification/checkpoint-12608/config.json +83 -0
  19. finetuned_entity_categorical_classification/checkpoint-12608/optimizer.pt +3 -0
  20. finetuned_entity_categorical_classification/checkpoint-12608/pytorch_model.bin +3 -0
  21. finetuned_entity_categorical_classification/checkpoint-12608/rng_state.pth +0 -0
  22. finetuned_entity_categorical_classification/checkpoint-12608/scheduler.pt +3 -0
  23. finetuned_entity_categorical_classification/checkpoint-12608/special_tokens_map.json +7 -0
  24. finetuned_entity_categorical_classification/checkpoint-12608/tokenizer.json +0 -0
  25. finetuned_entity_categorical_classification/checkpoint-12608/tokenizer_config.json +56 -0
  26. finetuned_entity_categorical_classification/checkpoint-12608/trainer_state.json +241 -0
  27. finetuned_entity_categorical_classification/checkpoint-12608/training_args.bin +3 -0
  28. finetuned_entity_categorical_classification/checkpoint-12608/vocab.txt +0 -0
  29. finetuned_entity_categorical_classification/checkpoint-14184/added_tokens.json +7 -0
  30. finetuned_entity_categorical_classification/checkpoint-14184/config.json +83 -0
  31. finetuned_entity_categorical_classification/checkpoint-14184/optimizer.pt +3 -0
  32. finetuned_entity_categorical_classification/checkpoint-14184/pytorch_model.bin +3 -0
  33. finetuned_entity_categorical_classification/checkpoint-14184/rng_state.pth +0 -0
  34. finetuned_entity_categorical_classification/checkpoint-14184/scheduler.pt +3 -0
  35. finetuned_entity_categorical_classification/checkpoint-14184/special_tokens_map.json +7 -0
  36. finetuned_entity_categorical_classification/checkpoint-14184/tokenizer.json +0 -0
  37. finetuned_entity_categorical_classification/checkpoint-14184/tokenizer_config.json +56 -0
  38. finetuned_entity_categorical_classification/checkpoint-14184/trainer_state.json +268 -0
  39. finetuned_entity_categorical_classification/checkpoint-14184/training_args.bin +3 -0
  40. finetuned_entity_categorical_classification/checkpoint-14184/vocab.txt +0 -0
  41. finetuned_entity_categorical_classification/checkpoint-1576/added_tokens.json +7 -0
  42. finetuned_entity_categorical_classification/checkpoint-1576/config.json +83 -0
  43. finetuned_entity_categorical_classification/checkpoint-1576/optimizer.pt +3 -0
  44. finetuned_entity_categorical_classification/checkpoint-1576/pytorch_model.bin +3 -0
  45. finetuned_entity_categorical_classification/checkpoint-1576/rng_state.pth +0 -0
  46. finetuned_entity_categorical_classification/checkpoint-1576/scheduler.pt +3 -0
  47. finetuned_entity_categorical_classification/checkpoint-1576/special_tokens_map.json +7 -0
  48. finetuned_entity_categorical_classification/checkpoint-1576/tokenizer.json +0 -0
  49. finetuned_entity_categorical_classification/checkpoint-1576/tokenizer_config.json +56 -0
  50. finetuned_entity_categorical_classification/checkpoint-1576/trainer_state.json +46 -0
data_categories/Computers_and_Electronics.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23ba5a3666e7d67ef57a7fcf301685ae7b66ffc1ed4f33ee6d7b01d11af136ed
3
- size 27167
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:951be0765dfdba915851bf70958f057fa8e57ee652368599652c09134597cdb5
3
+ size 32224
data_categories/Final_Category_Data_With_Labels.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8c2ba96d90a437a017a25af64364a58c7e2954ca1519a5fce27d0e55addae8da
3
- size 1810529
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cc9c2f33eb98166acba40de7c124801b57c19ececb8d24900980fb9d5cbabe6
3
+ size 1671966
data_categories/Food_and_Drink.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:317f8d87736b3523b83ec3fe0c8bcd2d36df06fce8076a4a414125bfc1ca249b
3
- size 42073
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f25d7848aac215feb6ac57d256005b70d1e39eb0f46bd8cbdc60b94469c3a368
3
+ size 46822
data_categories/Online Communities.csv CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:903899c0689fab2c6648a715e5e488429b847054af33c1d26b252eb36352cf29
3
- size 46352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ae0ed633eae668652cee2a7aab4e48a873a1815edb094521257af71360d5d3
3
+ size 55212
finetuned_entity_categorical_classification/checkpoint-11032/added_tokens.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "[CLS]": 101,
3
+ "[MASK]": 103,
4
+ "[PAD]": 0,
5
+ "[SEP]": 102,
6
+ "[UNK]": 100
7
+ }
finetuned_entity_categorical_classification/checkpoint-11032/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "Beauty_and_Fitness",
13
+ "1": "People_and_Society",
14
+ "2": "Travel_and_Transportation",
15
+ "3": "Shopping",
16
+ "4": "Adult",
17
+ "5": "Sports",
18
+ "6": "Science",
19
+ "7": "Food_and_Drink",
20
+ "8": "News",
21
+ "9": "Sensitive Subjects",
22
+ "10": "Autos_and_Vehicles",
23
+ "11": "Law_and_Government",
24
+ "12": "Business_and_Industrial",
25
+ "13": "Health",
26
+ "14": "Real Estate",
27
+ "15": "Books_and_Literature",
28
+ "16": "Computers_and_Electronics",
29
+ "17": "Internet_and_Telecom",
30
+ "18": "Home_and_Garden",
31
+ "19": "Jobs_and_Education",
32
+ "20": "Online Communities",
33
+ "21": "Finance",
34
+ "22": "Arts_and_Entertainment",
35
+ "23": "Games",
36
+ "24": "Hobbies_and_Leisure",
37
+ "25": "Reference",
38
+ "26": "Pets_and_Animals"
39
+ },
40
+ "initializer_range": 0.02,
41
+ "label2id": {
42
+ "Adult": 4,
43
+ "Arts_and_Entertainment": 22,
44
+ "Autos_and_Vehicles": 10,
45
+ "Beauty_and_Fitness": 0,
46
+ "Books_and_Literature": 15,
47
+ "Business_and_Industrial": 12,
48
+ "Computers_and_Electronics": 16,
49
+ "Finance": 21,
50
+ "Food_and_Drink": 7,
51
+ "Games": 23,
52
+ "Health": 13,
53
+ "Hobbies_and_Leisure": 24,
54
+ "Home_and_Garden": 18,
55
+ "Internet_and_Telecom": 17,
56
+ "Jobs_and_Education": 19,
57
+ "Law_and_Government": 11,
58
+ "News": 8,
59
+ "Online Communities": 20,
60
+ "People_and_Society": 1,
61
+ "Pets_and_Animals": 26,
62
+ "Real Estate": 14,
63
+ "Reference": 25,
64
+ "Science": 6,
65
+ "Sensitive Subjects": 9,
66
+ "Shopping": 3,
67
+ "Sports": 5,
68
+ "Travel_and_Transportation": 2
69
+ },
70
+ "max_position_embeddings": 512,
71
+ "model_type": "distilbert",
72
+ "n_heads": 12,
73
+ "n_layers": 6,
74
+ "pad_token_id": 0,
75
+ "problem_type": "single_label_classification",
76
+ "qa_dropout": 0.1,
77
+ "seq_classif_dropout": 0.2,
78
+ "sinusoidal_pos_embds": false,
79
+ "tie_weights_": true,
80
+ "torch_dtype": "float32",
81
+ "transformers_version": "4.34.0",
82
+ "vocab_size": 30522
83
+ }
finetuned_entity_categorical_classification/checkpoint-11032/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f7ab679648567dedd5ee16883a5b327f5addcd457801f36d1cf2fde78ddd114
3
+ size 535881018
finetuned_entity_categorical_classification/checkpoint-11032/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eaedbcf0c17b7424c96b7c789c62d9d7a5b1e7ec2f611accbc326a6346dfc71b
3
+ size 267932842
finetuned_entity_categorical_classification/checkpoint-11032/rng_state.pth ADDED
Binary file (14.2 kB). View file
 
finetuned_entity_categorical_classification/checkpoint-11032/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d5094212461ae02915e8b4efcecec1cdff5f9e5d485a0996bdaf106d8d66aa6
3
+ size 1064
finetuned_entity_categorical_classification/checkpoint-11032/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
finetuned_entity_categorical_classification/checkpoint-11032/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-11032/tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "additional_special_tokens": [],
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "strip_accents": null,
53
+ "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "DistilBertTokenizer",
55
+ "unk_token": "[UNK]"
56
+ }
finetuned_entity_categorical_classification/checkpoint-11032/trainer_state.json ADDED
@@ -0,0 +1,214 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.21237443387508392,
3
+ "best_model_checkpoint": "finetuned_entity_categorical_classification/checkpoint-4728",
4
+ "epoch": 7.0,
5
+ "eval_steps": 500,
6
+ "global_step": 11032,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.32,
13
+ "learning_rate": 1.957698815566836e-05,
14
+ "loss": 1.5567,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.63,
19
+ "learning_rate": 1.915397631133672e-05,
20
+ "loss": 0.3944,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.95,
25
+ "learning_rate": 1.873096446700508e-05,
26
+ "loss": 0.2773,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "eval_accuracy": 0.9374900840869427,
32
+ "eval_loss": 0.2187376469373703,
33
+ "eval_runtime": 2.2114,
34
+ "eval_samples_per_second": 2850.256,
35
+ "eval_steps_per_second": 178.169,
36
+ "step": 1576
37
+ },
38
+ {
39
+ "epoch": 1.27,
40
+ "learning_rate": 1.830795262267344e-05,
41
+ "loss": 0.1997,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.59,
46
+ "learning_rate": 1.7884940778341796e-05,
47
+ "loss": 0.202,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 1.9,
52
+ "learning_rate": 1.7461928934010152e-05,
53
+ "loss": 0.1797,
54
+ "step": 3000
55
+ },
56
+ {
57
+ "epoch": 2.0,
58
+ "eval_accuracy": 0.9452641599238458,
59
+ "eval_loss": 0.22844311594963074,
60
+ "eval_runtime": 2.2403,
61
+ "eval_samples_per_second": 2813.437,
62
+ "eval_steps_per_second": 175.868,
63
+ "step": 3152
64
+ },
65
+ {
66
+ "epoch": 2.22,
67
+ "learning_rate": 1.7038917089678512e-05,
68
+ "loss": 0.148,
69
+ "step": 3500
70
+ },
71
+ {
72
+ "epoch": 2.54,
73
+ "learning_rate": 1.661590524534687e-05,
74
+ "loss": 0.1357,
75
+ "step": 4000
76
+ },
77
+ {
78
+ "epoch": 2.86,
79
+ "learning_rate": 1.619289340101523e-05,
80
+ "loss": 0.1525,
81
+ "step": 4500
82
+ },
83
+ {
84
+ "epoch": 3.0,
85
+ "eval_accuracy": 0.9481199428843408,
86
+ "eval_loss": 0.21237443387508392,
87
+ "eval_runtime": 2.2281,
88
+ "eval_samples_per_second": 2828.834,
89
+ "eval_steps_per_second": 176.83,
90
+ "step": 4728
91
+ },
92
+ {
93
+ "epoch": 3.17,
94
+ "learning_rate": 1.576988155668359e-05,
95
+ "loss": 0.1218,
96
+ "step": 5000
97
+ },
98
+ {
99
+ "epoch": 3.49,
100
+ "learning_rate": 1.5346869712351946e-05,
101
+ "loss": 0.1147,
102
+ "step": 5500
103
+ },
104
+ {
105
+ "epoch": 3.81,
106
+ "learning_rate": 1.4923857868020306e-05,
107
+ "loss": 0.1195,
108
+ "step": 6000
109
+ },
110
+ {
111
+ "epoch": 4.0,
112
+ "eval_accuracy": 0.94859590671109,
113
+ "eval_loss": 0.2216227501630783,
114
+ "eval_runtime": 2.2255,
115
+ "eval_samples_per_second": 2832.161,
116
+ "eval_steps_per_second": 177.038,
117
+ "step": 6304
118
+ },
119
+ {
120
+ "epoch": 4.12,
121
+ "learning_rate": 1.4500846023688663e-05,
122
+ "loss": 0.114,
123
+ "step": 6500
124
+ },
125
+ {
126
+ "epoch": 4.44,
127
+ "learning_rate": 1.4077834179357023e-05,
128
+ "loss": 0.104,
129
+ "step": 7000
130
+ },
131
+ {
132
+ "epoch": 4.76,
133
+ "learning_rate": 1.3654822335025382e-05,
134
+ "loss": 0.0936,
135
+ "step": 7500
136
+ },
137
+ {
138
+ "epoch": 5.0,
139
+ "eval_accuracy": 0.9462160875773441,
140
+ "eval_loss": 0.24313929677009583,
141
+ "eval_runtime": 2.1752,
142
+ "eval_samples_per_second": 2897.6,
143
+ "eval_steps_per_second": 181.129,
144
+ "step": 7880
145
+ },
146
+ {
147
+ "epoch": 5.08,
148
+ "learning_rate": 1.323181049069374e-05,
149
+ "loss": 0.099,
150
+ "step": 8000
151
+ },
152
+ {
153
+ "epoch": 5.39,
154
+ "learning_rate": 1.28087986463621e-05,
155
+ "loss": 0.0929,
156
+ "step": 8500
157
+ },
158
+ {
159
+ "epoch": 5.71,
160
+ "learning_rate": 1.2385786802030457e-05,
161
+ "loss": 0.0872,
162
+ "step": 9000
163
+ },
164
+ {
165
+ "epoch": 6.0,
166
+ "eval_accuracy": 0.9465333967951769,
167
+ "eval_loss": 0.25265371799468994,
168
+ "eval_runtime": 2.2222,
169
+ "eval_samples_per_second": 2836.351,
170
+ "eval_steps_per_second": 177.3,
171
+ "step": 9456
172
+ },
173
+ {
174
+ "epoch": 6.03,
175
+ "learning_rate": 1.1962774957698817e-05,
176
+ "loss": 0.0963,
177
+ "step": 9500
178
+ },
179
+ {
180
+ "epoch": 6.35,
181
+ "learning_rate": 1.1539763113367176e-05,
182
+ "loss": 0.0733,
183
+ "step": 10000
184
+ },
185
+ {
186
+ "epoch": 6.66,
187
+ "learning_rate": 1.1116751269035532e-05,
188
+ "loss": 0.0812,
189
+ "step": 10500
190
+ },
191
+ {
192
+ "epoch": 6.98,
193
+ "learning_rate": 1.0693739424703892e-05,
194
+ "loss": 0.0929,
195
+ "step": 11000
196
+ },
197
+ {
198
+ "epoch": 7.0,
199
+ "eval_accuracy": 0.9490718705378391,
200
+ "eval_loss": 0.23417465388774872,
201
+ "eval_runtime": 2.1699,
202
+ "eval_samples_per_second": 2904.721,
203
+ "eval_steps_per_second": 181.574,
204
+ "step": 11032
205
+ }
206
+ ],
207
+ "logging_steps": 500,
208
+ "max_steps": 23640,
209
+ "num_train_epochs": 15,
210
+ "save_steps": 500,
211
+ "total_flos": 703983650219928.0,
212
+ "trial_name": null,
213
+ "trial_params": null
214
+ }
finetuned_entity_categorical_classification/checkpoint-11032/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665da3b0732e752c339d7e2fda57582d0f87bae18392c4edd4fe1327453b2e44
3
+ size 4600
finetuned_entity_categorical_classification/checkpoint-11032/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-12608/added_tokens.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "[CLS]": 101,
3
+ "[MASK]": 103,
4
+ "[PAD]": 0,
5
+ "[SEP]": 102,
6
+ "[UNK]": 100
7
+ }
finetuned_entity_categorical_classification/checkpoint-12608/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "Beauty_and_Fitness",
13
+ "1": "People_and_Society",
14
+ "2": "Travel_and_Transportation",
15
+ "3": "Shopping",
16
+ "4": "Adult",
17
+ "5": "Sports",
18
+ "6": "Science",
19
+ "7": "Food_and_Drink",
20
+ "8": "News",
21
+ "9": "Sensitive Subjects",
22
+ "10": "Autos_and_Vehicles",
23
+ "11": "Law_and_Government",
24
+ "12": "Business_and_Industrial",
25
+ "13": "Health",
26
+ "14": "Real Estate",
27
+ "15": "Books_and_Literature",
28
+ "16": "Computers_and_Electronics",
29
+ "17": "Internet_and_Telecom",
30
+ "18": "Home_and_Garden",
31
+ "19": "Jobs_and_Education",
32
+ "20": "Online Communities",
33
+ "21": "Finance",
34
+ "22": "Arts_and_Entertainment",
35
+ "23": "Games",
36
+ "24": "Hobbies_and_Leisure",
37
+ "25": "Reference",
38
+ "26": "Pets_and_Animals"
39
+ },
40
+ "initializer_range": 0.02,
41
+ "label2id": {
42
+ "Adult": 4,
43
+ "Arts_and_Entertainment": 22,
44
+ "Autos_and_Vehicles": 10,
45
+ "Beauty_and_Fitness": 0,
46
+ "Books_and_Literature": 15,
47
+ "Business_and_Industrial": 12,
48
+ "Computers_and_Electronics": 16,
49
+ "Finance": 21,
50
+ "Food_and_Drink": 7,
51
+ "Games": 23,
52
+ "Health": 13,
53
+ "Hobbies_and_Leisure": 24,
54
+ "Home_and_Garden": 18,
55
+ "Internet_and_Telecom": 17,
56
+ "Jobs_and_Education": 19,
57
+ "Law_and_Government": 11,
58
+ "News": 8,
59
+ "Online Communities": 20,
60
+ "People_and_Society": 1,
61
+ "Pets_and_Animals": 26,
62
+ "Real Estate": 14,
63
+ "Reference": 25,
64
+ "Science": 6,
65
+ "Sensitive Subjects": 9,
66
+ "Shopping": 3,
67
+ "Sports": 5,
68
+ "Travel_and_Transportation": 2
69
+ },
70
+ "max_position_embeddings": 512,
71
+ "model_type": "distilbert",
72
+ "n_heads": 12,
73
+ "n_layers": 6,
74
+ "pad_token_id": 0,
75
+ "problem_type": "single_label_classification",
76
+ "qa_dropout": 0.1,
77
+ "seq_classif_dropout": 0.2,
78
+ "sinusoidal_pos_embds": false,
79
+ "tie_weights_": true,
80
+ "torch_dtype": "float32",
81
+ "transformers_version": "4.34.0",
82
+ "vocab_size": 30522
83
+ }
finetuned_entity_categorical_classification/checkpoint-12608/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5067b387ccee9053d789251b1a5c5acf414f391a88bf14a4a7c607312ff4f8f8
3
+ size 535881018
finetuned_entity_categorical_classification/checkpoint-12608/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b0aec1e67b9a8171d7b46316b23bbf9fee0086b5973a30240e840a0b0f91d6
3
+ size 267932842
finetuned_entity_categorical_classification/checkpoint-12608/rng_state.pth ADDED
Binary file (14.2 kB). View file
 
finetuned_entity_categorical_classification/checkpoint-12608/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5110991592dae080d60ce2bceb93f31532f0a386693c0950a2c500d7d21275c
3
+ size 1064
finetuned_entity_categorical_classification/checkpoint-12608/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
finetuned_entity_categorical_classification/checkpoint-12608/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-12608/tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "additional_special_tokens": [],
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "strip_accents": null,
53
+ "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "DistilBertTokenizer",
55
+ "unk_token": "[UNK]"
56
+ }
finetuned_entity_categorical_classification/checkpoint-12608/trainer_state.json ADDED
@@ -0,0 +1,241 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.21237443387508392,
3
+ "best_model_checkpoint": "finetuned_entity_categorical_classification/checkpoint-4728",
4
+ "epoch": 8.0,
5
+ "eval_steps": 500,
6
+ "global_step": 12608,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.32,
13
+ "learning_rate": 1.957698815566836e-05,
14
+ "loss": 1.5567,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.63,
19
+ "learning_rate": 1.915397631133672e-05,
20
+ "loss": 0.3944,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.95,
25
+ "learning_rate": 1.873096446700508e-05,
26
+ "loss": 0.2773,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "eval_accuracy": 0.9374900840869427,
32
+ "eval_loss": 0.2187376469373703,
33
+ "eval_runtime": 2.2114,
34
+ "eval_samples_per_second": 2850.256,
35
+ "eval_steps_per_second": 178.169,
36
+ "step": 1576
37
+ },
38
+ {
39
+ "epoch": 1.27,
40
+ "learning_rate": 1.830795262267344e-05,
41
+ "loss": 0.1997,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.59,
46
+ "learning_rate": 1.7884940778341796e-05,
47
+ "loss": 0.202,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 1.9,
52
+ "learning_rate": 1.7461928934010152e-05,
53
+ "loss": 0.1797,
54
+ "step": 3000
55
+ },
56
+ {
57
+ "epoch": 2.0,
58
+ "eval_accuracy": 0.9452641599238458,
59
+ "eval_loss": 0.22844311594963074,
60
+ "eval_runtime": 2.2403,
61
+ "eval_samples_per_second": 2813.437,
62
+ "eval_steps_per_second": 175.868,
63
+ "step": 3152
64
+ },
65
+ {
66
+ "epoch": 2.22,
67
+ "learning_rate": 1.7038917089678512e-05,
68
+ "loss": 0.148,
69
+ "step": 3500
70
+ },
71
+ {
72
+ "epoch": 2.54,
73
+ "learning_rate": 1.661590524534687e-05,
74
+ "loss": 0.1357,
75
+ "step": 4000
76
+ },
77
+ {
78
+ "epoch": 2.86,
79
+ "learning_rate": 1.619289340101523e-05,
80
+ "loss": 0.1525,
81
+ "step": 4500
82
+ },
83
+ {
84
+ "epoch": 3.0,
85
+ "eval_accuracy": 0.9481199428843408,
86
+ "eval_loss": 0.21237443387508392,
87
+ "eval_runtime": 2.2281,
88
+ "eval_samples_per_second": 2828.834,
89
+ "eval_steps_per_second": 176.83,
90
+ "step": 4728
91
+ },
92
+ {
93
+ "epoch": 3.17,
94
+ "learning_rate": 1.576988155668359e-05,
95
+ "loss": 0.1218,
96
+ "step": 5000
97
+ },
98
+ {
99
+ "epoch": 3.49,
100
+ "learning_rate": 1.5346869712351946e-05,
101
+ "loss": 0.1147,
102
+ "step": 5500
103
+ },
104
+ {
105
+ "epoch": 3.81,
106
+ "learning_rate": 1.4923857868020306e-05,
107
+ "loss": 0.1195,
108
+ "step": 6000
109
+ },
110
+ {
111
+ "epoch": 4.0,
112
+ "eval_accuracy": 0.94859590671109,
113
+ "eval_loss": 0.2216227501630783,
114
+ "eval_runtime": 2.2255,
115
+ "eval_samples_per_second": 2832.161,
116
+ "eval_steps_per_second": 177.038,
117
+ "step": 6304
118
+ },
119
+ {
120
+ "epoch": 4.12,
121
+ "learning_rate": 1.4500846023688663e-05,
122
+ "loss": 0.114,
123
+ "step": 6500
124
+ },
125
+ {
126
+ "epoch": 4.44,
127
+ "learning_rate": 1.4077834179357023e-05,
128
+ "loss": 0.104,
129
+ "step": 7000
130
+ },
131
+ {
132
+ "epoch": 4.76,
133
+ "learning_rate": 1.3654822335025382e-05,
134
+ "loss": 0.0936,
135
+ "step": 7500
136
+ },
137
+ {
138
+ "epoch": 5.0,
139
+ "eval_accuracy": 0.9462160875773441,
140
+ "eval_loss": 0.24313929677009583,
141
+ "eval_runtime": 2.1752,
142
+ "eval_samples_per_second": 2897.6,
143
+ "eval_steps_per_second": 181.129,
144
+ "step": 7880
145
+ },
146
+ {
147
+ "epoch": 5.08,
148
+ "learning_rate": 1.323181049069374e-05,
149
+ "loss": 0.099,
150
+ "step": 8000
151
+ },
152
+ {
153
+ "epoch": 5.39,
154
+ "learning_rate": 1.28087986463621e-05,
155
+ "loss": 0.0929,
156
+ "step": 8500
157
+ },
158
+ {
159
+ "epoch": 5.71,
160
+ "learning_rate": 1.2385786802030457e-05,
161
+ "loss": 0.0872,
162
+ "step": 9000
163
+ },
164
+ {
165
+ "epoch": 6.0,
166
+ "eval_accuracy": 0.9465333967951769,
167
+ "eval_loss": 0.25265371799468994,
168
+ "eval_runtime": 2.2222,
169
+ "eval_samples_per_second": 2836.351,
170
+ "eval_steps_per_second": 177.3,
171
+ "step": 9456
172
+ },
173
+ {
174
+ "epoch": 6.03,
175
+ "learning_rate": 1.1962774957698817e-05,
176
+ "loss": 0.0963,
177
+ "step": 9500
178
+ },
179
+ {
180
+ "epoch": 6.35,
181
+ "learning_rate": 1.1539763113367176e-05,
182
+ "loss": 0.0733,
183
+ "step": 10000
184
+ },
185
+ {
186
+ "epoch": 6.66,
187
+ "learning_rate": 1.1116751269035532e-05,
188
+ "loss": 0.0812,
189
+ "step": 10500
190
+ },
191
+ {
192
+ "epoch": 6.98,
193
+ "learning_rate": 1.0693739424703892e-05,
194
+ "loss": 0.0929,
195
+ "step": 11000
196
+ },
197
+ {
198
+ "epoch": 7.0,
199
+ "eval_accuracy": 0.9490718705378391,
200
+ "eval_loss": 0.23417465388774872,
201
+ "eval_runtime": 2.1699,
202
+ "eval_samples_per_second": 2904.721,
203
+ "eval_steps_per_second": 181.574,
204
+ "step": 11032
205
+ },
206
+ {
207
+ "epoch": 7.3,
208
+ "learning_rate": 1.0270727580372251e-05,
209
+ "loss": 0.0629,
210
+ "step": 11500
211
+ },
212
+ {
213
+ "epoch": 7.61,
214
+ "learning_rate": 9.84771573604061e-06,
215
+ "loss": 0.0802,
216
+ "step": 12000
217
+ },
218
+ {
219
+ "epoch": 7.93,
220
+ "learning_rate": 9.424703891708968e-06,
221
+ "loss": 0.0757,
222
+ "step": 12500
223
+ },
224
+ {
225
+ "epoch": 8.0,
226
+ "eval_accuracy": 0.9490718705378391,
227
+ "eval_loss": 0.24814845621585846,
228
+ "eval_runtime": 2.241,
229
+ "eval_samples_per_second": 2812.616,
230
+ "eval_steps_per_second": 175.816,
231
+ "step": 12608
232
+ }
233
+ ],
234
+ "logging_steps": 500,
235
+ "max_steps": 23640,
236
+ "num_train_epochs": 15,
237
+ "save_steps": 500,
238
+ "total_flos": 804434563822968.0,
239
+ "trial_name": null,
240
+ "trial_params": null
241
+ }
finetuned_entity_categorical_classification/checkpoint-12608/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665da3b0732e752c339d7e2fda57582d0f87bae18392c4edd4fe1327453b2e44
3
+ size 4600
finetuned_entity_categorical_classification/checkpoint-12608/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-14184/added_tokens.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "[CLS]": 101,
3
+ "[MASK]": 103,
4
+ "[PAD]": 0,
5
+ "[SEP]": 102,
6
+ "[UNK]": 100
7
+ }
finetuned_entity_categorical_classification/checkpoint-14184/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "Beauty_and_Fitness",
13
+ "1": "People_and_Society",
14
+ "2": "Travel_and_Transportation",
15
+ "3": "Shopping",
16
+ "4": "Adult",
17
+ "5": "Sports",
18
+ "6": "Science",
19
+ "7": "Food_and_Drink",
20
+ "8": "News",
21
+ "9": "Sensitive Subjects",
22
+ "10": "Autos_and_Vehicles",
23
+ "11": "Law_and_Government",
24
+ "12": "Business_and_Industrial",
25
+ "13": "Health",
26
+ "14": "Real Estate",
27
+ "15": "Books_and_Literature",
28
+ "16": "Computers_and_Electronics",
29
+ "17": "Internet_and_Telecom",
30
+ "18": "Home_and_Garden",
31
+ "19": "Jobs_and_Education",
32
+ "20": "Online Communities",
33
+ "21": "Finance",
34
+ "22": "Arts_and_Entertainment",
35
+ "23": "Games",
36
+ "24": "Hobbies_and_Leisure",
37
+ "25": "Reference",
38
+ "26": "Pets_and_Animals"
39
+ },
40
+ "initializer_range": 0.02,
41
+ "label2id": {
42
+ "Adult": 4,
43
+ "Arts_and_Entertainment": 22,
44
+ "Autos_and_Vehicles": 10,
45
+ "Beauty_and_Fitness": 0,
46
+ "Books_and_Literature": 15,
47
+ "Business_and_Industrial": 12,
48
+ "Computers_and_Electronics": 16,
49
+ "Finance": 21,
50
+ "Food_and_Drink": 7,
51
+ "Games": 23,
52
+ "Health": 13,
53
+ "Hobbies_and_Leisure": 24,
54
+ "Home_and_Garden": 18,
55
+ "Internet_and_Telecom": 17,
56
+ "Jobs_and_Education": 19,
57
+ "Law_and_Government": 11,
58
+ "News": 8,
59
+ "Online Communities": 20,
60
+ "People_and_Society": 1,
61
+ "Pets_and_Animals": 26,
62
+ "Real Estate": 14,
63
+ "Reference": 25,
64
+ "Science": 6,
65
+ "Sensitive Subjects": 9,
66
+ "Shopping": 3,
67
+ "Sports": 5,
68
+ "Travel_and_Transportation": 2
69
+ },
70
+ "max_position_embeddings": 512,
71
+ "model_type": "distilbert",
72
+ "n_heads": 12,
73
+ "n_layers": 6,
74
+ "pad_token_id": 0,
75
+ "problem_type": "single_label_classification",
76
+ "qa_dropout": 0.1,
77
+ "seq_classif_dropout": 0.2,
78
+ "sinusoidal_pos_embds": false,
79
+ "tie_weights_": true,
80
+ "torch_dtype": "float32",
81
+ "transformers_version": "4.34.0",
82
+ "vocab_size": 30522
83
+ }
finetuned_entity_categorical_classification/checkpoint-14184/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa590b9129b35b41a2d1ce971a668ce5e1163066050e58b78e70e810d954b14
3
+ size 535881018
finetuned_entity_categorical_classification/checkpoint-14184/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc27a7b4430993ed96dc4ca6a093c1d56f91af41b7dae7656f4123bafb7cc351
3
+ size 267932842
finetuned_entity_categorical_classification/checkpoint-14184/rng_state.pth ADDED
Binary file (14.2 kB). View file
 
finetuned_entity_categorical_classification/checkpoint-14184/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91556a0da86661baaedcd0c391f9995fe50cace2508f811078e409ba7f709686
3
+ size 1064
finetuned_entity_categorical_classification/checkpoint-14184/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
finetuned_entity_categorical_classification/checkpoint-14184/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-14184/tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "additional_special_tokens": [],
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "strip_accents": null,
53
+ "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "DistilBertTokenizer",
55
+ "unk_token": "[UNK]"
56
+ }
finetuned_entity_categorical_classification/checkpoint-14184/trainer_state.json ADDED
@@ -0,0 +1,268 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.21237443387508392,
3
+ "best_model_checkpoint": "finetuned_entity_categorical_classification/checkpoint-4728",
4
+ "epoch": 9.0,
5
+ "eval_steps": 500,
6
+ "global_step": 14184,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.32,
13
+ "learning_rate": 1.957698815566836e-05,
14
+ "loss": 1.5567,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.63,
19
+ "learning_rate": 1.915397631133672e-05,
20
+ "loss": 0.3944,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.95,
25
+ "learning_rate": 1.873096446700508e-05,
26
+ "loss": 0.2773,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "eval_accuracy": 0.9374900840869427,
32
+ "eval_loss": 0.2187376469373703,
33
+ "eval_runtime": 2.2114,
34
+ "eval_samples_per_second": 2850.256,
35
+ "eval_steps_per_second": 178.169,
36
+ "step": 1576
37
+ },
38
+ {
39
+ "epoch": 1.27,
40
+ "learning_rate": 1.830795262267344e-05,
41
+ "loss": 0.1997,
42
+ "step": 2000
43
+ },
44
+ {
45
+ "epoch": 1.59,
46
+ "learning_rate": 1.7884940778341796e-05,
47
+ "loss": 0.202,
48
+ "step": 2500
49
+ },
50
+ {
51
+ "epoch": 1.9,
52
+ "learning_rate": 1.7461928934010152e-05,
53
+ "loss": 0.1797,
54
+ "step": 3000
55
+ },
56
+ {
57
+ "epoch": 2.0,
58
+ "eval_accuracy": 0.9452641599238458,
59
+ "eval_loss": 0.22844311594963074,
60
+ "eval_runtime": 2.2403,
61
+ "eval_samples_per_second": 2813.437,
62
+ "eval_steps_per_second": 175.868,
63
+ "step": 3152
64
+ },
65
+ {
66
+ "epoch": 2.22,
67
+ "learning_rate": 1.7038917089678512e-05,
68
+ "loss": 0.148,
69
+ "step": 3500
70
+ },
71
+ {
72
+ "epoch": 2.54,
73
+ "learning_rate": 1.661590524534687e-05,
74
+ "loss": 0.1357,
75
+ "step": 4000
76
+ },
77
+ {
78
+ "epoch": 2.86,
79
+ "learning_rate": 1.619289340101523e-05,
80
+ "loss": 0.1525,
81
+ "step": 4500
82
+ },
83
+ {
84
+ "epoch": 3.0,
85
+ "eval_accuracy": 0.9481199428843408,
86
+ "eval_loss": 0.21237443387508392,
87
+ "eval_runtime": 2.2281,
88
+ "eval_samples_per_second": 2828.834,
89
+ "eval_steps_per_second": 176.83,
90
+ "step": 4728
91
+ },
92
+ {
93
+ "epoch": 3.17,
94
+ "learning_rate": 1.576988155668359e-05,
95
+ "loss": 0.1218,
96
+ "step": 5000
97
+ },
98
+ {
99
+ "epoch": 3.49,
100
+ "learning_rate": 1.5346869712351946e-05,
101
+ "loss": 0.1147,
102
+ "step": 5500
103
+ },
104
+ {
105
+ "epoch": 3.81,
106
+ "learning_rate": 1.4923857868020306e-05,
107
+ "loss": 0.1195,
108
+ "step": 6000
109
+ },
110
+ {
111
+ "epoch": 4.0,
112
+ "eval_accuracy": 0.94859590671109,
113
+ "eval_loss": 0.2216227501630783,
114
+ "eval_runtime": 2.2255,
115
+ "eval_samples_per_second": 2832.161,
116
+ "eval_steps_per_second": 177.038,
117
+ "step": 6304
118
+ },
119
+ {
120
+ "epoch": 4.12,
121
+ "learning_rate": 1.4500846023688663e-05,
122
+ "loss": 0.114,
123
+ "step": 6500
124
+ },
125
+ {
126
+ "epoch": 4.44,
127
+ "learning_rate": 1.4077834179357023e-05,
128
+ "loss": 0.104,
129
+ "step": 7000
130
+ },
131
+ {
132
+ "epoch": 4.76,
133
+ "learning_rate": 1.3654822335025382e-05,
134
+ "loss": 0.0936,
135
+ "step": 7500
136
+ },
137
+ {
138
+ "epoch": 5.0,
139
+ "eval_accuracy": 0.9462160875773441,
140
+ "eval_loss": 0.24313929677009583,
141
+ "eval_runtime": 2.1752,
142
+ "eval_samples_per_second": 2897.6,
143
+ "eval_steps_per_second": 181.129,
144
+ "step": 7880
145
+ },
146
+ {
147
+ "epoch": 5.08,
148
+ "learning_rate": 1.323181049069374e-05,
149
+ "loss": 0.099,
150
+ "step": 8000
151
+ },
152
+ {
153
+ "epoch": 5.39,
154
+ "learning_rate": 1.28087986463621e-05,
155
+ "loss": 0.0929,
156
+ "step": 8500
157
+ },
158
+ {
159
+ "epoch": 5.71,
160
+ "learning_rate": 1.2385786802030457e-05,
161
+ "loss": 0.0872,
162
+ "step": 9000
163
+ },
164
+ {
165
+ "epoch": 6.0,
166
+ "eval_accuracy": 0.9465333967951769,
167
+ "eval_loss": 0.25265371799468994,
168
+ "eval_runtime": 2.2222,
169
+ "eval_samples_per_second": 2836.351,
170
+ "eval_steps_per_second": 177.3,
171
+ "step": 9456
172
+ },
173
+ {
174
+ "epoch": 6.03,
175
+ "learning_rate": 1.1962774957698817e-05,
176
+ "loss": 0.0963,
177
+ "step": 9500
178
+ },
179
+ {
180
+ "epoch": 6.35,
181
+ "learning_rate": 1.1539763113367176e-05,
182
+ "loss": 0.0733,
183
+ "step": 10000
184
+ },
185
+ {
186
+ "epoch": 6.66,
187
+ "learning_rate": 1.1116751269035532e-05,
188
+ "loss": 0.0812,
189
+ "step": 10500
190
+ },
191
+ {
192
+ "epoch": 6.98,
193
+ "learning_rate": 1.0693739424703892e-05,
194
+ "loss": 0.0929,
195
+ "step": 11000
196
+ },
197
+ {
198
+ "epoch": 7.0,
199
+ "eval_accuracy": 0.9490718705378391,
200
+ "eval_loss": 0.23417465388774872,
201
+ "eval_runtime": 2.1699,
202
+ "eval_samples_per_second": 2904.721,
203
+ "eval_steps_per_second": 181.574,
204
+ "step": 11032
205
+ },
206
+ {
207
+ "epoch": 7.3,
208
+ "learning_rate": 1.0270727580372251e-05,
209
+ "loss": 0.0629,
210
+ "step": 11500
211
+ },
212
+ {
213
+ "epoch": 7.61,
214
+ "learning_rate": 9.84771573604061e-06,
215
+ "loss": 0.0802,
216
+ "step": 12000
217
+ },
218
+ {
219
+ "epoch": 7.93,
220
+ "learning_rate": 9.424703891708968e-06,
221
+ "loss": 0.0757,
222
+ "step": 12500
223
+ },
224
+ {
225
+ "epoch": 8.0,
226
+ "eval_accuracy": 0.9490718705378391,
227
+ "eval_loss": 0.24814845621585846,
228
+ "eval_runtime": 2.241,
229
+ "eval_samples_per_second": 2812.616,
230
+ "eval_steps_per_second": 175.816,
231
+ "step": 12608
232
+ },
233
+ {
234
+ "epoch": 8.25,
235
+ "learning_rate": 9.001692047377328e-06,
236
+ "loss": 0.063,
237
+ "step": 13000
238
+ },
239
+ {
240
+ "epoch": 8.57,
241
+ "learning_rate": 8.578680203045686e-06,
242
+ "loss": 0.0619,
243
+ "step": 13500
244
+ },
245
+ {
246
+ "epoch": 8.88,
247
+ "learning_rate": 8.155668358714045e-06,
248
+ "loss": 0.0673,
249
+ "step": 14000
250
+ },
251
+ {
252
+ "epoch": 9.0,
253
+ "eval_accuracy": 0.9474853244486753,
254
+ "eval_loss": 0.2526280879974365,
255
+ "eval_runtime": 2.1778,
256
+ "eval_samples_per_second": 2894.229,
257
+ "eval_steps_per_second": 180.918,
258
+ "step": 14184
259
+ }
260
+ ],
261
+ "logging_steps": 500,
262
+ "max_steps": 23640,
263
+ "num_train_epochs": 15,
264
+ "save_steps": 500,
265
+ "total_flos": 904402998290376.0,
266
+ "trial_name": null,
267
+ "trial_params": null
268
+ }
finetuned_entity_categorical_classification/checkpoint-14184/training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:665da3b0732e752c339d7e2fda57582d0f87bae18392c4edd4fe1327453b2e44
3
+ size 4600
finetuned_entity_categorical_classification/checkpoint-14184/vocab.txt ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-1576/added_tokens.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "[CLS]": 101,
3
+ "[MASK]": 103,
4
+ "[PAD]": 0,
5
+ "[SEP]": 102,
6
+ "[UNK]": 100
7
+ }
finetuned_entity_categorical_classification/checkpoint-1576/config.json ADDED
@@ -0,0 +1,83 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "Beauty_and_Fitness",
13
+ "1": "People_and_Society",
14
+ "2": "Travel_and_Transportation",
15
+ "3": "Shopping",
16
+ "4": "Adult",
17
+ "5": "Sports",
18
+ "6": "Science",
19
+ "7": "Food_and_Drink",
20
+ "8": "News",
21
+ "9": "Sensitive Subjects",
22
+ "10": "Autos_and_Vehicles",
23
+ "11": "Law_and_Government",
24
+ "12": "Business_and_Industrial",
25
+ "13": "Health",
26
+ "14": "Real Estate",
27
+ "15": "Books_and_Literature",
28
+ "16": "Computers_and_Electronics",
29
+ "17": "Internet_and_Telecom",
30
+ "18": "Home_and_Garden",
31
+ "19": "Jobs_and_Education",
32
+ "20": "Online Communities",
33
+ "21": "Finance",
34
+ "22": "Arts_and_Entertainment",
35
+ "23": "Games",
36
+ "24": "Hobbies_and_Leisure",
37
+ "25": "Reference",
38
+ "26": "Pets_and_Animals"
39
+ },
40
+ "initializer_range": 0.02,
41
+ "label2id": {
42
+ "Adult": 4,
43
+ "Arts_and_Entertainment": 22,
44
+ "Autos_and_Vehicles": 10,
45
+ "Beauty_and_Fitness": 0,
46
+ "Books_and_Literature": 15,
47
+ "Business_and_Industrial": 12,
48
+ "Computers_and_Electronics": 16,
49
+ "Finance": 21,
50
+ "Food_and_Drink": 7,
51
+ "Games": 23,
52
+ "Health": 13,
53
+ "Hobbies_and_Leisure": 24,
54
+ "Home_and_Garden": 18,
55
+ "Internet_and_Telecom": 17,
56
+ "Jobs_and_Education": 19,
57
+ "Law_and_Government": 11,
58
+ "News": 8,
59
+ "Online Communities": 20,
60
+ "People_and_Society": 1,
61
+ "Pets_and_Animals": 26,
62
+ "Real Estate": 14,
63
+ "Reference": 25,
64
+ "Science": 6,
65
+ "Sensitive Subjects": 9,
66
+ "Shopping": 3,
67
+ "Sports": 5,
68
+ "Travel_and_Transportation": 2
69
+ },
70
+ "max_position_embeddings": 512,
71
+ "model_type": "distilbert",
72
+ "n_heads": 12,
73
+ "n_layers": 6,
74
+ "pad_token_id": 0,
75
+ "problem_type": "single_label_classification",
76
+ "qa_dropout": 0.1,
77
+ "seq_classif_dropout": 0.2,
78
+ "sinusoidal_pos_embds": false,
79
+ "tie_weights_": true,
80
+ "torch_dtype": "float32",
81
+ "transformers_version": "4.34.0",
82
+ "vocab_size": 30522
83
+ }
finetuned_entity_categorical_classification/checkpoint-1576/optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e20e493b3480b24380280eb5e21c5fd12d4881adfb9cb57a5dd4559f3e85680
3
+ size 535881018
finetuned_entity_categorical_classification/checkpoint-1576/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:732fd46b0cb9afaec1d14b6595994279ae8d82e40715c5b60b128db60718e69b
3
+ size 267932842
finetuned_entity_categorical_classification/checkpoint-1576/rng_state.pth ADDED
Binary file (14.2 kB). View file
 
finetuned_entity_categorical_classification/checkpoint-1576/scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:774c81fc50874cca433d334a482dfa90f04ccfdc642ea608612d6233e8d60700
3
+ size 1064
finetuned_entity_categorical_classification/checkpoint-1576/special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
finetuned_entity_categorical_classification/checkpoint-1576/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
finetuned_entity_categorical_classification/checkpoint-1576/tokenizer_config.json ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "additional_special_tokens": [],
45
+ "clean_up_tokenization_spaces": true,
46
+ "cls_token": "[CLS]",
47
+ "do_lower_case": true,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "pad_token": "[PAD]",
51
+ "sep_token": "[SEP]",
52
+ "strip_accents": null,
53
+ "tokenize_chinese_chars": true,
54
+ "tokenizer_class": "DistilBertTokenizer",
55
+ "unk_token": "[UNK]"
56
+ }
finetuned_entity_categorical_classification/checkpoint-1576/trainer_state.json ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.2187376469373703,
3
+ "best_model_checkpoint": "finetuned_entity_categorical_classification/checkpoint-1576",
4
+ "epoch": 1.0,
5
+ "eval_steps": 500,
6
+ "global_step": 1576,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.32,
13
+ "learning_rate": 1.957698815566836e-05,
14
+ "loss": 1.5567,
15
+ "step": 500
16
+ },
17
+ {
18
+ "epoch": 0.63,
19
+ "learning_rate": 1.915397631133672e-05,
20
+ "loss": 0.3944,
21
+ "step": 1000
22
+ },
23
+ {
24
+ "epoch": 0.95,
25
+ "learning_rate": 1.873096446700508e-05,
26
+ "loss": 0.2773,
27
+ "step": 1500
28
+ },
29
+ {
30
+ "epoch": 1.0,
31
+ "eval_accuracy": 0.9374900840869427,
32
+ "eval_loss": 0.2187376469373703,
33
+ "eval_runtime": 2.2114,
34
+ "eval_samples_per_second": 2850.256,
35
+ "eval_steps_per_second": 178.169,
36
+ "step": 1576
37
+ }
38
+ ],
39
+ "logging_steps": 500,
40
+ "max_steps": 23640,
41
+ "num_train_epochs": 15,
42
+ "save_steps": 500,
43
+ "total_flos": 100414675899720.0,
44
+ "trial_name": null,
45
+ "trial_params": null
46
+ }