langecod commited on
Commit
4d26e42
1 Parent(s): b0d14a4

Upload 13 files

Browse files
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d9eff9d490ea169b19c96ec0b7a7aa47e850cad8df78fbf4db75d91ed2bfd8ad
3
+ size 713814663
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f3134c9dd5033c3a89cb338119f227d68ef1261e80f374ccf72042459f980cf
3
  size 1421591285
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6066ad4414615b6368555670b459519b2820e6b99ee620f01150d2e2756b8639
3
  size 1421591285
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77a2047396ff3a03eafb808ad429303a7a717ab9bdf2f4620b0795d537b1fd0c
3
+ size 14575
scaler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:365dfcb3374d3aec2825a15b9cf142dba091285f91be8d42e49a8ac8a7d8ba6c
3
+ size 557
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da46f0788b903dbf639a0a6caca06a50b8d0e108bfa4679f0632362fea827fbc
3
+ size 627
tokenizer.json CHANGED
@@ -2,13 +2,13 @@
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
- "max_length": 135,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
- "Fixed": 135
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
 
2
  "version": "1.0",
3
  "truncation": {
4
  "direction": "Right",
5
+ "max_length": 133,
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
  "padding": {
10
  "strategy": {
11
+ "Fixed": 133
12
  },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
trainer_state.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.13875289261341095,
3
+ "best_model_checkpoint": "Sentiment_Analysis_1stPass\\checkpoint-176",
4
+ "epoch": 4.0,
5
+ "global_step": 176,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_accuracy": 0.8753623188405797,
13
+ "eval_f1_macro": 0.8703821629281211,
14
+ "eval_f1_weighted": 0.8772325635732019,
15
+ "eval_loss": 0.5208103060722351,
16
+ "eval_precision_macro": 0.8405041286397218,
17
+ "eval_precision_weighted": 0.899241350641498,
18
+ "eval_recall_macro": 0.9222675594092165,
19
+ "eval_recall_weighted": 0.8753623188405797,
20
+ "eval_runtime": 0.879,
21
+ "eval_samples_per_second": 392.476,
22
+ "eval_steps_per_second": 6.826,
23
+ "step": 44
24
+ },
25
+ {
26
+ "epoch": 2.0,
27
+ "eval_accuracy": 0.9391304347826087,
28
+ "eval_f1_macro": 0.9313039001501803,
29
+ "eval_f1_weighted": 0.9395501058165897,
30
+ "eval_loss": 0.22994813323020935,
31
+ "eval_precision_macro": 0.9169520950537658,
32
+ "eval_precision_weighted": 0.9419409097611233,
33
+ "eval_recall_macro": 0.947968910690742,
34
+ "eval_recall_weighted": 0.9391304347826087,
35
+ "eval_runtime": 0.9126,
36
+ "eval_samples_per_second": 378.058,
37
+ "eval_steps_per_second": 6.575,
38
+ "step": 88
39
+ },
40
+ {
41
+ "epoch": 3.0,
42
+ "eval_accuracy": 0.936231884057971,
43
+ "eval_f1_macro": 0.9263587826781255,
44
+ "eval_f1_weighted": 0.9366114221156357,
45
+ "eval_loss": 0.2097598910331726,
46
+ "eval_precision_macro": 0.9145166032673613,
47
+ "eval_precision_weighted": 0.9386677436958241,
48
+ "eval_recall_macro": 0.940032402754234,
49
+ "eval_recall_weighted": 0.936231884057971,
50
+ "eval_runtime": 0.8647,
51
+ "eval_samples_per_second": 398.986,
52
+ "eval_steps_per_second": 6.939,
53
+ "step": 132
54
+ },
55
+ {
56
+ "epoch": 4.0,
57
+ "eval_accuracy": 0.9623188405797102,
58
+ "eval_f1_macro": 0.9548373952056096,
59
+ "eval_f1_weighted": 0.962275452270214,
60
+ "eval_loss": 0.13875289261341095,
61
+ "eval_precision_macro": 0.9579058508118398,
62
+ "eval_precision_weighted": 0.9622718192803769,
63
+ "eval_recall_macro": 0.9518634083897131,
64
+ "eval_recall_weighted": 0.9623188405797102,
65
+ "eval_runtime": 0.9154,
66
+ "eval_samples_per_second": 376.876,
67
+ "eval_steps_per_second": 6.554,
68
+ "step": 176
69
+ }
70
+ ],
71
+ "max_steps": 660,
72
+ "num_train_epochs": 15,
73
+ "total_flos": 2674550119470096.0,
74
+ "trial_name": null,
75
+ "trial_params": null
76
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:090bce03ba80405dcd41540fb6d1c8768803e726c36be241275d952d0cd149a7
3
+ size 3899