cp 2800
Browse files- optimizer.pt +1 -1
- pytorch_model.bin +1 -1
- scheduler.pt +1 -1
- trainer_state.json +31 -3
optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2490339591
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:415f789cebf94dc975e2af37856a750f6a78c4e12af0b81cbeef753992d90419
|
3 |
size 2490339591
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1262065048
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0dc27a79ad93085f47b570fdaf3825b555caa80cf07cabe1ba820b1fd6247b8a
|
3 |
size 1262065048
|
scheduler.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 623
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69fca0da0f8fa986f151fcf8b07e0888193c079c13d2d8004abe9580c45c5584
|
3 |
size 623
|
trainer_state.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
-
"epoch": 2.
|
5 |
-
"global_step":
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
@@ -76,11 +76,39 @@
|
|
76 |
"eval_samples_per_second": 7.991,
|
77 |
"eval_wer": 0.42106879606879605,
|
78 |
"step": 2000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
79 |
}
|
80 |
],
|
81 |
"max_steps": 29490,
|
82 |
"num_train_epochs": 30,
|
83 |
-
"total_flos": 1.
|
84 |
"trial_name": null,
|
85 |
"trial_params": null
|
86 |
}
|
|
|
1 |
{
|
2 |
"best_metric": null,
|
3 |
"best_model_checkpoint": null,
|
4 |
+
"epoch": 2.8484231943031535,
|
5 |
+
"global_step": 2800,
|
6 |
"is_hyper_param_search": false,
|
7 |
"is_local_process_zero": true,
|
8 |
"is_world_process_zero": true,
|
|
|
76 |
"eval_samples_per_second": 7.991,
|
77 |
"eval_wer": 0.42106879606879605,
|
78 |
"step": 2000
|
79 |
+
},
|
80 |
+
{
|
81 |
+
"epoch": 2.44,
|
82 |
+
"learning_rate": 0.0002803380476026216,
|
83 |
+
"loss": 0.2606,
|
84 |
+
"step": 2400
|
85 |
+
},
|
86 |
+
{
|
87 |
+
"epoch": 2.44,
|
88 |
+
"eval_loss": 0.39613404870033264,
|
89 |
+
"eval_runtime": 233.8224,
|
90 |
+
"eval_samples_per_second": 8.002,
|
91 |
+
"eval_wer": 0.4057125307125307,
|
92 |
+
"step": 2400
|
93 |
+
},
|
94 |
+
{
|
95 |
+
"epoch": 2.85,
|
96 |
+
"learning_rate": 0.0002761986892031735,
|
97 |
+
"loss": 0.2475,
|
98 |
+
"step": 2800
|
99 |
+
},
|
100 |
+
{
|
101 |
+
"epoch": 2.85,
|
102 |
+
"eval_loss": 0.3680589497089386,
|
103 |
+
"eval_runtime": 235.255,
|
104 |
+
"eval_samples_per_second": 7.953,
|
105 |
+
"eval_wer": 0.39256756756756755,
|
106 |
+
"step": 2800
|
107 |
}
|
108 |
],
|
109 |
"max_steps": 29490,
|
110 |
"num_train_epochs": 30,
|
111 |
+
"total_flos": 1.5548475390462444e+19,
|
112 |
"trial_name": null,
|
113 |
"trial_params": null
|
114 |
}
|