marinone94 committed on
Commit
881b745
•
1 Parent(s): fc2f4cd

Training in progress, step 3000

Browse files
{checkpoint-2600 → checkpoint-2900}/config.json RENAMED
File without changes
{checkpoint-2600 → checkpoint-2900}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:446a2b6be86378473522da6f8340e8995c1f93f317dbf12dd45b200fe2a7cc10
3
  size 2490337809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:459fd9cc8b47164c5e619165015eaa256572f1c2c4cf53b6619361a7675d46a1
3
  size 2490337809
{checkpoint-2600 → checkpoint-2900}/preprocessor_config.json RENAMED
File without changes
{checkpoint-2700 → checkpoint-2900}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7dbbb4678046f14503aa95af2d02c0cc6a2fb7071e468967b463cf71594e2914
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d39abe947b6927f79b7ffad55a6a3ba07cdd2ab995efc1159bb1ca188d440e7f
3
  size 1262063089
{checkpoint-2600 → checkpoint-2900}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c9452e603549f04f4903c5fb527b7bfc83e1fbaca4162bb7fdd612e22dd24235
3
  size 14567
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d40993892ed72701230daaea4a79ca45b84c615b387b7bc61e6e9982f8358e4
3
  size 14567
{checkpoint-2700 → checkpoint-2900}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7970626d52baf6e9c965f8503c1a6318b3c55b1f5ba73fdd8b8209e28d5d529e
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:daedbf6df7d4c1927bb965444b3e2d13f98980e3a59e64cf90683cbd1e80bdf5
3
  size 559
{checkpoint-2600 → checkpoint-2900}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7e6505acc346b949554e5cbd939e1a9cf4a757843e611b8b1dc1e36690134723
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da5b41dc4267a4eb8832f6b51e0de784a14e4fa5985ff5c1c6135876b04560d7
3
  size 623
{checkpoint-2700 → checkpoint-2900}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 29.666666666666668,
5
- "global_step": 2700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1059,11 +1059,89 @@
1059
  "eval_steps_per_second": 0.803,
1060
  "eval_wer": 0.14774340051092819,
1061
  "step": 2700
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1062
  }
1063
  ],
1064
  "max_steps": 4550,
1065
  "num_train_epochs": 50,
1066
- "total_flos": 4.176183820424104e+19,
1067
  "trial_name": null,
1068
  "trial_params": null
1069
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 31.863387978142075,
5
+ "global_step": 2900,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1059
  "eval_steps_per_second": 0.803,
1060
  "eval_wer": 0.14774340051092819,
1061
  "step": 2700
1062
+ },
1063
+ {
1064
+ "epoch": 29.89,
1065
+ "learning_rate": 0.0001796078431372549,
1066
+ "loss": 0.8573,
1067
+ "step": 2720
1068
+ },
1069
+ {
1070
+ "epoch": 30.11,
1071
+ "learning_rate": 0.00017764705882352942,
1072
+ "loss": 0.8686,
1073
+ "step": 2740
1074
+ },
1075
+ {
1076
+ "epoch": 30.33,
1077
+ "learning_rate": 0.00017568627450980392,
1078
+ "loss": 0.8462,
1079
+ "step": 2760
1080
+ },
1081
+ {
1082
+ "epoch": 30.55,
1083
+ "learning_rate": 0.00017372549019607845,
1084
+ "loss": 0.8419,
1085
+ "step": 2780
1086
+ },
1087
+ {
1088
+ "epoch": 30.77,
1089
+ "learning_rate": 0.00017176470588235293,
1090
+ "loss": 0.8659,
1091
+ "step": 2800
1092
+ },
1093
+ {
1094
+ "epoch": 30.77,
1095
+ "eval_loss": 0.1636602133512497,
1096
+ "eval_runtime": 190.245,
1097
+ "eval_samples_per_second": 25.457,
1098
+ "eval_steps_per_second": 0.799,
1099
+ "eval_wer": 0.1422367300596083,
1100
+ "step": 2800
1101
+ },
1102
+ {
1103
+ "epoch": 30.98,
1104
+ "learning_rate": 0.00016980392156862745,
1105
+ "loss": 0.8607,
1106
+ "step": 2820
1107
+ },
1108
+ {
1109
+ "epoch": 31.21,
1110
+ "learning_rate": 0.00016784313725490196,
1111
+ "loss": 0.8484,
1112
+ "step": 2840
1113
+ },
1114
+ {
1115
+ "epoch": 31.43,
1116
+ "learning_rate": 0.00016588235294117648,
1117
+ "loss": 0.8335,
1118
+ "step": 2860
1119
+ },
1120
+ {
1121
+ "epoch": 31.64,
1122
+ "learning_rate": 0.00016392156862745098,
1123
+ "loss": 0.8321,
1124
+ "step": 2880
1125
+ },
1126
+ {
1127
+ "epoch": 31.86,
1128
+ "learning_rate": 0.00016196078431372549,
1129
+ "loss": 0.8419,
1130
+ "step": 2900
1131
+ },
1132
+ {
1133
+ "epoch": 31.86,
1134
+ "eval_loss": 0.16137854754924774,
1135
+ "eval_runtime": 190.2053,
1136
+ "eval_samples_per_second": 25.462,
1137
+ "eval_steps_per_second": 0.799,
1138
+ "eval_wer": 0.1397104740278172,
1139
+ "step": 2900
1140
  }
1141
  ],
1142
  "max_steps": 4550,
1143
  "num_train_epochs": 50,
1144
+ "total_flos": 4.48632216197919e+19,
1145
  "trial_name": null,
1146
  "trial_params": null
1147
  }
{checkpoint-2600 → checkpoint-2900}/training_args.bin RENAMED
File without changes
{checkpoint-2700 → checkpoint-3000}/config.json RENAMED
File without changes
{checkpoint-2700 → checkpoint-3000}/optimizer.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:865f44abdd5045a8acf626b3b992e8fdc983a2d4a3ba5dd6901b27ee83a91484
3
  size 2490337809
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:023713187972aa2b714a036a65a7542d7e006ad45109ce7ddc7eafb956260fe3
3
  size 2490337809
{checkpoint-2700 → checkpoint-3000}/preprocessor_config.json RENAMED
File without changes
{checkpoint-2600 → checkpoint-3000}/pytorch_model.bin RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:91a8acf504932720b905a27cdf2f6f7fe41c15519686ef918a30514dacbc0cee
3
  size 1262063089
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e2564558a2c8e9677d5526af137102a80a73cbd4be834bcb3fa95a0e5c8ecef
3
  size 1262063089
{checkpoint-2700 → checkpoint-3000}/rng_state.pth RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9213f1eed5d75326eef26e352d35aa78d567c2885250ab304bce7d59c834157a
3
- size 14631
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:813a474ad7f864479df922c7e373032d552ed88f79371c0f5114bee90fb0f0c6
3
+ size 14567
{checkpoint-2600 → checkpoint-3000}/scaler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:981227375b8c6d2439b9fd2664e9cd784500649faa2e607c97ed38e07fc17be3
3
  size 559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba461c86794433c4a650b89cfa19a2a74f927a6e243d52bc4fa86b75cc0b4312
3
  size 559
{checkpoint-2700 → checkpoint-3000}/scheduler.pt RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:89b50e7b743fe5caf734a580430810fca62d132f602e2a17e8e075ce20b82717
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fff88e552e894e867e2247a229e76319848f876eaeb56445f8251bd260defd4d
3
  size 623
{checkpoint-2600 → checkpoint-3000}/trainer_state.json RENAMED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 28.56830601092896,
5
- "global_step": 2600,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1020,11 +1020,167 @@
1020
  "eval_steps_per_second": 0.774,
1021
  "eval_wer": 0.14459267669599773,
1022
  "step": 2600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1023
  }
1024
  ],
1025
  "max_steps": 4550,
1026
  "num_train_epochs": 50,
1027
- "total_flos": 4.023333138533005e+19,
1028
  "trial_name": null,
1029
  "trial_params": null
1030
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 32.96174863387978,
5
+ "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1020
  "eval_steps_per_second": 0.774,
1021
  "eval_wer": 0.14459267669599773,
1022
  "step": 2600
1023
+ },
1024
+ {
1025
+ "epoch": 28.79,
1026
+ "learning_rate": 0.00018941176470588236,
1027
+ "loss": 0.8796,
1028
+ "step": 2620
1029
+ },
1030
+ {
1031
+ "epoch": 29.01,
1032
+ "learning_rate": 0.00018745098039215686,
1033
+ "loss": 0.9045,
1034
+ "step": 2640
1035
+ },
1036
+ {
1037
+ "epoch": 29.23,
1038
+ "learning_rate": 0.00018549019607843137,
1039
+ "loss": 0.8515,
1040
+ "step": 2660
1041
+ },
1042
+ {
1043
+ "epoch": 29.45,
1044
+ "learning_rate": 0.0001835294117647059,
1045
+ "loss": 0.861,
1046
+ "step": 2680
1047
+ },
1048
+ {
1049
+ "epoch": 29.67,
1050
+ "learning_rate": 0.0001815686274509804,
1051
+ "loss": 0.8513,
1052
+ "step": 2700
1053
+ },
1054
+ {
1055
+ "epoch": 29.67,
1056
+ "eval_loss": 0.16488835215568542,
1057
+ "eval_runtime": 189.1938,
1058
+ "eval_samples_per_second": 25.598,
1059
+ "eval_steps_per_second": 0.803,
1060
+ "eval_wer": 0.14774340051092819,
1061
+ "step": 2700
1062
+ },
1063
+ {
1064
+ "epoch": 29.89,
1065
+ "learning_rate": 0.0001796078431372549,
1066
+ "loss": 0.8573,
1067
+ "step": 2720
1068
+ },
1069
+ {
1070
+ "epoch": 30.11,
1071
+ "learning_rate": 0.00017764705882352942,
1072
+ "loss": 0.8686,
1073
+ "step": 2740
1074
+ },
1075
+ {
1076
+ "epoch": 30.33,
1077
+ "learning_rate": 0.00017568627450980392,
1078
+ "loss": 0.8462,
1079
+ "step": 2760
1080
+ },
1081
+ {
1082
+ "epoch": 30.55,
1083
+ "learning_rate": 0.00017372549019607845,
1084
+ "loss": 0.8419,
1085
+ "step": 2780
1086
+ },
1087
+ {
1088
+ "epoch": 30.77,
1089
+ "learning_rate": 0.00017176470588235293,
1090
+ "loss": 0.8659,
1091
+ "step": 2800
1092
+ },
1093
+ {
1094
+ "epoch": 30.77,
1095
+ "eval_loss": 0.1636602133512497,
1096
+ "eval_runtime": 190.245,
1097
+ "eval_samples_per_second": 25.457,
1098
+ "eval_steps_per_second": 0.799,
1099
+ "eval_wer": 0.1422367300596083,
1100
+ "step": 2800
1101
+ },
1102
+ {
1103
+ "epoch": 30.98,
1104
+ "learning_rate": 0.00016980392156862745,
1105
+ "loss": 0.8607,
1106
+ "step": 2820
1107
+ },
1108
+ {
1109
+ "epoch": 31.21,
1110
+ "learning_rate": 0.00016784313725490196,
1111
+ "loss": 0.8484,
1112
+ "step": 2840
1113
+ },
1114
+ {
1115
+ "epoch": 31.43,
1116
+ "learning_rate": 0.00016588235294117648,
1117
+ "loss": 0.8335,
1118
+ "step": 2860
1119
+ },
1120
+ {
1121
+ "epoch": 31.64,
1122
+ "learning_rate": 0.00016392156862745098,
1123
+ "loss": 0.8321,
1124
+ "step": 2880
1125
+ },
1126
+ {
1127
+ "epoch": 31.86,
1128
+ "learning_rate": 0.00016196078431372549,
1129
+ "loss": 0.8419,
1130
+ "step": 2900
1131
+ },
1132
+ {
1133
+ "epoch": 31.86,
1134
+ "eval_loss": 0.16137854754924774,
1135
+ "eval_runtime": 190.2053,
1136
+ "eval_samples_per_second": 25.462,
1137
+ "eval_steps_per_second": 0.799,
1138
+ "eval_wer": 0.1397104740278172,
1139
+ "step": 2900
1140
+ },
1141
+ {
1142
+ "epoch": 32.09,
1143
+ "learning_rate": 0.00016,
1144
+ "loss": 0.8634,
1145
+ "step": 2920
1146
+ },
1147
+ {
1148
+ "epoch": 32.31,
1149
+ "learning_rate": 0.00015803921568627451,
1150
+ "loss": 0.8351,
1151
+ "step": 2940
1152
+ },
1153
+ {
1154
+ "epoch": 32.52,
1155
+ "learning_rate": 0.00015607843137254901,
1156
+ "loss": 0.8427,
1157
+ "step": 2960
1158
+ },
1159
+ {
1160
+ "epoch": 32.74,
1161
+ "learning_rate": 0.00015411764705882352,
1162
+ "loss": 0.8324,
1163
+ "step": 2980
1164
+ },
1165
+ {
1166
+ "epoch": 32.96,
1167
+ "learning_rate": 0.00015215686274509804,
1168
+ "loss": 0.8491,
1169
+ "step": 3000
1170
+ },
1171
+ {
1172
+ "epoch": 32.96,
1173
+ "eval_loss": 0.1594749242067337,
1174
+ "eval_runtime": 191.4631,
1175
+ "eval_samples_per_second": 25.295,
1176
+ "eval_steps_per_second": 0.794,
1177
+ "eval_wer": 0.1401362475163213,
1178
+ "step": 3000
1179
  }
1180
  ],
1181
  "max_steps": 4550,
1182
  "num_train_epochs": 50,
1183
+ "total_flos": 4.636386357187625e+19,
1184
  "trial_name": null,
1185
  "trial_params": null
1186
  }
{checkpoint-2700 → checkpoint-3000}/training_args.bin RENAMED
File without changes