versae committed on
Commit
bf8318a
1 Parent(s): 6645cd2

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
  "epoch": 1.0,
3
  "eval_loss": 0.27755075693130493,
4
- "eval_runtime": 384.9632,
5
  "eval_samples_per_second": 0.418,
6
  "eval_steps_per_second": 0.07,
7
  "eval_wer": 12.51522533495737,
8
- "train_loss": 0.6583859201431275,
9
- "train_runtime": 31239.5975,
10
- "train_samples_per_second": 1.921,
11
- "train_steps_per_second": 0.16
12
  }
 
1
  {
2
  "epoch": 1.0,
3
  "eval_loss": 0.27755075693130493,
4
+ "eval_runtime": 385.5995,
5
  "eval_samples_per_second": 0.418,
6
  "eval_steps_per_second": 0.07,
7
  "eval_wer": 12.51522533495737,
8
+ "train_loss": 0.00010507909137471822,
9
+ "train_runtime": 167.7323,
10
+ "train_samples_per_second": 357.713,
11
+ "train_steps_per_second": 29.809
12
  }
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 1.0,
3
  "eval_loss": 0.27755075693130493,
4
- "eval_runtime": 384.9632,
5
  "eval_samples_per_second": 0.418,
6
  "eval_steps_per_second": 0.07,
7
  "eval_wer": 12.51522533495737
 
1
  {
2
  "epoch": 1.0,
3
  "eval_loss": 0.27755075693130493,
4
+ "eval_runtime": 385.5995,
5
  "eval_samples_per_second": 0.418,
6
  "eval_steps_per_second": 0.07,
7
  "eval_wer": 12.51522533495737
runs/Dec10_21-10-13_dante/events.out.tfevents.1670703878.dante.3904631.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd8ce3059c2b75f54be418a4e22c49836ae752e23b2eb07db72e304fbd3626e
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "epoch": 1.0,
3
- "train_loss": 0.6583859201431275,
4
- "train_runtime": 31239.5975,
5
- "train_samples_per_second": 1.921,
6
- "train_steps_per_second": 0.16
7
  }
 
1
  {
2
  "epoch": 1.0,
3
+ "train_loss": 0.00010507909137471822,
4
+ "train_runtime": 167.7323,
5
+ "train_samples_per_second": 357.713,
6
+ "train_steps_per_second": 29.809
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 12.51522533495737,
3
  "best_model_checkpoint": "./checkpoint-5000",
4
- "epoch": 1.0,
5
- "global_step": 5000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -1254,17 +1254,17 @@
1254
  },
1255
  {
1256
  "epoch": 1.0,
1257
- "step": 5000,
1258
- "total_flos": 1.2739025557174354e+20,
1259
- "train_loss": 0.6583859201431275,
1260
- "train_runtime": 31239.5975,
1261
- "train_samples_per_second": 1.921,
1262
- "train_steps_per_second": 0.16
1263
  }
1264
  ],
1265
  "max_steps": 5000,
1266
  "num_train_epochs": 9223372036854775807,
1267
- "total_flos": 1.2739025557174354e+20,
1268
  "trial_name": null,
1269
  "trial_params": null
1270
  }
 
1
  {
2
  "best_metric": 12.51522533495737,
3
  "best_model_checkpoint": "./checkpoint-5000",
4
+ "epoch": 1.0002,
5
+ "global_step": 5001,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
1254
  },
1255
  {
1256
  "epoch": 1.0,
1257
+ "step": 5001,
1258
+ "total_flos": 1.2741573362483357e+20,
1259
+ "train_loss": 0.00010507909137471822,
1260
+ "train_runtime": 167.7323,
1261
+ "train_samples_per_second": 357.713,
1262
+ "train_steps_per_second": 29.809
1263
  }
1264
  ],
1265
  "max_steps": 5000,
1266
  "num_train_epochs": 9223372036854775807,
1267
+ "total_flos": 1.2741573362483357e+20,
1268
  "trial_name": null,
1269
  "trial_params": null
1270
  }