mkopecki committed on
Commit
57e34a0
1 Parent(s): 76e6fa7

End of training

Browse files
Files changed (1) hide show
  1. trainer_state.json +30 -9
trainer_state.json CHANGED
@@ -3,23 +3,44 @@
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
- "global_step": 30,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  {
12
  "epoch": 3.0,
13
- "step": 30,
14
- "total_flos": 388808857313280.0,
15
- "train_loss": 1.1855101267496744,
16
- "train_runtime": 71.2626,
17
- "train_samples_per_second": 0.421,
18
- "train_steps_per_second": 0.421
19
  }
20
  ],
21
  "logging_steps": 500,
22
- "max_steps": 30,
23
  "num_input_tokens_seen": 0,
24
  "num_train_epochs": 3,
25
  "save_steps": 500,
@@ -35,7 +56,7 @@
35
  "attributes": {}
36
  }
37
  },
38
- "total_flos": 388808857313280.0,
39
  "train_batch_size": 1,
40
  "trial_name": null,
41
  "trial_params": null
 
3
  "best_model_checkpoint": null,
4
  "epoch": 3.0,
5
  "eval_steps": 500,
6
+ "global_step": 1626,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
10
  "log_history": [
11
+ {
12
+ "epoch": 0.922509225092251,
13
+ "grad_norm": 0.6193047165870667,
14
+ "learning_rate": 3.4624846248462485e-05,
15
+ "loss": 0.5669,
16
+ "step": 500
17
+ },
18
+ {
19
+ "epoch": 1.8450184501845017,
20
+ "grad_norm": 0.5879950523376465,
21
+ "learning_rate": 1.924969249692497e-05,
22
+ "loss": 0.4066,
23
+ "step": 1000
24
+ },
25
+ {
26
+ "epoch": 2.767527675276753,
27
+ "grad_norm": 0.9034110307693481,
28
+ "learning_rate": 3.874538745387454e-06,
29
+ "loss": 0.3173,
30
+ "step": 1500
31
+ },
32
  {
33
  "epoch": 3.0,
34
+ "step": 1626,
35
+ "total_flos": 2.068561910815949e+16,
36
+ "train_loss": 0.41841167248189814,
37
+ "train_runtime": 3228.8428,
38
+ "train_samples_per_second": 0.504,
39
+ "train_steps_per_second": 0.504
40
  }
41
  ],
42
  "logging_steps": 500,
43
+ "max_steps": 1626,
44
  "num_input_tokens_seen": 0,
45
  "num_train_epochs": 3,
46
  "save_steps": 500,
 
56
  "attributes": {}
57
  }
58
  },
59
+ "total_flos": 2.068561910815949e+16,
60
  "train_batch_size": 1,
61
  "trial_name": null,
62
  "trial_params": null