File size: 1,377 Bytes
bc841eb
 
 
a320ff5
bc841eb
9e64091
bc841eb
 
 
 
 
 
fc2a210
a320ff5
bc841eb
 
fc2a210
 
 
a320ff5
fc2a210
 
 
 
 
a320ff5
fc2a210
 
 
 
 
a320ff5
fc2a210
 
 
 
 
a320ff5
fc2a210
 
bc841eb
a320ff5
fc2a210
a320ff5
bc841eb
 
 
a320ff5
9e64091
a320ff5
 
 
 
 
bc841eb
 
fc2a210
9e64091
bc841eb
 
 
a320ff5
bc841eb
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.0014344526845781992,
  "eval_steps": 500,
  "global_step": 100,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.0,
      "learning_rate": 2e-05,
      "loss": 0.0,
      "step": 1
    },
    {
      "epoch": 0.0,
      "learning_rate": 0.00019396926207859084,
      "loss": 0.0,
      "step": 20
    },
    {
      "epoch": 0.0,
      "learning_rate": 0.00015000000000000001,
      "loss": 0.0,
      "step": 40
    },
    {
      "epoch": 0.0,
      "learning_rate": 8.263518223330697e-05,
      "loss": 0.0,
      "step": 60
    },
    {
      "epoch": 0.0,
      "learning_rate": 2.339555568810221e-05,
      "loss": 0.0,
      "step": 80
    },
    {
      "epoch": 0.0,
      "learning_rate": 0.0,
      "loss": 0.0,
      "step": 100
    },
    {
      "epoch": 0.0,
      "step": 100,
      "total_flos": 1.768131718545408e+16,
      "train_loss": 0.0,
      "train_runtime": 501.823,
      "train_samples_per_second": 0.399,
      "train_steps_per_second": 0.199
    }
  ],
  "logging_steps": 20,
  "max_steps": 100,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 1,
  "save_steps": 100,
  "total_flos": 1.768131718545408e+16,
  "train_batch_size": 2,
  "trial_name": null,
  "trial_params": null
}