File size: 1,801 Bytes
5bb2226
 
 
 
 
 
 
 
 
 
 
 
4e3188d
5bb2226
 
 
 
0234203
4e3188d
5bb2226
 
 
 
0234203
4e3188d
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
4e3188d
 
5bb2226
 
 
 
 
4e3188d
5bb2226
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 0.07727975270479134,
  "global_step": 250,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.01,
      "learning_rate": 9.949107209404665e-05,
      "loss": 1.6279,
      "step": 20
    },
    {
      "epoch": 0.01,
      "learning_rate": 9.62558321769342e-05,
      "loss": 0.9748,
      "step": 40
    },
    {
      "epoch": 0.02,
      "learning_rate": 8.98317278228618e-05,
      "loss": 0.8434,
      "step": 60
    },
    {
      "epoch": 0.02,
      "learning_rate": 8.274303669726426e-05,
      "loss": 0.8162,
      "step": 80
    },
    {
      "epoch": 0.03,
      "learning_rate": 7.19444824755478e-05,
      "loss": 0.7719,
      "step": 100
    },
    {
      "epoch": 0.04,
      "learning_rate": 5.967492612770999e-05,
      "loss": 0.7687,
      "step": 120
    },
    {
      "epoch": 0.04,
      "learning_rate": 4.675683150061285e-05,
      "loss": 0.7753,
      "step": 140
    },
    {
      "epoch": 0.05,
      "learning_rate": 3.4056135837619074e-05,
      "loss": 0.7509,
      "step": 160
    },
    {
      "epoch": 0.06,
      "learning_rate": 2.2424203500786474e-05,
      "loss": 0.75,
      "step": 180
    },
    {
      "epoch": 0.06,
      "learning_rate": 1.2640756555442684e-05,
      "loss": 0.7337,
      "step": 200
    },
    {
      "epoch": 0.07,
      "learning_rate": 5.361607745106817e-06,
      "loss": 0.7484,
      "step": 220
    },
    {
      "epoch": 0.07,
      "learning_rate": 1.0746994666109234e-06,
      "loss": 0.7386,
      "step": 240
    }
  ],
  "max_steps": 250,
  "num_train_epochs": 1,
  "total_flos": 3.752851705482445e+16,
  "trial_name": null,
  "trial_params": null
}