File size: 1,852 Bytes
eb76149
 
 
 
 
 
 
 
 
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
8319bb4
 
 
 
 
 
eb76149
 
 
8319bb4
 
 
 
eb76149
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
8319bb4
eb76149
8319bb4
eb76149
 
 
 
8319bb4
 
 
 
 
eb76149
 
 
 
8319bb4
 
 
eb76149
 
 
 
 
 
 
8319bb4
eb76149
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 683,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.29,
      "learning_rate": 3e-05,
      "loss": 1.574,
      "step": 100
    },
    {
      "epoch": 0.59,
      "learning_rate": 3e-05,
      "loss": 1.474,
      "step": 200
    },
    {
      "epoch": 0.88,
      "learning_rate": 3e-05,
      "loss": 1.4104,
      "step": 300
    },
    {
      "epoch": 1.0,
      "eval_accuracy": 0.4536923076923077,
      "eval_loss": 3.3574578762054443,
      "eval_runtime": 4.4299,
      "eval_samples_per_second": 112.869,
      "eval_steps_per_second": 14.221,
      "step": 341
    },
    {
      "epoch": 1.0,
      "eval_bleu": 0.08840557310176213,
      "eval_exact_match": 0.0,
      "eval_prefix_exact_match": 0.058,
      "step": 341
    },
    {
      "epoch": 1.17,
      "learning_rate": 3e-05,
      "loss": 1.3889,
      "step": 400
    },
    {
      "epoch": 1.46,
      "learning_rate": 3e-05,
      "loss": 1.387,
      "step": 500
    },
    {
      "epoch": 1.76,
      "learning_rate": 3e-05,
      "loss": 1.389,
      "step": 600
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.4543589743589744,
      "eval_loss": 3.4179794788360596,
      "eval_runtime": 4.1997,
      "eval_samples_per_second": 119.055,
      "eval_steps_per_second": 15.001,
      "step": 683
    },
    {
      "epoch": 2.0,
      "eval_bleu": 0.09820569565497561,
      "eval_exact_match": 0.0,
      "eval_prefix_exact_match": 0.056,
      "step": 683
    }
  ],
  "logging_steps": 100,
  "max_steps": 17050,
  "num_train_epochs": 50,
  "save_steps": 500,
  "total_flos": 1.3526659229967974e+17,
  "trial_name": null,
  "trial_params": null
}