File size: 1,860 Bytes
51ebc81
 
 
 
 
 
 
 
 
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
9713d73
 
 
 
 
 
51ebc81
 
 
9713d73
 
 
 
51ebc81
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
9713d73
51ebc81
9713d73
51ebc81
 
 
 
9713d73
 
 
 
 
51ebc81
 
 
 
9713d73
 
 
51ebc81
 
 
 
 
 
 
9713d73
51ebc81
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 2.0,
  "eval_steps": 500,
  "global_step": 683,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.29,
      "learning_rate": 0.0001,
      "loss": 1.4842,
      "step": 100
    },
    {
      "epoch": 0.59,
      "learning_rate": 0.0001,
      "loss": 1.4016,
      "step": 200
    },
    {
      "epoch": 0.88,
      "learning_rate": 0.0001,
      "loss": 1.3892,
      "step": 300
    },
    {
      "epoch": 1.0,
      "eval_accuracy": 0.4543589743589744,
      "eval_loss": 3.4055869579315186,
      "eval_runtime": 4.1688,
      "eval_samples_per_second": 119.938,
      "eval_steps_per_second": 15.112,
      "step": 341
    },
    {
      "epoch": 1.0,
      "eval_bleu": 0.09711501224106496,
      "eval_exact_match": 0.0,
      "eval_prefix_exact_match": 0.054,
      "step": 341
    },
    {
      "epoch": 1.17,
      "learning_rate": 0.0001,
      "loss": 1.3608,
      "step": 400
    },
    {
      "epoch": 1.46,
      "learning_rate": 0.0001,
      "loss": 1.3456,
      "step": 500
    },
    {
      "epoch": 1.76,
      "learning_rate": 0.0001,
      "loss": 1.3499,
      "step": 600
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.4576923076923077,
      "eval_loss": 3.453113317489624,
      "eval_runtime": 4.4031,
      "eval_samples_per_second": 113.556,
      "eval_steps_per_second": 14.308,
      "step": 683
    },
    {
      "epoch": 2.0,
      "eval_bleu": 0.1225593574040313,
      "eval_exact_match": 0.0,
      "eval_prefix_exact_match": 0.056,
      "step": 683
    }
  ],
  "logging_steps": 100,
  "max_steps": 17050,
  "num_train_epochs": 50,
  "save_steps": 500,
  "total_flos": 1.3526659229967974e+17,
  "trial_name": null,
  "trial_params": null
}