File size: 2,653 Bytes
04378e2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
{
  "best_metric": 0.7140781182094741,
  "best_model_checkpoint": "OUTPUT/xlm-roberta-base/FalseTrue-0/0/checkpoint-296",
  "epoch": 8.0,
  "global_step": 296,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_accuracy": 0.5641025900840759,
      "eval_f1": 0.4068936527952921,
      "eval_loss": 0.6925989985466003,
      "eval_runtime": 0.8159,
      "eval_samples_per_second": 334.599,
      "eval_steps_per_second": 42.897,
      "step": 37
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.5641025900840759,
      "eval_f1": 0.4068936527952921,
      "eval_loss": 0.7125938534736633,
      "eval_runtime": 0.8146,
      "eval_samples_per_second": 335.145,
      "eval_steps_per_second": 42.967,
      "step": 74
    },
    {
      "epoch": 3.0,
      "eval_accuracy": 0.5604395866394043,
      "eval_f1": 0.4052004333694475,
      "eval_loss": 0.7705000042915344,
      "eval_runtime": 0.8132,
      "eval_samples_per_second": 335.709,
      "eval_steps_per_second": 43.04,
      "step": 111
    },
    {
      "epoch": 4.0,
      "eval_accuracy": 0.7142857313156128,
      "eval_f1": 0.7028323699421966,
      "eval_loss": 0.8162457346916199,
      "eval_runtime": 0.814,
      "eval_samples_per_second": 335.389,
      "eval_steps_per_second": 42.999,
      "step": 148
    },
    {
      "epoch": 5.0,
      "eval_accuracy": 0.7069597244262695,
      "eval_f1": 0.6908952629291613,
      "eval_loss": 1.4020615816116333,
      "eval_runtime": 0.8166,
      "eval_samples_per_second": 334.305,
      "eval_steps_per_second": 42.86,
      "step": 185
    },
    {
      "epoch": 6.0,
      "eval_accuracy": 0.721611738204956,
      "eval_f1": 0.7063504997827033,
      "eval_loss": 1.4205191135406494,
      "eval_runtime": 0.8137,
      "eval_samples_per_second": 335.499,
      "eval_steps_per_second": 43.013,
      "step": 222
    },
    {
      "epoch": 7.0,
      "eval_accuracy": 0.7252747416496277,
      "eval_f1": 0.7118124041200964,
      "eval_loss": 1.5443077087402344,
      "eval_runtime": 0.8137,
      "eval_samples_per_second": 335.506,
      "eval_steps_per_second": 43.014,
      "step": 259
    },
    {
      "epoch": 8.0,
      "eval_accuracy": 0.7289377450942993,
      "eval_f1": 0.7140781182094741,
      "eval_loss": 1.6495815515518188,
      "eval_runtime": 0.8093,
      "eval_samples_per_second": 337.346,
      "eval_steps_per_second": 43.249,
      "step": 296
    }
  ],
  "max_steps": 333,
  "num_train_epochs": 9,
  "total_flos": 1988472400920576.0,
  "trial_name": null,
  "trial_params": null
}