File size: 2,655 Bytes
e30176f
1fd6c85
b7433e3
e30176f
 
 
 
 
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
1fd6c85
e30176f
1fd6c85
 
 
e30176f
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
{
  "best_metric": 0.7736625514403291,
  "best_model_checkpoint": "OS_OUT/harish/PT-UP-xlmR-FalseFalse-0_0_BEST/FalseFalse-0/2/checkpoint-40",
  "epoch": 8.0,
  "global_step": 40,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_accuracy": 0.6300366520881653,
      "eval_f1": 0.597609561752988,
      "eval_loss": 0.6447749137878418,
      "eval_runtime": 0.7675,
      "eval_samples_per_second": 355.702,
      "eval_steps_per_second": 45.603,
      "step": 5
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.6813187003135681,
      "eval_f1": 0.6200873362445415,
      "eval_loss": 0.5641180872917175,
      "eval_runtime": 0.7675,
      "eval_samples_per_second": 355.721,
      "eval_steps_per_second": 45.605,
      "step": 10
    },
    {
      "epoch": 3.0,
      "eval_accuracy": 0.7289377450942993,
      "eval_f1": 0.6372549019607843,
      "eval_loss": 0.5698391795158386,
      "eval_runtime": 0.7673,
      "eval_samples_per_second": 355.789,
      "eval_steps_per_second": 45.614,
      "step": 15
    },
    {
      "epoch": 4.0,
      "eval_accuracy": 0.7289377450942993,
      "eval_f1": 0.7153846153846154,
      "eval_loss": 0.5229743719100952,
      "eval_runtime": 0.7688,
      "eval_samples_per_second": 355.082,
      "eval_steps_per_second": 45.523,
      "step": 20
    },
    {
      "epoch": 5.0,
      "eval_accuracy": 0.7582417726516724,
      "eval_f1": 0.7421875,
      "eval_loss": 0.5236229300498962,
      "eval_runtime": 0.7675,
      "eval_samples_per_second": 355.716,
      "eval_steps_per_second": 45.605,
      "step": 25
    },
    {
      "epoch": 6.0,
      "eval_accuracy": 0.7655677795410156,
      "eval_f1": 0.719298245614035,
      "eval_loss": 0.5164700150489807,
      "eval_runtime": 0.7779,
      "eval_samples_per_second": 350.939,
      "eval_steps_per_second": 44.992,
      "step": 30
    },
    {
      "epoch": 7.0,
      "eval_accuracy": 0.791208803653717,
      "eval_f1": 0.7673469387755103,
      "eval_loss": 0.5138589143753052,
      "eval_runtime": 0.7778,
      "eval_samples_per_second": 350.983,
      "eval_steps_per_second": 44.998,
      "step": 35
    },
    {
      "epoch": 8.0,
      "eval_accuracy": 0.7985348105430603,
      "eval_f1": 0.7736625514403291,
      "eval_loss": 0.5282412767410278,
      "eval_runtime": 0.7588,
      "eval_samples_per_second": 359.786,
      "eval_steps_per_second": 46.126,
      "step": 40
    }
  ],
  "max_steps": 45,
  "num_train_epochs": 9,
  "total_flos": 82090649272320.0,
  "trial_name": null,
  "trial_params": null
}