File size: 2,409 Bytes
a998879
d39ed56
 
a998879
d39ed56
a998879
 
 
 
 
 
 
d39ed56
 
a998879
 
 
d39ed56
 
79ddf3d
 
 
d39ed56
a998879
 
 
 
d39ed56
 
a998879
 
 
d39ed56
 
79ddf3d
 
 
d39ed56
a998879
 
 
 
d39ed56
 
a998879
 
 
d39ed56
 
79ddf3d
 
 
d39ed56
a998879
 
 
 
d39ed56
 
a998879
 
 
d39ed56
 
79ddf3d
 
 
d39ed56
a998879
 
 
 
d39ed56
 
a998879
 
 
d39ed56
 
79ddf3d
 
 
d39ed56
a998879
 
 
d39ed56
a998879
d39ed56
79ddf3d
 
 
a998879
 
d39ed56
a998879
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
{
  "best_metric": 0.8968609865470851,
  "best_model_checkpoint": "models/fake-news-bert-base-spanish-wwm-cased/checkpoint-420",
  "epoch": 5.0,
  "global_step": 700,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "learning_rate": 1.6000000000000003e-05,
      "loss": 0.5098,
      "step": 140
    },
    {
      "epoch": 1.0,
      "eval_f1": 0.7340425531914895,
      "eval_loss": 0.49776777625083923,
      "eval_runtime": 7.5059,
      "eval_samples_per_second": 31.975,
      "eval_steps_per_second": 3.997,
      "step": 140
    },
    {
      "epoch": 2.0,
      "learning_rate": 1.2e-05,
      "loss": 0.2473,
      "step": 280
    },
    {
      "epoch": 2.0,
      "eval_f1": 0.8828828828828829,
      "eval_loss": 0.38877564668655396,
      "eval_runtime": 7.4929,
      "eval_samples_per_second": 32.03,
      "eval_steps_per_second": 4.004,
      "step": 280
    },
    {
      "epoch": 3.0,
      "learning_rate": 8.000000000000001e-06,
      "loss": 0.0908,
      "step": 420
    },
    {
      "epoch": 3.0,
      "eval_f1": 0.8968609865470851,
      "eval_loss": 0.44203802943229675,
      "eval_runtime": 7.4687,
      "eval_samples_per_second": 32.134,
      "eval_steps_per_second": 4.017,
      "step": 420
    },
    {
      "epoch": 4.0,
      "learning_rate": 4.000000000000001e-06,
      "loss": 0.0332,
      "step": 560
    },
    {
      "epoch": 4.0,
      "eval_f1": 0.8796296296296298,
      "eval_loss": 0.5603806376457214,
      "eval_runtime": 7.4592,
      "eval_samples_per_second": 32.175,
      "eval_steps_per_second": 4.022,
      "step": 560
    },
    {
      "epoch": 5.0,
      "learning_rate": 0.0,
      "loss": 0.0052,
      "step": 700
    },
    {
      "epoch": 5.0,
      "eval_f1": 0.8956521739130435,
      "eval_loss": 0.5154075622558594,
      "eval_runtime": 7.4542,
      "eval_samples_per_second": 32.197,
      "eval_steps_per_second": 4.025,
      "step": 700
    },
    {
      "epoch": 5.0,
      "step": 700,
      "total_flos": 1473421910016000.0,
      "train_loss": 0.17726608804294042,
      "train_runtime": 577.3687,
      "train_samples_per_second": 9.699,
      "train_steps_per_second": 1.212
    }
  ],
  "max_steps": 700,
  "num_train_epochs": 5,
  "total_flos": 1473421910016000.0,
  "trial_name": null,
  "trial_params": null
}