File size: 2,247 Bytes
53fc0f2
579cd93
 
6b08339
148c01d
6b08339
53fc0f2
 
 
 
 
148c01d
 
cef001b
148c01d
 
 
 
cef001b
 
 
 
5abe211
5d65a7b
 
 
cef001b
 
5d65a7b
 
 
 
cef001b
 
 
 
5d65a7b
579cd93
 
 
 
 
 
 
 
 
 
 
 
 
 
e3d98d9
 
 
 
 
 
 
 
 
 
 
 
 
 
6b08339
 
 
 
 
 
 
 
 
 
 
 
 
 
4ea6138
 
 
 
 
 
 
 
 
53fc0f2
 
148c01d
6789a54
a353654
6789a54
148c01d
6b08339
a353654
53fc0f2
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
{
  "best_metric": 4.924107074737549,
  "best_model_checkpoint": "ner-bert-ingredients/checkpoint-20",
  "epoch": 50.0,
  "eval_steps": 10,
  "global_step": 50,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 10.0,
      "learning_rate": 4e-05,
      "loss": 0.0466,
      "step": 10
    },
    {
      "epoch": 10.0,
      "eval_loss": 4.74609375,
      "eval_runtime": 0.0189,
      "eval_samples_per_second": 52.922,
      "eval_steps_per_second": 52.922,
      "step": 10
    },
    {
      "epoch": 20.0,
      "learning_rate": 4e-05,
      "loss": 0.0213,
      "step": 20
    },
    {
      "epoch": 20.0,
      "eval_loss": 4.924107074737549,
      "eval_runtime": 0.0183,
      "eval_samples_per_second": 54.52,
      "eval_steps_per_second": 54.52,
      "step": 20
    },
    {
      "epoch": 30.0,
      "learning_rate": 3e-05,
      "loss": 0.01,
      "step": 30
    },
    {
      "epoch": 30.0,
      "eval_loss": 5.040736675262451,
      "eval_runtime": 0.0178,
      "eval_samples_per_second": 56.023,
      "eval_steps_per_second": 56.023,
      "step": 30
    },
    {
      "epoch": 40.0,
      "learning_rate": 2e-05,
      "loss": 0.0063,
      "step": 40
    },
    {
      "epoch": 40.0,
      "eval_loss": 5.1612725257873535,
      "eval_runtime": 0.0185,
      "eval_samples_per_second": 54.098,
      "eval_steps_per_second": 54.098,
      "step": 40
    },
    {
      "epoch": 50.0,
      "learning_rate": 4e-05,
      "loss": 0.0043,
      "step": 50
    },
    {
      "epoch": 50.0,
      "eval_loss": 5.35546875,
      "eval_runtime": 0.0182,
      "eval_samples_per_second": 55.091,
      "eval_steps_per_second": 55.091,
      "step": 50
    },
    {
      "epoch": 50.0,
      "step": 50,
      "total_flos": 32856154788600.0,
      "train_loss": 0.0008505997806787491,
      "train_runtime": 23.3473,
      "train_samples_per_second": 19.274,
      "train_steps_per_second": 2.142
    }
  ],
  "logging_steps": 10,
  "max_steps": 50,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 50,
  "save_steps": 10,
  "total_flos": 32856154788600.0,
  "train_batch_size": 16,
  "trial_name": null,
  "trial_params": null
}