File size: 2,576 Bytes
b852d9b
e1974b7
 
 
 
b852d9b
 
 
 
 
 
8d52d2f
b852d9b
e1974b7
b852d9b
 
e1974b7
 
8d52d2f
 
b852d9b
 
 
8d52d2f
b852d9b
e1974b7
b852d9b
 
e1974b7
 
 
8d52d2f
b852d9b
 
 
e1974b7
b852d9b
e1974b7
b852d9b
 
e1974b7
 
 
8d52d2f
b852d9b
 
 
e1974b7
b852d9b
e1974b7
b852d9b
 
e1974b7
 
 
8d52d2f
b852d9b
 
e1974b7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b852d9b
 
e1974b7
 
 
b852d9b
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
{
  "best_metric": 0.026788420975208282,
  "best_model_checkpoint": "./roberta-large-condaqa-neg-tag-token-classifier/checkpoint-24",
  "epoch": 6.0,
  "global_step": 24,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.0,
      "eval_accuracy": 0.9587528418317636,
      "eval_f1": 0.0,
      "eval_loss": 0.15255515277385712,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 1.8569,
      "eval_samples_per_second": 66.777,
      "eval_steps_per_second": 2.154,
      "step": 4
    },
    {
      "epoch": 2.0,
      "eval_accuracy": 0.9587528418317636,
      "eval_f1": 0.0,
      "eval_loss": 0.0874876081943512,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 2.0477,
      "eval_samples_per_second": 60.555,
      "eval_steps_per_second": 1.953,
      "step": 8
    },
    {
      "epoch": 3.0,
      "eval_accuracy": 0.9876583306268268,
      "eval_f1": 0.0,
      "eval_loss": 0.03961525484919548,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 2.0055,
      "eval_samples_per_second": 61.83,
      "eval_steps_per_second": 1.995,
      "step": 12
    },
    {
      "epoch": 4.0,
      "eval_accuracy": 0.9899317960376746,
      "eval_f1": 0.0,
      "eval_loss": 0.03219746798276901,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 1.8577,
      "eval_samples_per_second": 66.749,
      "eval_steps_per_second": 2.153,
      "step": 16
    },
    {
      "epoch": 5.0,
      "eval_accuracy": 0.9905813575836311,
      "eval_f1": 0.0,
      "eval_loss": 0.026981903240084648,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 1.8937,
      "eval_samples_per_second": 65.479,
      "eval_steps_per_second": 2.112,
      "step": 20
    },
    {
      "epoch": 6.0,
      "eval_accuracy": 0.9899317960376746,
      "eval_f1": 0.0,
      "eval_loss": 0.026788420975208282,
      "eval_precision": 0.0,
      "eval_recall": 0.0,
      "eval_runtime": 1.8835,
      "eval_samples_per_second": 65.835,
      "eval_steps_per_second": 2.124,
      "step": 24
    },
    {
      "epoch": 6.0,
      "step": 24,
      "total_flos": 897265181578104.0,
      "train_loss": 0.13241314888000488,
      "train_runtime": 520.3829,
      "train_samples_per_second": 11.034,
      "train_steps_per_second": 0.046
    }
  ],
  "max_steps": 24,
  "num_train_epochs": 6,
  "total_flos": 897265181578104.0,
  "trial_name": null,
  "trial_params": null
}