File size: 2,308 Bytes
c349099
29518b8
 
b64b4c5
 
c349099
 
 
 
 
29518b8
c349099
29518b8
 
c349099
 
 
29518b8
 
 
 
 
c349099
 
 
29518b8
 
 
c349099
 
29518b8
 
 
 
 
 
c349099
 
29518b8
 
 
 
c349099
 
29518b8
 
 
 
 
 
c349099
 
29518b8
 
 
 
c349099
 
29518b8
 
 
 
 
 
c349099
 
29518b8
 
 
 
c349099
 
29518b8
 
 
 
 
 
b64b4c5
 
 
 
 
 
 
 
 
 
 
 
 
 
c349099
 
29518b8
 
b64b4c5
c349099
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 7.790923824959481,
  "global_step": 2400,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 1.3,
      "learning_rate": 0.00023999999999999998,
      "loss": 3.5498,
      "step": 400
    },
    {
      "epoch": 1.3,
      "eval_loss": 0.7558379173278809,
      "eval_runtime": 196.0447,
      "eval_samples_per_second": 10.156,
      "eval_wer": 0.7275141242937853,
      "step": 400
    },
    {
      "epoch": 2.6,
      "learning_rate": 0.000297029702970297,
      "loss": 0.735,
      "step": 800
    },
    {
      "epoch": 2.6,
      "eval_loss": 0.4254470467567444,
      "eval_runtime": 196.081,
      "eval_samples_per_second": 10.154,
      "eval_wer": 0.521412429378531,
      "step": 800
    },
    {
      "epoch": 3.89,
      "learning_rate": 0.00029306930693069307,
      "loss": 0.502,
      "step": 1200
    },
    {
      "epoch": 3.89,
      "eval_loss": 0.369031697511673,
      "eval_runtime": 193.173,
      "eval_samples_per_second": 10.307,
      "eval_wer": 0.46146892655367233,
      "step": 1200
    },
    {
      "epoch": 5.19,
      "learning_rate": 0.00028910891089108906,
      "loss": 0.4002,
      "step": 1600
    },
    {
      "epoch": 5.19,
      "eval_loss": 0.34798651933670044,
      "eval_runtime": 194.1431,
      "eval_samples_per_second": 10.255,
      "eval_wer": 0.4266666666666667,
      "step": 1600
    },
    {
      "epoch": 6.49,
      "learning_rate": 0.0002851485148514851,
      "loss": 0.3301,
      "step": 2000
    },
    {
      "epoch": 6.49,
      "eval_loss": 0.34466618299484253,
      "eval_runtime": 194.5915,
      "eval_samples_per_second": 10.232,
      "eval_wer": 0.41836158192090395,
      "step": 2000
    },
    {
      "epoch": 7.79,
      "learning_rate": 0.00028118811881188116,
      "loss": 0.2992,
      "step": 2400
    },
    {
      "epoch": 7.79,
      "eval_loss": 0.34237322211265564,
      "eval_runtime": 196.6598,
      "eval_samples_per_second": 10.124,
      "eval_wer": 0.40293785310734465,
      "step": 2400
    }
  ],
  "max_steps": 30800,
  "num_train_epochs": 100,
  "total_flos": 8.237450774585993e+18,
  "trial_name": null,
  "trial_params": null
}