File size: 2,758 Bytes
52d319d
 
 
74c4791
 
52d319d
 
 
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
 
74c4791
 
52d319d
 
 
 
74c4791
 
 
 
 
 
52d319d
 
 
74c4791
 
 
52d319d
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
{
  "best_metric": null,
  "best_model_checkpoint": null,
  "epoch": 48.379746835443036,
  "global_step": 1500,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 8.06,
      "learning_rate": 0.0005,
      "loss": 0.576,
      "step": 250
    },
    {
      "epoch": 8.06,
      "eval_cer": 0.050238462365976976,
      "eval_loss": 0.24107621610164642,
      "eval_runtime": 380.2463,
      "eval_samples_per_second": 19.111,
      "eval_steps_per_second": 2.391,
      "eval_wer": 0.23400590063956597,
      "step": 250
    },
    {
      "epoch": 16.13,
      "learning_rate": 0.001,
      "loss": 0.2564,
      "step": 500
    },
    {
      "epoch": 16.13,
      "eval_cer": 0.04923441029870549,
      "eval_loss": 0.23052524030208588,
      "eval_runtime": 267.8454,
      "eval_samples_per_second": 27.131,
      "eval_steps_per_second": 3.394,
      "eval_wer": 0.20967071263093282,
      "step": 500
    },
    {
      "epoch": 24.19,
      "learning_rate": 0.0007619047619047619,
      "loss": 0.2018,
      "step": 750
    },
    {
      "epoch": 24.19,
      "eval_cer": 0.04937458639900638,
      "eval_loss": 0.23705527186393738,
      "eval_runtime": 264.0504,
      "eval_samples_per_second": 27.521,
      "eval_steps_per_second": 3.443,
      "eval_wer": 0.20590855988753143,
      "step": 750
    },
    {
      "epoch": 32.25,
      "learning_rate": 0.0005238095238095238,
      "loss": 0.1549,
      "step": 1000
    },
    {
      "epoch": 32.25,
      "eval_cer": 0.04349696991429698,
      "eval_loss": 0.22975854575634003,
      "eval_runtime": 264.3572,
      "eval_samples_per_second": 27.489,
      "eval_steps_per_second": 3.439,
      "eval_wer": 0.18440488683840564,
      "step": 1000
    },
    {
      "epoch": 40.32,
      "learning_rate": 0.0002857142857142857,
      "loss": 0.1224,
      "step": 1250
    },
    {
      "epoch": 40.32,
      "eval_cer": 0.040729306910681745,
      "eval_loss": 0.22875599563121796,
      "eval_runtime": 265.748,
      "eval_samples_per_second": 27.345,
      "eval_steps_per_second": 3.421,
      "eval_wer": 0.1724650020790844,
      "step": 1250
    },
    {
      "epoch": 48.38,
      "learning_rate": 4.761904761904762e-05,
      "loss": 0.1004,
      "step": 1500
    },
    {
      "epoch": 48.38,
      "eval_cer": 0.03763565297613421,
      "eval_loss": 0.23267094790935516,
      "eval_runtime": 266.4102,
      "eval_samples_per_second": 27.277,
      "eval_steps_per_second": 3.412,
      "eval_wer": 0.16082212937845278,
      "step": 1500
    }
  ],
  "max_steps": 1550,
  "num_train_epochs": 50,
  "total_flos": 1.244071149131343e+20,
  "trial_name": null,
  "trial_params": null
}