ivangtorre commited on
Commit
398d729
1 Parent(s): d35ad98

Add model files

Browse files

Files changed (4) hide show
  1. pytorch_model.bin +1 -1
  2. trainer_state.json +62 -13
  3. training_args.bin +1 -1
  4. vocab.json +1 -1
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:509588dea56f1c5e67678b30228db8d4070585445da2cfab49c13ee8fc134dc5
3
  size 1262055847
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f498b19aaef569775369986de505f60d65e506d0a2087c7f770127e9f1ab1b4
3
  size 1262055847
trainer_state.json CHANGED
@@ -1,30 +1,79 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 3.785894206549118,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
- "epoch": 3.79,
12
- "learning_rate": 0.00039436231366470835,
13
- "loss": 1.5121,
14
  "step": 500
15
  },
16
  {
17
- "epoch": 3.79,
18
- "eval_loss": 0.186998650431633,
19
- "eval_runtime": 714.138,
20
- "eval_samples_per_second": 7.242,
21
- "eval_wer": 0.39502654080485317,
22
  "step": 500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  }
24
  ],
25
- "max_steps": 6600,
26
- "num_train_epochs": 50,
27
- "total_flos": 7.843188479774457e+18,
28
  "trial_name": null,
29
  "trial_params": null
30
  }
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.998422712933754,
5
+ "global_step": 2110,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
9
  "log_history": [
10
  {
11
+ "epoch": 1.18,
12
+ "learning_rate": 0.0003470916966876807,
13
+ "loss": 1.587,
14
  "step": 500
15
  },
16
  {
17
+ "epoch": 1.18,
18
+ "eval_loss": 0.2940497398376465,
19
+ "eval_runtime": 783.4997,
20
+ "eval_samples_per_second": 6.601,
21
+ "eval_wer": 0.5440472766257878,
22
  "step": 500
23
+ },
24
+ {
25
+ "epoch": 2.37,
26
+ "learning_rate": 0.0002163596723446065,
27
+ "loss": 0.25,
28
+ "step": 1000
29
+ },
30
+ {
31
+ "epoch": 2.37,
32
+ "eval_loss": 0.20464767515659332,
33
+ "eval_runtime": 845.5317,
34
+ "eval_samples_per_second": 6.117,
35
+ "eval_wer": 0.4130690583897707,
36
+ "step": 1000
37
+ },
38
+ {
39
+ "epoch": 3.55,
40
+ "learning_rate": 7.697202293654628e-05,
41
+ "loss": 0.1538,
42
+ "step": 1500
43
+ },
44
+ {
45
+ "epoch": 3.55,
46
+ "eval_loss": 0.17199403047561646,
47
+ "eval_runtime": 847.1175,
48
+ "eval_samples_per_second": 6.105,
49
+ "eval_wer": 0.3628114949141019,
50
+ "step": 1500
51
+ },
52
+ {
53
+ "epoch": 4.74,
54
+ "learning_rate": 2.6763887922288233e-06,
55
+ "loss": 0.1143,
56
+ "step": 2000
57
+ },
58
+ {
59
+ "epoch": 4.74,
60
+ "eval_loss": 0.16164630651474,
61
+ "eval_runtime": 737.1973,
62
+ "eval_samples_per_second": 7.016,
63
+ "eval_wer": 0.3482467379651178,
64
+ "step": 2000
65
+ },
66
+ {
67
+ "epoch": 5.0,
68
+ "step": 2110,
69
+ "total_flos": 1.0309110757947716e+19,
70
+ "train_runtime": 14179.0923,
71
+ "train_samples_per_second": 0.149
72
  }
73
  ],
74
+ "max_steps": 2110,
75
+ "num_train_epochs": 5,
76
+ "total_flos": 1.0309110757947716e+19,
77
  "trial_name": null,
78
  "trial_params": null
79
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:38479a919eda7dd28d3ae5f9cab083881c8741ef35462dbc9ab73b870d8c6d48
3
  size 2287
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:474caa22f1c7f0c4e89880f0d02b07015187ad5c2b1a354e1f8340ea7bbd6181
3
  size 2287
vocab.json CHANGED
@@ -1 +1 @@
1
- {"m": 0, "d": 1, "c": 2, "l": 3, "b": 4, "i": 5, "y": 6, "w": 7, "k": 8, "n": 10, "\u00f1": 11, "o": 12, "a": 13, "x": 14, "z": 15, "u": 16, "r": 17, "q": 18, "h": 19, "t": 20, "g": 21, "p": 22, "v": 23, "e": 24, "j": 25, "f": 26, "s": 27, "\u00ed": 28, "|": 9, "[UNK]": 29, "[PAD]": 30}
1
+ {"r": 0, "w": 1, "e": 2, "a": 3, "b": 4, "p": 5, "m": 7, "x": 8, "q": 9, "d": 10, "g": 11, "h": 12, "f": 13, "í": 14, "v": 15, "c": 16, "ñ": 17, "i": 18, "t": 19, "y": 20, "n": 21, "z": 22, "o": 23, "l": 24, "s": 25, "k": 26, "j": 27, "u": 28, "|": 6, "[UNK]": 29, "[PAD]": 30}