Joshua Lochner committed on
Commit
59eaa57
1 Parent(s): 9718ae1

Next training iteration (90k)

Browse files
added_tokens.json CHANGED
@@ -1 +1 @@
1
- {"END_SELFPROMO_TOKEN": 32115, "LONG_WORD_TOKEN": 32106, "END_INTERACTION_TOKEN": 32117, "EXTRACT_SEGMENTS: ": 32100, "BETWEEN_SEGMENTS_TOKEN": 32118, "PROFANITY_TOKEN": 32110, "NUMBER_PERCENTAGE_TOKEN": 32103, "[Laughter]": 32109, "SHORT_HYPHENATED_TOKEN": 32105, "[Music]": 32107, "[Applause]": 32108, "END_SPONSOR_TOKEN": 32113, "NO_SEGMENT_TOKEN": 32111, "HYPHENATED_URL_TOKEN": 32102, "START_SPONSOR_TOKEN": 32112, "URL_TOKEN": 32101, "START_SELFPROMO_TOKEN": 32114, "START_INTERACTION_TOKEN": 32116, "NUMBER_TOKEN": 32104}
 
1
+ {"SHORT_HYPHENATED_TOKEN": 32105, "END_SPONSOR_TOKEN": 32113, "EXTRACT_SEGMENTS: ": 32100, "[Music]": 32107, "NUMBER_PERCENTAGE_TOKEN": 32103, "LONG_WORD_TOKEN": 32106, "HYPHENATED_URL_TOKEN": 32102, "START_INTERACTION_TOKEN": 32116, "URL_TOKEN": 32101, "END_INTERACTION_TOKEN": 32117, "END_SELFPROMO_TOKEN": 32115, "NUMBER_TOKEN": 32104, "NO_SEGMENT_TOKEN": 32111, "PROFANITY_TOKEN": 32110, "BETWEEN_SEGMENTS_TOKEN": 32118, "START_SELFPROMO_TOKEN": 32114, "[Laughter]": 32109, "[Applause]": 32108, "START_SPONSOR_TOKEN": 32112}
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e73df4acf596669fc8bbc5025e78d667d77045e11a809f1f2e7f6638f868a82
3
  size 990383053
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71bb817c2eb93b2299b2db3e9a4fdf54230ad4f8af14493ca0539096676da785
3
  size 990383053
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8ebddd8d23b9d2745ef5ee1df068df17974bd5cfbdcfb208e5eeb559e7e4a61
3
  size 14503
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f5898f076f1662c347f647ca9305dacb1097aa523e328bb84cc7c4a92dda75a
3
  size 14503
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:863bc83c7e2bc3df963dc3b7cd76697e4379b39112e53c3aacbeab9768904dc4
3
  size 623
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2e5c883e4333a69700fe4d098d3261cf9eac2c32334388c85d05b1fa6f3a483
3
  size 623
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.08060226008737285,
5
- "global_step": 45000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -68,11 +68,65 @@
68
  "learning_rate": 4.596988699563136e-05,
69
  "loss": 0.1129,
70
  "step": 45000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
71
  }
72
  ],
73
  "max_steps": 558297,
74
  "num_train_epochs": 1,
75
- "total_flos": 4.439552157522432e+16,
76
  "trial_name": null,
77
  "trial_params": null
78
  }
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.1612045201747457,
5
+ "global_step": 90000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
68
  "learning_rate": 4.596988699563136e-05,
69
  "loss": 0.1129,
70
  "step": 45000
71
+ },
72
+ {
73
+ "epoch": 0.09,
74
+ "learning_rate": 4.5522096661812623e-05,
75
+ "loss": 0.1115,
76
+ "step": 50000
77
+ },
78
+ {
79
+ "epoch": 0.1,
80
+ "learning_rate": 4.5074306327993884e-05,
81
+ "loss": 0.1072,
82
+ "step": 55000
83
+ },
84
+ {
85
+ "epoch": 0.11,
86
+ "learning_rate": 4.4626515994175145e-05,
87
+ "loss": 0.1079,
88
+ "step": 60000
89
+ },
90
+ {
91
+ "epoch": 0.12,
92
+ "learning_rate": 4.4178725660356406e-05,
93
+ "loss": 0.3569,
94
+ "step": 65000
95
+ },
96
+ {
97
+ "epoch": 0.13,
98
+ "learning_rate": 4.3730935326537667e-05,
99
+ "loss": 0.1283,
100
+ "step": 70000
101
+ },
102
+ {
103
+ "epoch": 0.13,
104
+ "learning_rate": 4.3283144992718934e-05,
105
+ "loss": 0.1039,
106
+ "step": 75000
107
+ },
108
+ {
109
+ "epoch": 0.14,
110
+ "learning_rate": 4.2835354658900195e-05,
111
+ "loss": 0.0956,
112
+ "step": 80000
113
+ },
114
+ {
115
+ "epoch": 0.15,
116
+ "learning_rate": 4.2387564325081456e-05,
117
+ "loss": 0.0989,
118
+ "step": 85000
119
+ },
120
+ {
121
+ "epoch": 0.16,
122
+ "learning_rate": 4.1939773991262716e-05,
123
+ "loss": 0.0966,
124
+ "step": 90000
125
  }
126
  ],
127
  "max_steps": 558297,
128
  "num_train_epochs": 1,
129
+ "total_flos": 8.885642742554112e+16,
130
  "trial_name": null,
131
  "trial_params": null
132
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d88579f56375596872ffe40e72d85e293c40c8fa8ed74b8701b8ecc7002ec505
3
  size 3119
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da11e8af50c38dbf9430e2d7bbfab617719d848605add5ab7ec3aa4da77adca5
3
  size 3119