jonathanagustin committed on
Commit
4548d44
1 Parent(s): a9eb5ca

Training in progress, step 1100

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:703662f67d3e9c690769d54fb804e87a29ff8bf79e3e8252b54853998eb7c3eb
3
  size 265493026
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6adc9954515c2a6c8270a1f55a43bdcd35c3c879a458287434024777b2c6983
3
  size 265493026
tokenizer.json CHANGED
@@ -3,13 +3,11 @@
3
  "truncation": {
4
  "direction": "Right",
5
  "max_length": 512,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
  },
9
  "padding": {
10
- "strategy": {
11
- "Fixed": 512
12
- },
13
  "direction": "Right",
14
  "pad_to_multiple_of": null,
15
  "pad_id": 0,
 
3
  "truncation": {
4
  "direction": "Right",
5
  "max_length": 512,
6
+ "strategy": "OnlySecond",
7
+ "stride": 128
8
  },
9
  "padding": {
10
+ "strategy": "BatchLongest",
 
 
11
  "direction": "Right",
12
  "pad_to_multiple_of": null,
13
  "pad_id": 0,
trainer_state.json CHANGED
@@ -153,16 +153,16 @@
153
  "step": 1020,
154
  "total_flos": 5.148633647651021e+16,
155
  "train_loss": 0.028946983113008386,
156
- "train_runtime": 26.811,
157
- "train_samples_per_second": 19470.051,
158
- "train_steps_per_second": 38.044
159
  },
160
  {
161
  "epoch": 4.0,
162
  "eval_loss": 1.3930128812789917,
163
- "eval_runtime": 8.3512,
164
- "eval_samples_per_second": 1433.204,
165
- "eval_steps_per_second": 11.256,
166
  "step": 1020
167
  }
168
  ],
 
153
  "step": 1020,
154
  "total_flos": 5.148633647651021e+16,
155
  "train_loss": 0.028946983113008386,
156
+ "train_runtime": 26.7355,
157
+ "train_samples_per_second": 19525.044,
158
+ "train_steps_per_second": 38.152
159
  },
160
  {
161
  "epoch": 4.0,
162
  "eval_loss": 1.3930128812789917,
163
+ "eval_runtime": 8.3016,
164
+ "eval_samples_per_second": 1441.77,
165
+ "eval_steps_per_second": 11.323,
166
  "step": 1020
167
  }
168
  ],
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57d8a461b292d1c7d936212be6c7619b9698a1a89d0479a510f55cfd2a15f38a
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3345a9daf4130375c7a09b812dbb5af19f7b2a07a23d3827bb495e8766983668
3
  size 4664