patrickvonplaten committed on
Commit
86cf3fb
1 Parent(s): e930b89

Training in progress, step 1000

Browse files
Files changed (4) hide show
  1. pytorch_model.bin +1 -1
  2. run.sh +4 -4
  3. special_tokens_map.json +14 -0
  4. training_args.bin +1 -1
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dbb63e3ec06276762ed302328e57ea42d34ac46df79a439e6a05ec7d7e011a0
3
  size 1262181617
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91fd4dcfce53d762be8373c54aa64ff2d81527bb114096cb75dd78cfac04eac0
3
  size 1262181617
run.sh CHANGED
@@ -17,13 +17,13 @@ python -m torch.distributed.launch \
17
  --per_device_train_batch_size="32" \
18
  --per_device_eval_batch_size="32" \
19
  --gradient_accumulation_steps="1" \
20
- --learning_rate="5e-4" \
21
- --warmup_steps="500" \
22
  --evaluation_strategy="steps" \
23
  --text_column_name="text" \
24
  --min_duration_in_seconds="0.25" \
25
- --save_steps="500" \
26
- --eval_steps="500" \
27
  --logging_steps="1" \
28
  --layerdrop="0.0" \
29
  --length_column_name="input_length" \
 
17
  --per_device_train_batch_size="32" \
18
  --per_device_eval_batch_size="32" \
19
  --gradient_accumulation_steps="1" \
20
+ --learning_rate="1e-4" \
21
+ --warmup_steps="1000" \
22
  --evaluation_strategy="steps" \
23
  --text_column_name="text" \
24
  --min_duration_in_seconds="0.25" \
25
+ --save_steps="1000" \
26
+ --eval_steps="1000" \
27
  --logging_steps="1" \
28
  --layerdrop="0.0" \
29
  --length_column_name="input_length" \
special_tokens_map.json CHANGED
@@ -35,6 +35,20 @@
35
  "rstrip": false,
36
  "single_word": false
37
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
38
  {
39
  "content": "</s>",
40
  "lstrip": false,
 
35
  "rstrip": false,
36
  "single_word": false
37
  },
38
+ {
39
+ "content": "</s>",
40
+ "lstrip": false,
41
+ "normalized": true,
42
+ "rstrip": false,
43
+ "single_word": false
44
+ },
45
+ {
46
+ "content": "<s>",
47
+ "lstrip": false,
48
+ "normalized": true,
49
+ "rstrip": false,
50
+ "single_word": false
51
+ },
52
  {
53
  "content": "</s>",
54
  "lstrip": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6235f6f0beb8a3f9ad85c0feedc85239a9b86be9f1a69bfda8761e7879c8145f
3
  size 3311
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b377e92f931b83d528bdb20a32e0040738acc2ab5cf30fe22893b2cdc20f283b
3
  size 3311