emilios committed on
Commit
bbb11e6
1 Parent(s): a714b51

Training in progress, step 1000

Browse files
ds_config.json CHANGED
@@ -18,14 +18,16 @@
18
  }
19
  },
20
 
21
- "scheduler": {
22
- "type": "WarmupLR",
23
- "params": {
24
- "warmup_min_lr": "auto",
25
- "warmup_max_lr": "auto",
26
- "warmup_num_steps": "auto"
27
- }
28
- },
 
 
29
 
30
  "zero_optimization": {
31
  "stage": 2,
 
18
  }
19
  },
20
 
21
+ "scheduler": {
22
+ "type": "WarmupDecayLR",
23
+ "params": {
24
+ "last_batch_iteration": -1,
25
+ "total_num_steps": "auto",
26
+ "warmup_min_lr": "auto",
27
+ "warmup_max_lr": "auto",
28
+ "warmup_num_steps": "auto"
29
+ }
30
+ },
31
 
32
  "zero_optimization": {
33
  "stage": 2,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c0f5ee3669a1e41af8da9db9fe9ae9130dc32a13e3ae28cd41aef89e280450d
3
  size 483536061
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66c65726b9d7262b98529730a55b1d37e92aafedea5486722aba0d97e4216171
3
  size 483536061
run.sh CHANGED
@@ -11,7 +11,7 @@ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
11
  --torch_compile="True" \
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
- --max_steps="20000" \
15
  --output_dir="./" \
16
  --per_device_train_batch_size="32" \
17
  --gradient_accumulation_steps="1" \
 
11
  --torch_compile="True" \
12
  --torch_compile_mode="reduce-overhead" \
13
  --torch_compile_mode="max-autotune" \
14
+ --max_steps="5000" \
15
  --output_dir="./" \
16
  --per_device_train_batch_size="32" \
17
  --gradient_accumulation_steps="1" \
runs/Dec20_12-59-04_129-146-176-120/events.out.tfevents.1671542011.129-146-176-120.680663.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20b6c09a11d60f3398e4b98c0406379babb3f2ead03f08f83b1353de1038c4a3
3
- size 43878
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43fcfbc982169b9c6eb2693bf7b43e6d0e4479fe2231d88d1b01991bc0ac2779
3
+ size 48588
runs/Dec20_17-12-10_129-146-176-120/1671557236.120787/events.out.tfevents.1671557236.129-146-176-120.1173831.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c58b0f30d76344d37ea230440b9eb5c6772543e5e75da63ce4f21659a56709f9
3
+ size 5893
runs/Dec20_17-12-10_129-146-176-120/events.out.tfevents.1671557236.129-146-176-120.1173831.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a3ff8c5d37804ce31968452140d31507b018a6068f914438dcace86df6f795d
3
+ size 10887
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d501de5f42040e906b7cddad2305bbf2fffbf7817fcdc2277b3a505956e81b7
3
- size 4667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:787167c636f3a936e53d4a21eb438c4ffab814c944cd2c0ae1aba0081a1e1f43
3
+ size 4731