Training in progress, step 1000
Browse files- ds_config.json +10 -8
- pytorch_model.bin +1 -1
- run.sh +1 -1
- runs/Dec20_12-59-04_129-146-176-120/events.out.tfevents.1671542011.129-146-176-120.680663.0 +2 -2
- runs/Dec20_17-12-10_129-146-176-120/1671557236.120787/events.out.tfevents.1671557236.129-146-176-120.1173831.1 +3 -0
- runs/Dec20_17-12-10_129-146-176-120/events.out.tfevents.1671557236.129-146-176-120.1173831.0 +3 -0
- training_args.bin +2 -2
ds_config.json
CHANGED
@@ -18,14 +18,16 @@
|
|
18 |
}
|
19 |
},
|
20 |
|
21 |
-
|
22 |
-
|
23 |
-
|
24 |
-
|
25 |
-
|
26 |
-
|
27 |
-
|
28 |
-
|
|
|
|
|
29 |
|
30 |
"zero_optimization": {
|
31 |
"stage": 2,
|
|
|
18 |
}
|
19 |
},
|
20 |
|
21 |
+
"scheduler": {
|
22 |
+
"type": "WarmupDecayLR",
|
23 |
+
"params": {
|
24 |
+
"last_batch_iteration": -1,
|
25 |
+
"total_num_steps": "auto",
|
26 |
+
"warmup_min_lr": "auto",
|
27 |
+
"warmup_max_lr": "auto",
|
28 |
+
"warmup_num_steps": "auto"
|
29 |
+
}
|
30 |
+
},
|
31 |
|
32 |
"zero_optimization": {
|
33 |
"stage": 2,
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 483536061
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66c65726b9d7262b98529730a55b1d37e92aafedea5486722aba0d97e4216171
|
3 |
size 483536061
|
run.sh
CHANGED
@@ -11,7 +11,7 @@ deepspeed run_speech_recognition_seq2seq_streaming-farsipal.py \
|
|
11 |
--torch_compile="True" \
|
12 |
--torch_compile_mode="reduce-overhead" \
|
13 |
--torch_compile_mode="max-autotune" \
|
14 |
-
--max_steps="
|
15 |
--output_dir="./" \
|
16 |
--per_device_train_batch_size="32" \
|
17 |
--gradient_accumulation_steps="1" \
|
|
|
11 |
--torch_compile="True" \
|
12 |
--torch_compile_mode="reduce-overhead" \
|
13 |
--torch_compile_mode="max-autotune" \
|
14 |
+
--max_steps="5000" \
|
15 |
--output_dir="./" \
|
16 |
--per_device_train_batch_size="32" \
|
17 |
--gradient_accumulation_steps="1" \
|
runs/Dec20_12-59-04_129-146-176-120/events.out.tfevents.1671542011.129-146-176-120.680663.0
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:43fcfbc982169b9c6eb2693bf7b43e6d0e4479fe2231d88d1b01991bc0ac2779
|
3 |
+
size 48588
|
runs/Dec20_17-12-10_129-146-176-120/1671557236.120787/events.out.tfevents.1671557236.129-146-176-120.1173831.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c58b0f30d76344d37ea230440b9eb5c6772543e5e75da63ce4f21659a56709f9
|
3 |
+
size 5893
|
runs/Dec20_17-12-10_129-146-176-120/events.out.tfevents.1671557236.129-146-176-120.1173831.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a3ff8c5d37804ce31968452140d31507b018a6068f914438dcace86df6f795d
|
3 |
+
size 10887
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:787167c636f3a936e53d4a21eb438c4ffab814c944cd2c0ae1aba0081a1e1f43
|
3 |
+
size 4731
|