mikr committed on
Commit
6625ac7
1 Parent(s): 4d52663

Training in progress, step 1000

Browse files
config.json CHANGED
@@ -34,7 +34,7 @@
34
  "num_mel_bins": 80,
35
  "pad_token_id": 50257,
36
  "scale_embedding": false,
37
- "torch_dtype": "float16",
38
  "transformers_version": "4.26.0.dev0",
39
  "use_cache": false,
40
  "vocab_size": 51865
 
34
  "num_mel_bins": 80,
35
  "pad_token_id": 50257,
36
  "scale_embedding": false,
37
+ "torch_dtype": "float32",
38
  "transformers_version": "4.26.0.dev0",
39
  "use_cache": false,
40
  "vocab_size": 51865
ds_config.json DELETED
@@ -1,48 +0,0 @@
1
- {
2
- "fp16": {
3
- "enabled": "auto",
4
- "loss_scale": 0,
5
- "loss_scale_window": 1000,
6
- "initial_scale_power": 16,
7
- "hysteresis": 2,
8
- "min_loss_scale": 1
9
- },
10
-
11
- "optimizer": {
12
- "type": "AdamW",
13
- "params": {
14
- "lr": "auto",
15
- "betas": "auto",
16
- "eps": "auto",
17
- "weight_decay": "auto"
18
- }
19
- },
20
-
21
- "scheduler": {
22
- "type": "WarmupLR",
23
- "params": {
24
- "warmup_min_lr": "auto",
25
- "warmup_max_lr": "auto",
26
- "warmup_num_steps": "auto"
27
- }
28
- },
29
-
30
- "zero_optimization": {
31
- "stage": 2,
32
- "offload_optimizer": {
33
- "device": "cpu",
34
- "pin_memory": true
35
- },
36
- "allgather_partitions": true,
37
- "allgather_bucket_size": 2e8,
38
- "overlap_comm": true,
39
- "reduce_scatter": true,
40
- "reduce_bucket_size": 2e8,
41
- "contiguous_gradients": true
42
- },
43
-
44
- "gradient_accumulation_steps": "auto",
45
- "gradient_clipping": "auto",
46
- "train_batch_size": "auto",
47
- "train_micro_batch_size_per_gpu": "auto"
48
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:44089c5590ed9f7824ba2b1ac8971c4eeadc9e44a55ec419bcd2cdc006b7e181
3
- size 483536061
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6458db92153523ae195e1ef0a5db0a78375fc020947b974c8cfe7a8d123fd242
3
+ size 967102601
run.log CHANGED
The diff for this file is too large to render. See raw diff
 
run.sh CHANGED
@@ -1,5 +1,4 @@
1
- deepspeed run_speech_recognition_seq2seq_streaming.py \
2
- --deepspeed="ds_config.json" \
3
  --model_name_or_path="openai/whisper-small" \
4
  --dataset_name="facebook/voxpopuli" \
5
  --dataset_config_name="hr" \
 
1
+ python run_speech_recognition_seq2seq_streaming.py \
 
2
  --model_name_or_path="openai/whisper-small" \
3
  --dataset_name="facebook/voxpopuli" \
4
  --dataset_config_name="hr" \
runs/Dec14_16-16-20_129-146-123-136/events.out.tfevents.1671034661.129-146-123-136.70213.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f92a227fc60f30d6850b5e1e039264a67779ae38804018446c42be9b8405b88
3
- size 24058
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1be0e84061e5fa35dfeebb9f289d88cfad80f96b46cd10380118db6a9f8d84e6
3
+ size 28611
runs/Dec14_23-13-58_129-146-123-136/1671059651.4855802/events.out.tfevents.1671059651.129-146-123-136.104631.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:015fe417fdf705bf034ab36ff08bba1842db4e17e047850603232f6962e1a96d
3
+ size 5871
runs/Dec14_23-13-58_129-146-123-136/events.out.tfevents.1671059651.129-146-123-136.104631.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e789ae5098d6e35eea005b5d67a41d77d8d82744d121f62424b2631b04071568
3
+ size 10851
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4661efef1c7d1829413d2a909012154ff96d9155a348c80c9a204ac96b0688df
3
- size 4667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f800914ed7d0ecfdabd5f7c0dd570590eb7c219e403ef5c508f076fc18572f
3
+ size 3579