juancopi81 committed on
Commit
a6140af
1 Parent(s): 7048a2d

Training in progress, step 100

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "juancopi81/whisper-medium-es-train-valid-bs-64",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
 
1
  {
2
+ "_name_or_path": "juancopi81/whisper-medium-es",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:619bd4c8a11c4fe601524a7c0beb23fb82404bd4aa82d1b0783a1aa0557034b3
3
  size 1527847357
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35e800d4522326115904b878c2c708d6b6ab3d9332c3bcf82017c8220a7db8ba
3
  size 1527847357
run.sh CHANGED
@@ -1,24 +1,24 @@
1
  deepspeed run_speech_recognition_seq2seq_streaming.py \
2
  --deepspeed="ds_config.json" \
3
- --model_name_or_path="juancopi81/whisper-medium-es-train-valid-bs-64" \
4
  --dataset_name="mozilla-foundation/common_voice_11_0" \
5
  --dataset_config_name="es" \
6
  --language="spanish" \
7
  --train_split_name="train+validation" \
8
  --eval_split_name="test" \
9
  --model_index_name="Whisper Small Spanish" \
10
- --max_steps="500" \
11
  --output_dir="./" \
12
  --per_device_train_batch_size="64" \
13
  --per_device_eval_batch_size="32" \
14
  --logging_steps="25" \
15
- --learning_rate="5e-7" \
16
- --warmup_steps="100" \
17
  --evaluation_strategy="steps" \
18
- --eval_steps="500" \
19
  --save_strategy="steps" \
20
- --save_steps="500" \
21
- --generation_max_length="225" \
22
  --length_column_name="input_length" \
23
  --max_duration_in_seconds="30" \
24
  --text_column_name="sentence" \
 
1
  deepspeed run_speech_recognition_seq2seq_streaming.py \
2
  --deepspeed="ds_config.json" \
3
+ --model_name_or_path="juancopi81/whisper-medium-es" \
4
  --dataset_name="mozilla-foundation/common_voice_11_0" \
5
  --dataset_config_name="es" \
6
  --language="spanish" \
7
  --train_split_name="train+validation" \
8
  --eval_split_name="test" \
9
  --model_index_name="Whisper Small Spanish" \
10
+ --max_steps="100" \
11
  --output_dir="./" \
12
  --per_device_train_batch_size="64" \
13
  --per_device_eval_batch_size="32" \
14
  --logging_steps="25" \
15
+ --learning_rate="3e-5" \
16
+ --warmup_steps="10" \
17
  --evaluation_strategy="steps" \
18
+ --eval_steps="100" \
19
  --save_strategy="steps" \
20
+ --save_steps="100" \
21
+ --generation_max_length="5" \
22
  --length_column_name="input_length" \
23
  --max_duration_in_seconds="30" \
24
  --text_column_name="sentence" \
runs/Dec16_21-53-30_132-145-140-45/1671227636.32413/events.out.tfevents.1671227636.132-145-140-45.989061.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a219b172a2b71d6fbc6cfbafa84f4b288a28e4e4115c5cf67b3f756bd21ea25
3
+ size 5880
runs/Dec16_21-53-30_132-145-140-45/events.out.tfevents.1671227636.132-145-140-45.989061.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d453887acd46dafa47a27f85d23408fe31afa5092146fef1edfd37f4d28480bf
3
+ size 5209
tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
- "name_or_path": "juancopi81/whisper-medium-es-train-valid-bs-64",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
 
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
+ "name_or_path": "juancopi81/whisper-medium-es",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:24d4aa81ef8f537670affe4d5b2c5869ac70b558e4107f25cdf01c52465bbe29
3
  size 4667
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a0cc955785ae0c566469a79ef4a6f8cab101e3beac5ec6c5745bd6ef17fc6a7
3
  size 4667