deepdml committed on
Commit
3975fdd
1 Parent(s): 5cbc384

Training in progress, step 1000

Browse files
.ipynb_checkpoints/run-checkpoint.sh CHANGED
@@ -1,12 +1,12 @@
1
  python run_speech_recognition_seq2seq_streaming.py \
2
- --model_name_or_path="openai/whisper-medium" \
3
  --dataset_name="mozilla-foundation/common_voice_11_0" \
4
  --dataset_config_name="fr" \
5
  --language="french" \
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Medium Mixed-Spanish" \
9
- --max_steps="8000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
 
1
  python run_speech_recognition_seq2seq_streaming.py \
2
+ --model_name_or_path="deepdml/whisper-medium-mix-fr" \
3
  --dataset_name="mozilla-foundation/common_voice_11_0" \
4
  --dataset_config_name="fr" \
5
  --language="french" \
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Medium Mixed-Spanish" \
9
+ --max_steps="4000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-medium",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
 
1
  {
2
+ "_name_or_path": "deepdml/whisper-medium-mix-fr",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3e45d6fe48f68a8701aed760c77787594c85c9301cf263205c7f74a0c077d4e8
3
  size 3055754841
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f159574104c5b8f4bfb9206e5107730e5158340011275d63a01a97bb2b6d2f2
3
  size 3055754841
run.sh CHANGED
@@ -1,12 +1,12 @@
1
  python run_speech_recognition_seq2seq_streaming.py \
2
- --model_name_or_path="openai/whisper-medium" \
3
  --dataset_name="mozilla-foundation/common_voice_11_0" \
4
  --dataset_config_name="fr" \
5
  --language="french" \
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Medium Mixed-Spanish" \
9
- --max_steps="8000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
 
1
  python run_speech_recognition_seq2seq_streaming.py \
2
+ --model_name_or_path="deepdml/whisper-medium-mix-fr" \
3
  --dataset_name="mozilla-foundation/common_voice_11_0" \
4
  --dataset_config_name="fr" \
5
  --language="french" \
6
  --train_split_name="train+validation" \
7
  --eval_split_name="test" \
8
  --model_index_name="Whisper Medium Mixed-Spanish" \
9
+ --max_steps="4000" \
10
  --output_dir="./" \
11
  --per_device_train_batch_size="32" \
12
  --per_device_eval_batch_size="16" \
runs/Dec13_08-12-27_150-136-45-193/events.out.tfevents.1670919198.150-136-45-193.88987.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:daf387e2990aa32ba733717afa44c2968bd481ce06644468fea9aa38c1932fcb
3
- size 37244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf4bd9ec96721e9759b0d678f1fef7828945c1c926035999bf70729f356bef8c
3
+ size 43842
runs/Dec14_15-02-29_150-136-45-193/1671030209.7839215/events.out.tfevents.1671030209.150-136-45-193.1109857.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef9d163974c0f8866bac47f4da02bd79a6439bf9df93de4735271e5a3e8b14b
3
+ size 5870
runs/Dec14_15-02-29_150-136-45-193/events.out.tfevents.1671030209.150-136-45-193.1109857.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90b1b7e397151c54928e7cc187e7e31b839f65703f736d8db9db512162914f5d
3
+ size 10860
tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
- "name_or_path": "openai/whisper-medium",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
 
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
+ "name_or_path": "deepdml/whisper-medium-mix-fr",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5b11dd83a82f3e898ed68a1f2409f3f4fb73180191a66cc2e453b6b30c638149
3
  size 3579
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77ffad1564c201d1e9d9780ddc3840bec45b57a7ac0596feb2341f5c94e6cef0
3
  size 3579