p4b committed on
Commit
5e33495
1 Parent(s): c390553

Training in progress, step 200

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "openai/whisper-large-v2",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
 
1
  {
2
+ "_name_or_path": "p4b/whisper-large-v2-lv",
3
  "activation_dropout": 0.0,
4
  "activation_function": "gelu",
5
  "architectures": [
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a115ff886475c9aeba1f4b5db24a576404bc496725b85ec2b92809ea3124e7a
3
- size 3086885937
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6221c007deae46a3c7638e49b86491a5170532af9fba7509175501769a069de0
3
+ size 3086785087
run2.sh ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ deepspeed run_speech_recognition_seq2seq_streaming.py \
2
+ --deepspeed="ds_config.json" \
3
+ --model_name_or_path="p4b/whisper-large-v2-lv" \
4
+ --dataset_name="mozilla-foundation/common_voice_11_0" \
5
+ --dataset_config_name="lv" \
6
+ --language="latvian" \
7
+ --train_split_name="train+validation" \
8
+ --eval_split_name="test" \
9
+ --model_index_name="Whisper Large-v2 Latvian" \
10
+ --max_steps="900" \
11
+ --output_dir="./" \
12
+ --per_device_train_batch_size="32" \
13
+ --gradient_accumulation_steps="2" \
14
+ --per_device_eval_batch_size="32" \
15
+ --logging_steps="25" \
16
+ --learning_rate="1e-7" \
17
+ --lr_scheduler_type="cosine" \
18
+ --warmup_steps="100" \
19
+ --evaluation_strategy="steps" \
20
+ --eval_steps="200" \
21
+ --save_strategy="steps" \
22
+ --save_steps="200" \
23
+ --generation_max_length="225" \
24
+ --length_column_name="input_length" \
25
+ --max_duration_in_seconds="30" \
26
+ --text_column_name="sentence" \
27
+ --freeze_feature_encoder="False" \
28
+ --freeze_encoder="False" \
29
+ --report_to="tensorboard" \
30
+ --metric_for_best_model="wer" \
31
+ --greater_is_better="False" \
32
+ --load_best_model_at_end \
33
+ --gradient_checkpointing \
34
+ --fp16 \
35
+ --overwrite_output_dir \
36
+ --do_train \
37
+ --do_eval \
38
+ --predict_with_generate \
39
+ --do_normalize_eval \
40
+ --use_auth_token \
41
+ --push_to_hub \
42
+ --torch_compile="True" \
43
+ --local_rank=0
runs/Dec19_09-23-32_nipa2022-65403/1671409649.396783/events.out.tfevents.1671409649.nipa2022-65403.20673.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb0f26a93ceec45a313b689d30a026934641ad8461251f435399821468811ee2
3
+ size 5884
runs/Dec19_09-23-32_nipa2022-65403/events.out.tfevents.1671409649.nipa2022-65403.20673.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8dcff521bf933ebe64d9cda1274dba46b3aff08f7a273c6b42eb014ae38dc8c
3
+ size 4286
runs/Dec19_09-48-52_nipa2022-65403/1671411014.4457693/events.out.tfevents.1671411014.nipa2022-65403.3427.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dcf44527ec2f968d95208ac8f04ab2a008abff1dbc03872258edd74f0b8bc603
3
+ size 5884
runs/Dec19_09-48-52_nipa2022-65403/events.out.tfevents.1671411014.nipa2022-65403.3427.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2fd3f4b4cee94f2651c27cee567818ed46a42cdedb1d770deb6c411f7ae53abf
3
+ size 5845
tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
- "name_or_path": "openai/whisper-large-v2",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
 
19
  },
20
  "errors": "replace",
21
  "model_max_length": 1024,
22
+ "name_or_path": "p4b/whisper-large-v2-lv",
23
  "pad_token": null,
24
  "processor_class": "WhisperProcessor",
25
  "return_attention_mask": false,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3799dc22368507dfe5fa8baa5ff4c56435981c120180031622d237adfa2f6550
3
  size 4411
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5515b192c2ca73529b118c5b04d885e8951cd2f2e0b013ca9552fad66d1fe844
3
  size 4411