chmanoj committed on
Commit
1ad5896
1 Parent(s): abc32c7

Training in progress, step 500

Browse files
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f955048c59e9e4047ed09b4c47e04f34abef271130f0124d9eb58bc873f91c55
3
  size 8637973773
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:428cd78ecc6d28a896b4ae26c7e9c5a235d077842b48747a6078f9440175197f
3
  size 8637973773
run_bnb.sh CHANGED
@@ -6,9 +6,9 @@ python run_speech_recognition_ctc_bnb.py \
6
  --output_dir="./" \
7
  --overwrite_output_dir \
8
  --num_train_epochs="150" \
9
- --per_device_train_batch_size="1" \
10
- --per_device_eval_batch_size="1" \
11
- --gradient_accumulation_steps="48" \
12
  --learning_rate="1e-6" \
13
  --warmup_steps="2000" \
14
  --length_column_name="input_length" \
 
6
  --output_dir="./" \
7
  --overwrite_output_dir \
8
  --num_train_epochs="150" \
9
+ --per_device_train_batch_size="4" \
10
+ --per_device_eval_batch_size="4" \
11
+ --gradient_accumulation_steps="12" \
12
  --learning_rate="1e-6" \
13
  --warmup_steps="2000" \
14
  --length_column_name="input_length" \
run_speech_recognition_ctc_bnb.py CHANGED
@@ -698,6 +698,7 @@ def main():
698
  ]
699
  optimizer = bnb.optim.Adam8bit(
700
  params=optimizer_grouped_parameters,
 
701
  betas=(training_args.adam_beta1, training_args.adam_beta2),
702
  eps=training_args.adam_epsilon,
703
  )
 
698
  ]
699
  optimizer = bnb.optim.Adam8bit(
700
  params=optimizer_grouped_parameters,
701
+ lr=training_args.learning_rate,
702
  betas=(training_args.adam_beta1, training_args.adam_beta2),
703
  eps=training_args.adam_epsilon,
704
  )
runs/Jan31_19-04-20_job-2043ddf5-d229-46f3-8808-c26e497d509b/1643656007.0408006/events.out.tfevents.1643656007.job-2043ddf5-d229-46f3-8808-c26e497d509b.574517.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19b17726d5fd4eb996777d0864421aa52c391a515c7c64bf66a7f55400d56ed9
3
+ size 4753
runs/Jan31_19-04-20_job-2043ddf5-d229-46f3-8808-c26e497d509b/events.out.tfevents.1643656007.job-2043ddf5-d229-46f3-8808-c26e497d509b.574517.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d2f453b108916e58e986333948e8aa11506ee8856f1a7e124a8105aafd2d85f
3
+ size 4680
runs/Jan31_19-09-35_job-2043ddf5-d229-46f3-8808-c26e497d509b/1643656313.5386918/events.out.tfevents.1643656313.job-2043ddf5-d229-46f3-8808-c26e497d509b.576732.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:149977fd83e8d846363014c92f04f2ce03392e3cf21087ec2bdc24264f2c253d
3
+ size 4753
runs/Jan31_19-09-35_job-2043ddf5-d229-46f3-8808-c26e497d509b/events.out.tfevents.1643656313.job-2043ddf5-d229-46f3-8808-c26e497d509b.576732.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c544cac7886eaa2ef2904ae9cf0a94e3f6b85d40af8c0153c15bdeb4c52cb28
3
+ size 12812
special_tokens_map.json CHANGED
@@ -1 +1 @@
1
- {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
 
1
+ {"bos_token": "<s>", "eos_token": "</s>", "unk_token": "[UNK]", "pad_token": "[PAD]", "additional_special_tokens": [{"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "<s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}, {"content": "</s>", "single_word": false, "lstrip": false, "rstrip": false, "normalized": true}]}
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3eb05246c3b8f398233525187f3e1378df4480944773dffe7ed37d96ccc4e4b
3
- size 3055
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8d2f4f0bcd677abf1431f17fe99eb16ecf98fc5d369730ce6ec691c318a1c27
3
+ size 2991