Yapeng committed on
Commit
99015bb
1 Parent(s): 1b3527a

Training in progress, step 40

Browse files
fine-tune-whisper-streaming.ipynb CHANGED
@@ -886,8 +886,8 @@
886
  "\n",
887
  " <div>\n",
888
  " \n",
889
- " <progress value='10' max='100' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
890
- " [ 10/100 01:34 < 17:46, 0.08 it/s, Epoch 0.09/9223372036854775807]\n",
891
  " </div>\n",
892
  " <table border=\"1\" class=\"dataframe\">\n",
893
  " <thead>\n",
@@ -895,9 +895,28 @@
895
  " <th>Step</th>\n",
896
  " <th>Training Loss</th>\n",
897
  " <th>Validation Loss</th>\n",
 
898
  " </tr>\n",
899
  " </thead>\n",
900
  " <tbody>\n",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
901
  " </tbody>\n",
902
  "</table><p>"
903
  ],
@@ -907,6 +926,63 @@
907
  },
908
  "metadata": {},
909
  "output_type": "display_data"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
910
  }
911
  ],
912
  "source": [
 
886
  "\n",
887
  " <div>\n",
888
  " \n",
889
+ " <progress value='41' max='100' style='width:300px; height:20px; vertical-align: middle;'></progress>\n",
890
+ " [ 41/100 11:18 < 17:06, 0.06 it/s, Epoch 0.40/9223372036854775807]\n",
891
  " </div>\n",
892
  " <table border=\"1\" class=\"dataframe\">\n",
893
  " <thead>\n",
 
895
  " <th>Step</th>\n",
896
  " <th>Training Loss</th>\n",
897
  " <th>Validation Loss</th>\n",
898
+ " <th>Wer</th>\n",
899
  " </tr>\n",
900
  " </thead>\n",
901
  " <tbody>\n",
902
+ " <tr>\n",
903
+ " <td>10</td>\n",
904
+ " <td>0.444000</td>\n",
905
+ " <td>0.713627</td>\n",
906
+ " <td>51.181102</td>\n",
907
+ " </tr>\n",
908
+ " <tr>\n",
909
+ " <td>20</td>\n",
910
+ " <td>0.499800</td>\n",
911
+ " <td>0.709538</td>\n",
912
+ " <td>55.380577</td>\n",
913
+ " </tr>\n",
914
+ " <tr>\n",
915
+ " <td>30</td>\n",
916
+ " <td>0.432000</td>\n",
917
+ " <td>0.702946</td>\n",
918
+ " <td>51.443570</td>\n",
919
+ " </tr>\n",
920
  " </tbody>\n",
921
  "</table><p>"
922
  ],
 
926
  },
927
  "metadata": {},
928
  "output_type": "display_data"
929
+ },
930
+ {
931
+ "name": "stderr",
932
+ "output_type": "stream",
933
+ "text": [
934
+ "***** Running Evaluation *****\n",
935
+ " Num examples: Unknown\n",
936
+ " Batch size = 32\n",
937
+ "Reading metadata...: 8693it [00:01, 7728.48it/s]\n",
938
+ "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
939
+ "Saving model checkpoint to ./checkpoint-10\n",
940
+ "Configuration saved in ./checkpoint-10/config.json\n",
941
+ "Model weights saved in ./checkpoint-10/pytorch_model.bin\n",
942
+ "Feature extractor saved in ./checkpoint-10/preprocessor_config.json\n",
943
+ "tokenizer config file saved in ./checkpoint-10/tokenizer_config.json\n",
944
+ "Special tokens file saved in ./checkpoint-10/special_tokens_map.json\n",
945
+ "added tokens file saved in ./checkpoint-10/added_tokens.json\n",
946
+ "Feature extractor saved in ./preprocessor_config.json\n",
947
+ "tokenizer config file saved in ./tokenizer_config.json\n",
948
+ "Special tokens file saved in ./special_tokens_map.json\n",
949
+ "added tokens file saved in ./added_tokens.json\n",
950
+ "/opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.\n",
951
+ " warnings.warn('Was asked to gather along dimension 0, but all '\n",
952
+ "***** Running Evaluation *****\n",
953
+ " Num examples: Unknown\n",
954
+ " Batch size = 32\n",
955
+ "Reading metadata...: 8693it [00:02, 3799.36it/s]\n",
956
+ "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
957
+ "Saving model checkpoint to ./checkpoint-20\n",
958
+ "Configuration saved in ./checkpoint-20/config.json\n",
959
+ "Model weights saved in ./checkpoint-20/pytorch_model.bin\n",
960
+ "Feature extractor saved in ./checkpoint-20/preprocessor_config.json\n",
961
+ "tokenizer config file saved in ./checkpoint-20/tokenizer_config.json\n",
962
+ "Special tokens file saved in ./checkpoint-20/special_tokens_map.json\n",
963
+ "added tokens file saved in ./checkpoint-20/added_tokens.json\n",
964
+ "/opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.\n",
965
+ " warnings.warn('Was asked to gather along dimension 0, but all '\n",
966
+ "***** Running Evaluation *****\n",
967
+ " Num examples: Unknown\n",
968
+ " Batch size = 32\n",
969
+ "Reading metadata...: 8693it [00:02, 3860.16it/s]\n",
970
+ "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n",
971
+ "Saving model checkpoint to ./checkpoint-30\n",
972
+ "Configuration saved in ./checkpoint-30/config.json\n",
973
+ "Model weights saved in ./checkpoint-30/pytorch_model.bin\n",
974
+ "Feature extractor saved in ./checkpoint-30/preprocessor_config.json\n",
975
+ "tokenizer config file saved in ./checkpoint-30/tokenizer_config.json\n",
976
+ "Special tokens file saved in ./checkpoint-30/special_tokens_map.json\n",
977
+ "added tokens file saved in ./checkpoint-30/added_tokens.json\n",
978
+ "/opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.\n",
979
+ " warnings.warn('Was asked to gather along dimension 0, but all '\n",
980
+ "***** Running Evaluation *****\n",
981
+ " Num examples: Unknown\n",
982
+ " Batch size = 32\n",
983
+ "Reading metadata...: 8693it [00:01, 7522.25it/s]\n",
984
+ "The following columns in the evaluation set don't have a corresponding argument in `WhisperForConditionalGeneration.forward` and have been ignored: input_length. If input_length are not expected by `WhisperForConditionalGeneration.forward`, you can safely ignore this message.\n"
985
+ ]
986
  }
987
  ],
988
  "source": [
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5388d3e1bdd849719f7950acca9a4f4b0ed3d6bcefe52280b17066ef754487bd
3
  size 967099139
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c69fad5f642921054b5e7027fa173497fdef8d1aba46e2e10446850af9e20712
3
  size 967099139
runs/Dec06_02-49-42_04812eda968b/events.out.tfevents.1670295010.04812eda968b.1031606.3 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:17115becec12eccf3f1f12abd9d9a3d47a9d3ed2e9d5a6c34ad7747252d043e7
3
- size 6042
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3103049bb8468c9537f04bdc5ee6127b0d444fbd8812deac5ae27d6b1224f306
3
+ size 11598