JRHuy commited on
Commit
389e03f
1 Parent(s): e8d940c

Training in progress, step 4000

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:145802247f511f2db8a6588be1fa1b29d0b032879310d24beb32ffec60f6d996
3
  size 1934161157
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d2eeaa3e0dd9026beaf9e1275fc1de9ebf175e2cdcb2016072c06c0f3625fab9
3
  size 1934161157
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4da96b2ae6e5559d7f78e7908472ddf37a9adc97bc0dfa1983148ab68e5b3eb9
3
  size 967102729
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0529397fb768bff68c9e2f5a80dadfcde0b2f3be588cb77e11b29df524c2ac23
3
  size 967102729
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db1b5c1b07a03db7d365bf63cf3eae9ed5e22033102108fc6ba233d19973a74e
3
  size 14575
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb08efb4868a5313ffdecb076fda7bef23ca071e8b0db9ad3e0f977f931a25bb
3
  size 14575
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f375f0ec2d81d3bc0adbea21cfba80dd771ec303d1e16586405d497868a3b309
3
  size 627
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c05c5f02f34690b6cdc36257cc6f4b53027dee7ea004e5e07023153262401341
3
  size 627
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 17.98756798756799,
3
- "best_model_checkpoint": "./whisper-small-vivos/checkpoint-3000",
4
- "epoch": 4.11522633744856,
5
- "global_step": 3000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -756,11 +756,261 @@
756
  "eval_steps_per_second": 0.122,
757
  "eval_wer": 17.98756798756799,
758
  "step": 3000
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
759
  }
760
  ],
761
  "max_steps": 4000,
762
  "num_train_epochs": 6,
763
- "total_flos": 1.384748184895488e+19,
764
  "trial_name": null,
765
  "trial_params": null
766
  }
 
1
  {
2
+ "best_metric": 17.63791763791764,
3
+ "best_model_checkpoint": "./whisper-small-vivos/checkpoint-4000",
4
+ "epoch": 5.486968449931413,
5
+ "global_step": 4000,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
756
  "eval_steps_per_second": 0.122,
757
  "eval_wer": 17.98756798756799,
758
  "step": 3000
759
+ },
760
+ {
761
+ "epoch": 4.15,
762
+ "learning_rate": 1e-05,
763
+ "loss": 0.0289,
764
+ "step": 3025
765
+ },
766
+ {
767
+ "epoch": 4.18,
768
+ "learning_rate": 1e-05,
769
+ "loss": 0.0226,
770
+ "step": 3050
771
+ },
772
+ {
773
+ "epoch": 4.22,
774
+ "learning_rate": 1e-05,
775
+ "loss": 0.0204,
776
+ "step": 3075
777
+ },
778
+ {
779
+ "epoch": 4.25,
780
+ "learning_rate": 1e-05,
781
+ "loss": 0.0213,
782
+ "step": 3100
783
+ },
784
+ {
785
+ "epoch": 4.29,
786
+ "learning_rate": 1e-05,
787
+ "loss": 0.0223,
788
+ "step": 3125
789
+ },
790
+ {
791
+ "epoch": 4.32,
792
+ "learning_rate": 1e-05,
793
+ "loss": 0.0259,
794
+ "step": 3150
795
+ },
796
+ {
797
+ "epoch": 4.36,
798
+ "learning_rate": 1e-05,
799
+ "loss": 0.0207,
800
+ "step": 3175
801
+ },
802
+ {
803
+ "epoch": 4.39,
804
+ "learning_rate": 1e-05,
805
+ "loss": 0.0235,
806
+ "step": 3200
807
+ },
808
+ {
809
+ "epoch": 4.42,
810
+ "learning_rate": 1e-05,
811
+ "loss": 0.0216,
812
+ "step": 3225
813
+ },
814
+ {
815
+ "epoch": 4.46,
816
+ "learning_rate": 1e-05,
817
+ "loss": 0.0209,
818
+ "step": 3250
819
+ },
820
+ {
821
+ "epoch": 4.49,
822
+ "learning_rate": 1e-05,
823
+ "loss": 0.0233,
824
+ "step": 3275
825
+ },
826
+ {
827
+ "epoch": 4.53,
828
+ "learning_rate": 1e-05,
829
+ "loss": 0.028,
830
+ "step": 3300
831
+ },
832
+ {
833
+ "epoch": 4.56,
834
+ "learning_rate": 1e-05,
835
+ "loss": 0.0283,
836
+ "step": 3325
837
+ },
838
+ {
839
+ "epoch": 4.6,
840
+ "learning_rate": 1e-05,
841
+ "loss": 0.0256,
842
+ "step": 3350
843
+ },
844
+ {
845
+ "epoch": 4.63,
846
+ "learning_rate": 1e-05,
847
+ "loss": 0.0238,
848
+ "step": 3375
849
+ },
850
+ {
851
+ "epoch": 4.66,
852
+ "learning_rate": 1e-05,
853
+ "loss": 0.0255,
854
+ "step": 3400
855
+ },
856
+ {
857
+ "epoch": 4.7,
858
+ "learning_rate": 1e-05,
859
+ "loss": 0.0236,
860
+ "step": 3425
861
+ },
862
+ {
863
+ "epoch": 4.73,
864
+ "learning_rate": 1e-05,
865
+ "loss": 0.0244,
866
+ "step": 3450
867
+ },
868
+ {
869
+ "epoch": 4.77,
870
+ "learning_rate": 1e-05,
871
+ "loss": 0.0342,
872
+ "step": 3475
873
+ },
874
+ {
875
+ "epoch": 4.8,
876
+ "learning_rate": 1e-05,
877
+ "loss": 0.022,
878
+ "step": 3500
879
+ },
880
+ {
881
+ "epoch": 4.84,
882
+ "learning_rate": 1e-05,
883
+ "loss": 0.0231,
884
+ "step": 3525
885
+ },
886
+ {
887
+ "epoch": 4.87,
888
+ "learning_rate": 1e-05,
889
+ "loss": 0.024,
890
+ "step": 3550
891
+ },
892
+ {
893
+ "epoch": 4.9,
894
+ "learning_rate": 1e-05,
895
+ "loss": 0.0275,
896
+ "step": 3575
897
+ },
898
+ {
899
+ "epoch": 4.94,
900
+ "learning_rate": 1e-05,
901
+ "loss": 0.0264,
902
+ "step": 3600
903
+ },
904
+ {
905
+ "epoch": 4.97,
906
+ "learning_rate": 1e-05,
907
+ "loss": 0.0285,
908
+ "step": 3625
909
+ },
910
+ {
911
+ "epoch": 5.01,
912
+ "learning_rate": 1e-05,
913
+ "loss": 0.0199,
914
+ "step": 3650
915
+ },
916
+ {
917
+ "epoch": 5.04,
918
+ "learning_rate": 1e-05,
919
+ "loss": 0.0177,
920
+ "step": 3675
921
+ },
922
+ {
923
+ "epoch": 5.08,
924
+ "learning_rate": 1e-05,
925
+ "loss": 0.0154,
926
+ "step": 3700
927
+ },
928
+ {
929
+ "epoch": 5.11,
930
+ "learning_rate": 1e-05,
931
+ "loss": 0.0126,
932
+ "step": 3725
933
+ },
934
+ {
935
+ "epoch": 5.14,
936
+ "learning_rate": 1e-05,
937
+ "loss": 0.0118,
938
+ "step": 3750
939
+ },
940
+ {
941
+ "epoch": 5.18,
942
+ "learning_rate": 1e-05,
943
+ "loss": 0.0129,
944
+ "step": 3775
945
+ },
946
+ {
947
+ "epoch": 5.21,
948
+ "learning_rate": 1e-05,
949
+ "loss": 0.0141,
950
+ "step": 3800
951
+ },
952
+ {
953
+ "epoch": 5.25,
954
+ "learning_rate": 1e-05,
955
+ "loss": 0.0144,
956
+ "step": 3825
957
+ },
958
+ {
959
+ "epoch": 5.28,
960
+ "learning_rate": 1e-05,
961
+ "loss": 0.0135,
962
+ "step": 3850
963
+ },
964
+ {
965
+ "epoch": 5.32,
966
+ "learning_rate": 1e-05,
967
+ "loss": 0.0185,
968
+ "step": 3875
969
+ },
970
+ {
971
+ "epoch": 5.35,
972
+ "learning_rate": 1e-05,
973
+ "loss": 0.0137,
974
+ "step": 3900
975
+ },
976
+ {
977
+ "epoch": 5.38,
978
+ "learning_rate": 1e-05,
979
+ "loss": 0.0129,
980
+ "step": 3925
981
+ },
982
+ {
983
+ "epoch": 5.42,
984
+ "learning_rate": 1e-05,
985
+ "loss": 0.015,
986
+ "step": 3950
987
+ },
988
+ {
989
+ "epoch": 5.45,
990
+ "learning_rate": 1e-05,
991
+ "loss": 0.0128,
992
+ "step": 3975
993
+ },
994
+ {
995
+ "epoch": 5.49,
996
+ "learning_rate": 1e-05,
997
+ "loss": 0.0199,
998
+ "step": 4000
999
+ },
1000
+ {
1001
+ "epoch": 5.49,
1002
+ "eval_cer": 7.027554850324982,
1003
+ "eval_loss": 0.25804632902145386,
1004
+ "eval_runtime": 394.0647,
1005
+ "eval_samples_per_second": 1.929,
1006
+ "eval_steps_per_second": 0.122,
1007
+ "eval_wer": 17.63791763791764,
1008
+ "step": 4000
1009
  }
1010
  ],
1011
  "max_steps": 4000,
1012
  "num_train_epochs": 6,
1013
+ "total_flos": 1.84636939124736e+19,
1014
  "trial_name": null,
1015
  "trial_params": null
1016
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4da96b2ae6e5559d7f78e7908472ddf37a9adc97bc0dfa1983148ab68e5b3eb9
3
  size 967102729
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0529397fb768bff68c9e2f5a80dadfcde0b2f3be588cb77e11b29df524c2ac23
3
  size 967102729
runs/Aug20_17-07-13_713cba38a708/events.out.tfevents.1692551245.713cba38a708.95.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:667db5d350222a235eac237786b548d21eb5511ddfd0c40292cd8517321f5b71
3
- size 25764
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87cfbca740150fa86fac7e75b3663363867462c93653210ab71be000e23ad764
3
+ size 32409