Upload folder using huggingface_hub

Browse files

Files changed (6) hide show

config.json +1 -2
model.safetensors +1 -1
optimizer.pt +1 -1
rng_state.pth +1 -1
scheduler.pt +1 -1
trainer_state.json +89 -5

config.json CHANGED Viewed

@@ -15,8 +15,7 @@
   },
   "auto_map": {
     "AutoConfig": "ultravox_config.UltravoxConfig",
-    "AutoModel": "ultravox_model.UltravoxModel",
-    "AutoProcessor": "ultravox_processing.UltravoxProcessor"
   },
   "hidden_size": 4096,
   "ignore_index": -100,

   },
   "auto_map": {
     "AutoConfig": "ultravox_config.UltravoxConfig",
+    "AutoModel": "ultravox_model.UltravoxModel"
   },
   "hidden_size": 4096,
   "ignore_index": -100,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5778a5c6705a186dd32fd97354ac6fbfb6497b5713c6de8c0d33ac1ad36a0e6c
 size 93348824

 version https://git-lfs.github.com/spec/v1
+oid sha256:844a3876dbf4fb559dd52a63c6732fe1bbff100eff60b3cc3896f126d1ba187e
 size 93348824

optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff10ea684cccfd7292029ac84396a3366e25e9d587fff254649d097bc911c452
 size 186701138

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdf1123ba05cf5d672c5852f3320f551e8d1a087f05d2182f99b0921467a19d7
 size 186701138

rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:50406e2683fae845a67d2522407cfd71c13ce88867a1aac0dc9d26a8b3a5f840
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:ead2bf9cd84322800eb2f2fc4d4c95ffc6c4f969b8f6967eab4f40dffadb6428
 size 14244

scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2253610a716ca9b86b03ae4320fb93d4188a5a6ee3993619c4ddd1d0d004f2ae
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:7cccfc6f01ca6a15cf846ffdba9f6cd8d0e3d353032a1524b92b53154b87a0b1
 size 1064

trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.168458781362007,
   "eval_steps": 1000,
-  "global_step": 6000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -434,6 +434,90 @@
       "learning_rate": 0.00017923655879272394,
       "loss": 0.0743,
       "step": 6000
     }
   ],
   "logging_steps": 100,
@@ -445,15 +529,15 @@
     "TrainerControl": {
       "args": {
         "should_epoch_stop": false,
-        "should_evaluate": true,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 8.490208809019392e+16,
   "train_batch_size": 12,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.6021505376344085,
   "eval_steps": 1000,
+  "global_step": 7200,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00017923655879272394,
       "loss": 0.0743,
       "step": 6000
+    },
+    {
+      "epoch": 7.287933094384707,
+      "grad_norm": 0.06787109375,
+      "learning_rate": 0.00015135574250524898,
+      "loss": 0.076,
+      "step": 6100
+    },
+    {
+      "epoch": 7.407407407407407,
+      "grad_norm": 0.06201171875,
+      "learning_rate": 0.00012565338385541792,
+      "loss": 0.0736,
+      "step": 6200
+    },
+    {
+      "epoch": 7.526881720430108,
+      "grad_norm": 0.047607421875,
+      "learning_rate": 0.00010219546042925842,
+      "loss": 0.0728,
+      "step": 6300
+    },
+    {
+      "epoch": 7.646356033452808,
+      "grad_norm": 0.045654296875,
+      "learning_rate": 8.10421883797694e-05,
+      "loss": 0.0725,
+      "step": 6400
+    },
+    {
+      "epoch": 7.765830346475508,
+      "grad_norm": 0.05126953125,
+      "learning_rate": 6.22478678529197e-05,
+      "loss": 0.0717,
+      "step": 6500
+    },
+    {
+      "epoch": 7.885304659498208,
+      "grad_norm": 0.046875,
+      "learning_rate": 4.5860743599951184e-05,
+      "loss": 0.0726,
+      "step": 6600
+    },
+    {
+      "epoch": 1.004778972520908,
+      "grad_norm": 0.050048828125,
+      "learning_rate": 3.192288113379582e-05,
+      "loss": 0.0732,
+      "step": 6700
+    },
+    {
+      "epoch": 1.124253285543608,
+      "grad_norm": 0.0498046875,
+      "learning_rate": 2.0470058747505516e-05,
+      "loss": 0.0724,
+      "step": 6800
+    },
+    {
+      "epoch": 1.2437275985663083,
+      "grad_norm": 0.050537109375,
+      "learning_rate": 1.153167567188862e-05,
+      "loss": 0.0748,
+      "step": 6900
+    },
+    {
+      "epoch": 1.3632019115890084,
+      "grad_norm": 0.04443359375,
+      "learning_rate": 5.1306766081048454e-06,
+      "loss": 0.0745,
+      "step": 7000
+    },
+    {
+      "epoch": 1.4826762246117084,
+      "grad_norm": 0.050048828125,
+      "learning_rate": 1.2834928289472415e-06,
+      "loss": 0.0717,
+      "step": 7100
+    },
+    {
+      "epoch": 1.6021505376344085,
+      "grad_norm": 0.0458984375,
+      "learning_rate": 0.0,
+      "loss": 0.073,
+      "step": 7200
     }
   ],
   "logging_steps": 100,
     "TrainerControl": {
       "args": {
         "should_epoch_stop": false,
+        "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.018481533644288e+17,
   "train_batch_size": 12,
   "trial_name": null,
   "trial_params": null