Upload 3 files

Change version to submission 3.

Files changed (3)

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:124c6aae5f83a770d311fa14a81015a9679a57de6f0f012adbae414b8042fde6
+oid sha256:820cb1a44e5a3d0304ef31ea105fc140bcb2865dc4d257a030d7fea72e557668
 size 3785732668

train_args.json ADDED Viewed

+{
+  "output_dir": "../drive/MyDrive/NICE/model/0422_train_encoder",
+  "model_name_or_path": "../drive/MyDrive/NICE/model/cap_best/OFA-huge-caption",
+  "train_caption_file": "./data/train_caption.jsonl",
+  "train_image_file": "../drive/MyDrive/NICE/train_image.tsv",
+  "test_caption_file": null,
+  "test_image_file": null,
+  "freeze_encoder": false,
+  "freeze_word_embed": false,
+  "num_train_epochs": 30,
+  "max_steps": -1,
+  "per_device_train_batch_size": 12,
+  "per_device_eval_batch_size": 256,
+  "learning_rate": 5e-05,
+  "max_seq_length": 150,
+  "logging_steps": 5000,
+  "save_steps": 5000,
+  "save_total_limit": 2,
+  "lr_scheduler_type": "cosine",
+  "warmup_steps": 2000,
+  "warmup_ratio": 0,
+  "gradient_accumulation_steps": 1,
+  "optim": "adamw_torch",
+  "seed": 69,
+  "fp16": false,
+  "no_cuda": false,
+  "dataloader_num_workers": 8,
+  "save_strategy": "steps",
+  "weight_decay": 0,
+  "max_grad_norm": 1.0,
+  "remove_unused_columns": false
+}

trainer_state.json ADDED Viewed

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 30.0,
+  "global_step": 12510,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 11.99,
+      "learning_rate": 4.060393227846204e-05,
+      "loss": 0.7845,
+      "step": 5000
+    },
+    {
+      "epoch": 23.98,
+      "learning_rate": 6.712477093047967e-06,
+      "loss": 0.0208,
+      "step": 10000
+    },
+    {
+      "epoch": 30.0,
+      "step": 12510,
+      "total_flos": 1.1203460780602368e+17,
+      "train_loss": 0.32232193622848304,
+      "train_runtime": 17163.0194,
+      "train_samples_per_second": 8.74,
+      "train_steps_per_second": 0.729
+    }
+  ],
+  "max_steps": 12510,
+  "num_train_epochs": 30,
+  "total_flos": 1.1203460780602368e+17,
+  "trial_name": null,
+  "trial_params": null
+}