Training in progress, step 500

Files changed (14) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "cedpsam/EleutherAI_gpt-neo-125M-stablediffionprompts",
   "activation_function": "gelu_new",
   "architectures": [
     "GPTNeoForCausalLM"

 {
+  "_name_or_path": "../input/gptneo125mstablediffionprompts/cedpsam/EleutherAI_gpt-neo-125M-stablediffionprompts/checkpoint-72000",
   "activation_function": "gelu_new",
   "architectures": [
     "GPTNeoForCausalLM"

last-checkpoint/config.json ADDED Viewed

+{
+  "_name_or_path": "../input/gptneo125mstablediffionprompts/cedpsam/EleutherAI_gpt-neo-125M-stablediffionprompts/checkpoint-72000",
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPTNeoForCausalLM"
+  ],
+  "attention_dropout": 0,
+  "attention_layers": [
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local",
+    "global",
+    "local"
+  ],
+  "attention_types": [
+    [
+      [
+        "global",
+        "local"
+      ],
+      6
+    ]
+  ],
+  "bos_token_id": 50256,
+  "embed_dropout": 0,
+  "eos_token_id": 50256,
+  "gradient_checkpointing": false,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": null,
+  "layer_norm_epsilon": 1e-05,
+  "max_position_embeddings": 2048,
+  "model_type": "gpt_neo",
+  "num_heads": 12,
+  "num_layers": 12,
+  "resid_dropout": 0,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.20.1",
+  "use_cache": true,
+  "vocab_size": 50257,
+  "window_size": 256
+}

last-checkpoint/optimizer.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4179b0e43211d82c165ea0d5e46ac8abd782eb41ef2c86737f17d354c09a683d
+size 1001681601

last-checkpoint/pytorch_model.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:fdd180c9f3bad595ff28a8081094e34482ae60473cf3c7f3e8d9bbba4c2332c5
+size 551185105

last-checkpoint/rng_state.pth ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:674676e662eeb93778c2b153ffad13aa90b43355da1956ce0b1e01e72f48c8d7
+size 14503

last-checkpoint/scaler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ae53ce3102a174710937c6b72edc10e1eddb295c8c0083f6aef662649364830
+size 559

last-checkpoint/scheduler.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:51dbebb494d0e544faaecc887cfa1d4358344dc2a25186c474aa84b00c5b2075
+size 623

last-checkpoint/trainer_state.json ADDED Viewed

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 0.006782603977318972,
+  "global_step": 500,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.01,
+      "learning_rate": 4.9321739602268106e-05,
+      "loss": 0.0506,
+      "step": 500
+    }
+  ],
+  "max_steps": 73718,
+  "num_train_epochs": 1,
+  "total_flos": 524503851466752.0,
+  "trial_name": null,
+  "trial_params": null
+}

last-checkpoint/training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:76f7a5b9daaa07567ee5671e3963752e7d96c10b76d141e0d49b0ca332fe6348
+size 3567

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f597c6108bec0f76cd5628694bd977651b643867628598c8e1c36834427cf68d
 size 551185105

 version https://git-lfs.github.com/spec/v1
+oid sha256:fdd180c9f3bad595ff28a8081094e34482ae60473cf3c7f3e8d9bbba4c2332c5
 size 551185105

runs/Oct10_09-11-38_e244ff9c7972/1665393287.3311083/events.out.tfevents.1665393287.e244ff9c7972.24.1 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:29df6494538e25b39490464e84712d11af2069694dd3b1b3ea39ac2dc5df19dc
+size 5544

runs/Oct10_09-11-38_e244ff9c7972/1665393298.9343245/events.out.tfevents.1665393298.e244ff9c7972.24.2 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:5d084c97606d34abaa542878f054fb9f29fc9376bf2433e6dfacc179317aa199
+size 5544

runs/Oct10_09-11-38_e244ff9c7972/events.out.tfevents.1665393287.e244ff9c7972.24.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8d7431a292d663f67f5d821ac94a26e59819e05915a6524907171c27f8e68ed6
+size 8805

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2604f24317422d07fc69f9f19fa59901cfc6225e30dd189b891a4e45b43cb715
-size 3439

 version https://git-lfs.github.com/spec/v1
+oid sha256:76f7a5b9daaa07567ee5671e3963752e7d96c10b76d141e0d49b0ca332fe6348
+size 3567