ninagroot/GPT2-705Mtest

Files changed (6) hide show

README.md CHANGED Viewed

@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Loss: 3.5144
 ## Model description
@@ -48,9 +48,9 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 5.4376        | 0.99  | 45   | 4.6269          |
-| 3.5916        | 2.0   | 91   | 3.7375          |
-| 2.7508        | 2.97  | 135  | 3.5144          |
 ### Framework versions

 This model is a fine-tuned version of [an unspecified base model](https://huggingface.co/) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Loss: 3.3102
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 5.418         | 0.99  | 49   | 4.3687          |
+| 3.5953        | 2.0   | 99   | 3.6199          |
+| 2.516         | 2.97  | 147  | 3.3102          |
 ### Framework versions

config.json CHANGED Viewed

@@ -15,7 +15,7 @@
   "n_inner": null,
   "n_layer": 24,
   "n_positions": 256,
-  "pad_token_id": 50256,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.0,
   "scale_attn_by_inverse_layer_idx": false,
@@ -28,5 +28,5 @@
   "torch_dtype": "float32",
   "transformers_version": "4.39.1",
   "use_cache": true,
-  "vocab_size": 50257
 }

   "n_inner": null,
   "n_layer": 24,
   "n_positions": 256,
+  "pad_token_id": 0,
   "reorder_and_upcast_attn": false,
   "resid_pdrop": 0.0,
   "scale_attn_by_inverse_layer_idx": false,
   "torch_dtype": "float32",
   "transformers_version": "4.39.1",
   "use_cache": true,
+  "vocab_size": 32000
 }

generation_config.json CHANGED Viewed

@@ -2,6 +2,6 @@
   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
-  "pad_token_id": 50256,
   "transformers_version": "4.39.1"
 }

   "_from_model_config": true,
   "bos_token_id": 50256,
   "eos_token_id": 50256,
+  "pad_token_id": 0,
   "transformers_version": "4.39.1"
 }

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:edcdc2e8b934d6e5f57aec20c8665204d854e298d6bf9963a83ebea2ce4d8417
-size 3030220576

 version https://git-lfs.github.com/spec/v1
+oid sha256:43fc797fdeafe2a712b7042be287a3bfccaa8333d2040b7905a200a1f33955b7
+size 2918049568

runs/Apr10_10-47-27_gcn10.local.snellius.surf.nl/events.out.tfevents.1712738857.gcn10.local.snellius.surf.nl.241513.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:d5d027284527755fa9e1a8f26e6adeb836f5401804979b1ac9ce7d7907b38b3d
+size 7289

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:67652905ed07950025ae0f17f985e23ba59ec1ae0e4cf668a1d90b4c0fa93ff3
 size 4984

 version https://git-lfs.github.com/spec/v1
+oid sha256:c3d537fb716c983e38cc2bd8d5326c5cac4a21efff3a0a19129c0cf7eb13cf3f
 size 4984