Training in progress epoch 0

Files changed (6)

README.md CHANGED

@@ -1,5 +1,6 @@
 ---
 license: mit
 tags:
 - generated_from_keras_callback
 model-index:
@@ -14,9 +15,9 @@ probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
-- Train Loss: 8.6853
-- Validation Loss: 8.9496
-- Epoch: 2
 ## Model description
@@ -42,14 +43,12 @@ The following hyperparameters were used during training:
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
-| 9.6532     | 9.6275          | 0     |
-| 9.1741     | 9.2580          | 1     |
-| 8.6853     | 8.9496          | 2     |
 ### Framework versions
-- Transformers 4.30.2
 - TensorFlow 2.12.0
-- Datasets 2.13.1
 - Tokenizers 0.13.3

 ---
 license: mit
+base_model: gpt2
 tags:
 - generated_from_keras_callback
 model-index:
 This model is a fine-tuned version of [gpt2](https://huggingface.co/gpt2) on an unknown dataset.
 It achieves the following results on the evaluation set:
+- Train Loss: 10.2980
+- Validation Loss: 9.9832
+- Epoch: 0
 ## Model description
 | Train Loss | Validation Loss | Epoch |
 |:----------:|:---------------:|:-----:|
+| 10.2980    | 9.9832          | 0     |
 ### Framework versions
+- Transformers 4.32.0
 - TensorFlow 2.12.0
+- Datasets 2.14.4
 - Tokenizers 0.13.3

config.json CHANGED

@@ -32,7 +32,7 @@
       "max_length": 50
     }
   },
-  "transformers_version": "4.30.2",
   "use_cache": true,
   "vocab_size": 44208
 }

       "max_length": 50
     }
   },
+  "transformers_version": "4.32.0",
   "use_cache": true,
   "vocab_size": 44208
 }

generation_config.json CHANGED

@@ -2,5 +2,5 @@
   "_from_model_config": true,
   "bos_token_id": 0,
   "eos_token_id": 0,
-  "transformers_version": "4.30.2"
 }

   "_from_model_config": true,
   "bos_token_id": 0,
   "eos_token_id": 0,
+  "transformers_version": "4.32.0"
 }

special_tokens_map.json CHANGED

@@ -13,6 +13,7 @@
     "rstrip": false,
     "single_word": false
   },
   "unk_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "<|endoftext|>",
   "unk_token": {
     "content": "<|endoftext|>",
     "lstrip": false,

tf_model.h5 CHANGED

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53f499ca66d7484ad0971e816dbd207e936440edd5ae90ffa11d4b04b8b04347
 size 479352912

 version https://git-lfs.github.com/spec/v1
+oid sha256:aede950a6297923209c9686a43a9308af149a4b1c88bab82c84ade98a6342879
 size 479352912

tokenizer.json CHANGED

@@ -1,6 +1,11 @@
 {
   "version": "1.0",
-  "truncation": null,
   "padding": null,
   "added_tokens": [
     {

 {
   "version": "1.0",
+  "truncation": {
+    "direction": "Right",
+    "max_length": 40,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
   "padding": null,
   "added_tokens": [
     {