End of training

Browse files

Files changed (6) hide show

README.md +41 -41
config.json +2 -2
model.safetensors +2 -2
runs/Mar04_10-14-38_4aecdba70411/events.out.tfevents.1709547278.4aecdba70411.306.1 +3 -0
tokenizer.json +17 -53
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.8108
 ## Model description
@@ -44,46 +44,46 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 3.3648        | 1.0   | 6    | 2.7465          |
-| 2.3708        | 2.0   | 12   | 2.0172          |
-| 1.8554        | 3.0   | 18   | 1.7507          |
-| 1.6599        | 4.0   | 24   | 1.6101          |
-| 1.5513        | 5.0   | 30   | 1.6004          |
-| 1.5494        | 6.0   | 36   | 1.5314          |
-| 1.5147        | 7.0   | 42   | 1.6012          |
-| 1.5361        | 8.0   | 48   | 1.9344          |
-| 1.5928        | 9.0   | 54   | 1.5257          |
-| 1.5114        | 10.0  | 60   | 1.5045          |
-| 1.457         | 11.0  | 66   | 1.4829          |
-| 1.4053        | 12.0  | 72   | 1.4635          |
-| 1.4049        | 13.0  | 78   | 1.4393          |
-| 1.4052        | 14.0  | 84   | 1.3878          |
-| 1.3437        | 15.0  | 90   | 1.3503          |
-| 1.3226        | 16.0  | 96   | 1.3059          |
-| 1.2817        | 17.0  | 102  | 1.2379          |
-| 1.2255        | 18.0  | 108  | 1.1771          |
-| 1.1717        | 19.0  | 114  | 1.2811          |
-| 1.2039        | 20.0  | 120  | 1.3512          |
-| 1.2312        | 21.0  | 126  | 1.2075          |
-| 1.1481        | 22.0  | 132  | 1.0787          |
-| 1.091         | 23.0  | 138  | 1.0809          |
-| 1.0598        | 24.0  | 144  | 1.0479          |
-| 1.0649        | 25.0  | 150  | 1.0148          |
-| 1.0172        | 26.0  | 156  | 1.0194          |
-| 1.0004        | 27.0  | 162  | 0.9618          |
-| 0.9639        | 28.0  | 168  | 0.9565          |
-| 0.9461        | 29.0  | 174  | 0.9197          |
-| 0.9112        | 30.0  | 180  | 0.9280          |
-| 0.9397        | 31.0  | 186  | 0.8850          |
-| 0.8829        | 32.0  | 192  | 0.8936          |
-| 0.8869        | 33.0  | 198  | 0.9086          |
-| 0.8956        | 34.0  | 204  | 0.8656          |
-| 0.8672        | 35.0  | 210  | 0.8579          |
-| 0.8427        | 36.0  | 216  | 0.8305          |
-| 0.8538        | 37.0  | 222  | 0.8312          |
-| 0.83          | 38.0  | 228  | 0.8179          |
-| 0.8411        | 39.0  | 234  | 0.8124          |
-| 0.8238        | 40.0  | 240  | 0.8108          |
 ### Framework versions

 This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.0047
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 2.7292        | 1.0   | 6    | 2.1173          |
+| 1.7871        | 2.0   | 12   | 1.3767          |
+| 1.1487        | 3.0   | 18   | 0.9345          |
+| 0.8396        | 4.0   | 24   | 0.8010          |
+| 0.741         | 5.0   | 30   | 0.6938          |
+| 0.617         | 6.0   | 36   | 0.6118          |
+| 0.5495        | 7.0   | 42   | 0.5396          |
+| 0.4991        | 8.0   | 48   | 0.4896          |
+| 0.4526        | 9.0   | 54   | 0.4333          |
+| 0.3899        | 10.0  | 60   | 0.3730          |
+| 0.331         | 11.0  | 66   | 0.3093          |
+| 0.2617        | 12.0  | 72   | 0.2348          |
+| 0.2112        | 13.0  | 78   | 0.1729          |
+| 0.1642        | 14.0  | 84   | 0.1352          |
+| 0.1285        | 15.0  | 90   | 0.1043          |
+| 0.1063        | 16.0  | 96   | 0.0811          |
+| 0.0806        | 17.0  | 102  | 0.0593          |
+| 0.0617        | 18.0  | 108  | 0.0429          |
+| 0.0519        | 19.0  | 114  | 0.0305          |
+| 0.0372        | 20.0  | 120  | 0.0230          |
+| 0.0323        | 21.0  | 126  | 0.0191          |
+| 0.0255        | 22.0  | 132  | 0.0152          |
+| 0.0219        | 23.0  | 138  | 0.0134          |
+| 0.0202        | 24.0  | 144  | 0.0118          |
+| 0.0161        | 25.0  | 150  | 0.0105          |
+| 0.0154        | 26.0  | 156  | 0.0087          |
+| 0.0126        | 27.0  | 162  | 0.0077          |
+| 0.0115        | 28.0  | 168  | 0.0069          |
+| 0.0104        | 29.0  | 174  | 0.0064          |
+| 0.0121        | 30.0  | 180  | 0.0061          |
+| 0.0113        | 31.0  | 186  | 0.0062          |
+| 0.0105        | 32.0  | 192  | 0.0059          |
+| 0.0103        | 33.0  | 198  | 0.0057          |
+| 0.0097        | 34.0  | 204  | 0.0052          |
+| 0.0088        | 35.0  | 210  | 0.0052          |
+| 0.0083        | 36.0  | 216  | 0.0050          |
+| 0.0086        | 37.0  | 222  | 0.0048          |
+| 0.0075        | 38.0  | 228  | 0.0048          |
+| 0.0075        | 39.0  | 234  | 0.0047          |
+| 0.0073        | 40.0  | 240  | 0.0047          |
 ### Framework versions

config.json CHANGED Viewed

@@ -78,7 +78,7 @@
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
-    "vocab_size": 52
   },
   "decoder_start_token_id": 2,
   "encoder": {
@@ -157,7 +157,7 @@
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
-    "vocab_size": 52
   },
   "eos_token_id": 0,
   "is_encoder_decoder": true,

     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
+    "vocab_size": 34
   },
   "decoder_start_token_id": 2,
   "encoder": {
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
+    "vocab_size": 34
   },
   "eos_token_id": 0,
   "is_encoder_decoder": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39ba38daef0694e4ee3d5f5eef9162864c41b88cf1ecd98994d9cf8d87ac4c77
-size 31205552

 version https://git-lfs.github.com/spec/v1
+oid sha256:91f0aad8570d108895a8690688662c0eb6282ec67aec2acd1ffb139eb660ab3c
+size 31168616

runs/Mar04_10-14-38_4aecdba70411/events.out.tfevents.1709547278.4aecdba70411.306.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4afeb7803097b9155009aad5867713813a97bf9e549969bf21eaf7ef6f415ff5
+size 27997

tokenizer.json CHANGED Viewed

@@ -116,76 +116,40 @@
       "99": 17,
       "98": 18,
       "11": 19,
-      "12": 20,
-      "97": 21,
-      "13": 22,
-      "96": 23,
       "14": 24,
-      "94": 25,
-      "95": 26,
       "15": 27,
-      "16": 28,
-      "93": 29,
-      "17": 30,
-      "92": 31,
       "18": 32,
-      "91": 33,
-      "90": 34,
-      "19": 35,
-      "89": 36,
-      "20": 37,
-      "21": 38,
-      "88": 39,
-      "87": 40,
-      "22": 41,
-      "23": 42,
-      "86": 43,
-      "85": 44,
-      "24": 45,
-      "25": 46,
-      "84": 47,
-      "83": 48,
-      "26": 49,
-      "27": 50,
-      "82": 51
     },
     "merges": [
       "1 0",
       "9 9",
       "9 8",
       "1 1",
-      "1 2",
       "9 7",
-      "1 3",
       "9 6",
       "1 4",
-      "9 4",
       "9 5",
       "1 5",
-      "1 6",
       "9 3",
-      "1 7",
       "9 2",
       "1 8",
-      "9 1",
-      "9 0",
-      "1 9",
-      "8 9",
-      "2 0",
-      "2 1",
-      "8 8",
-      "8 7",
-      "2 2",
-      "2 3",
-      "8 6",
-      "8 5",
-      "2 4",
-      "2 5",
-      "8 4",
-      "8 3",
-      "2 6",
-      "2 7",
-      "8 2"
     ]
   }
 }

       "99": 17,
       "98": 18,
       "11": 19,
+      "97": 20,
+      "12": 21,
+      "96": 22,
+      "13": 23,
       "14": 24,
+      "95": 25,
+      "94": 26,
       "15": 27,
+      "93": 28,
+      "16": 29,
+      "92": 30,
+      "17": 31,
       "18": 32,
+      "91": 33
     },
     "merges": [
       "1 0",
       "9 9",
       "9 8",
       "1 1",
       "9 7",
+      "1 2",
       "9 6",
+      "1 3",
       "1 4",
       "9 5",
+      "9 4",
       "1 5",
       "9 3",
+      "1 6",
       "9 2",
+      "1 7",
       "1 8",
+      "9 1"
     ]
   }
 }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c82b96d19238c510597b546ba69be7fcb3344cc82e22d34d4a2bc8153fdf4ad2
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:dcfbe883afc6dc2fd20c64e1776f58f3ea875a7100e49d1f84ecf94198ca77cb
 size 5112