End of training

Browse files

Files changed (6) hide show

README.md +41 -41
config.json +2 -2
model.safetensors +2 -2
runs/Mar11_14-39-47_MSI/events.out.tfevents.1710164392.MSI.11656.0 +3 -0
tokenizer.json +27 -25
training_args.bin +1 -1

README.md CHANGED Viewed

@@ -13,7 +13,7 @@ should probably proofread and complete it, then remove this comment. -->
 This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
 It achieves the following results on the evaluation set:
-- Loss: 0.9144
 ## Model description
@@ -44,46 +44,46 @@ The following hyperparameters were used during training:
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
-| 3.3969        | 1.0   | 6    | 2.7182          |
-| 2.3315        | 2.0   | 12   | 1.9518          |
-| 1.7958        | 3.0   | 18   | 1.6778          |
-| 1.6131        | 4.0   | 24   | 1.5845          |
-| 1.5584        | 5.0   | 30   | 1.5760          |
-| 1.548         | 6.0   | 36   | 1.5781          |
-| 1.5369        | 7.0   | 42   | 1.5516          |
-| 1.5412        | 8.0   | 48   | 1.6085          |
-| 1.5311        | 9.0   | 54   | 1.5398          |
-| 1.5435        | 10.0  | 60   | 1.5587          |
-| 1.5138        | 11.0  | 66   | 1.5452          |
-| 1.5192        | 12.0  | 72   | 1.5345          |
-| 1.4818        | 13.0  | 78   | 1.6037          |
-| 1.4935        | 14.0  | 84   | 1.5391          |
-| 1.4396        | 15.0  | 90   | 1.8690          |
-| 1.4801        | 16.0  | 96   | 1.4349          |
-| 1.4051        | 17.0  | 102  | 1.3765          |
-| 1.3563        | 18.0  | 108  | 1.3655          |
-| 1.3188        | 19.0  | 114  | 1.3211          |
-| 1.3023        | 20.0  | 120  | 1.2695          |
-| 1.259         | 21.0  | 126  | 1.2644          |
-| 1.2366        | 22.0  | 132  | 1.2287          |
-| 1.2252        | 23.0  | 138  | 1.1858          |
-| 1.2205        | 24.0  | 144  | 1.1587          |
-| 1.1593        | 25.0  | 150  | 1.1855          |
-| 1.1639        | 26.0  | 156  | 1.1943          |
-| 1.1617        | 27.0  | 162  | 1.1305          |
-| 1.1493        | 28.0  | 168  | 1.0901          |
-| 1.1031        | 29.0  | 174  | 1.0640          |
-| 1.0901        | 30.0  | 180  | 1.0242          |
-| 1.0582        | 31.0  | 186  | 1.0066          |
-| 1.0423        | 32.0  | 192  | 0.9996          |
-| 1.0239        | 33.0  | 198  | 0.9732          |
-| 1.0151        | 34.0  | 204  | 0.9871          |
-| 1.0452        | 35.0  | 210  | 0.9655          |
-| 1.009         | 36.0  | 216  | 0.9411          |
-| 0.9819        | 37.0  | 222  | 0.9342          |
-| 0.9773        | 38.0  | 228  | 0.9235          |
-| 0.9743        | 39.0  | 234  | 0.9175          |
-| 0.9722        | 40.0  | 240  | 0.9144          |
 ### Framework versions

 This model is a fine-tuned version of [](https://huggingface.co/) on the None dataset.
 It achieves the following results on the evaluation set:
+- Loss: 0.6087
 ## Model description
 | Training Loss | Epoch | Step | Validation Loss |
 |:-------------:|:-----:|:----:|:---------------:|
+| 3.3748        | 1.0   | 6    | 2.7546          |
+| 2.3666        | 2.0   | 12   | 2.0282          |
+| 1.8315        | 3.0   | 18   | 1.6880          |
+| 1.616         | 4.0   | 24   | 1.5382          |
+| 1.503         | 5.0   | 30   | 1.4603          |
+| 1.4344        | 6.0   | 36   | 1.4103          |
+| 1.3878        | 7.0   | 42   | 1.3806          |
+| 1.3418        | 8.0   | 48   | 1.2722          |
+| 1.2509        | 9.0   | 54   | 1.2194          |
+| 1.2581        | 10.0  | 60   | 1.2255          |
+| 1.2361        | 11.0  | 66   | 1.4183          |
+| 1.259         | 12.0  | 72   | 1.1575          |
+| 1.1246        | 13.0  | 78   | 1.1058          |
+| 1.0757        | 14.0  | 84   | 1.0496          |
+| 1.0499        | 15.0  | 90   | 1.0402          |
+| 0.9797        | 16.0  | 96   | 0.9715          |
+| 0.9347        | 17.0  | 102  | 0.9876          |
+| 0.9267        | 18.0  | 108  | 0.9119          |
+| 0.8861        | 19.0  | 114  | 0.9250          |
+| 0.9253        | 20.0  | 120  | 0.8471          |
+| 0.9204        | 21.0  | 126  | 0.8488          |
+| 0.8545        | 22.0  | 132  | 0.8404          |
+| 0.8283        | 23.0  | 138  | 0.7885          |
+| 0.7892        | 24.0  | 144  | 0.8518          |
+| 0.804         | 25.0  | 150  | 0.9104          |
+| 0.8278        | 26.0  | 156  | 0.7776          |
+| 0.7759        | 27.0  | 162  | 0.7776          |
+| 0.7388        | 28.0  | 168  | 0.7396          |
+| 0.7323        | 29.0  | 174  | 0.7238          |
+| 0.727         | 30.0  | 180  | 0.6978          |
+| 0.7104        | 31.0  | 186  | 0.6916          |
+| 0.6964        | 32.0  | 192  | 0.6704          |
+| 0.6797        | 33.0  | 198  | 0.6547          |
+| 0.661         | 34.0  | 204  | 0.6457          |
+| 0.6567        | 35.0  | 210  | 0.6497          |
+| 0.6494        | 36.0  | 216  | 0.6411          |
+| 0.6526        | 37.0  | 222  | 0.6314          |
+| 0.6379        | 38.0  | 228  | 0.6150          |
+| 0.6224        | 39.0  | 234  | 0.6093          |
+| 0.6231        | 40.0  | 240  | 0.6087          |
 ### Framework versions

config.json CHANGED Viewed

@@ -78,7 +78,7 @@
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
-    "vocab_size": 51
   },
   "decoder_start_token_id": 2,
   "encoder": {
@@ -157,7 +157,7 @@
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
-    "vocab_size": 51
   },
   "eos_token_id": 0,
   "is_encoder_decoder": true,

     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
+    "vocab_size": 52
   },
   "decoder_start_token_id": 2,
   "encoder": {
     "typical_p": 1.0,
     "use_bfloat16": false,
     "use_cache": true,
+    "vocab_size": 52
   },
   "eos_token_id": 0,
   "is_encoder_decoder": true,

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f024fc0d48f55ef44ccd78e8ff1076f4c625b8711bb014ed7c234337f0c6cad2
-size 31203500

 version https://git-lfs.github.com/spec/v1
+oid sha256:518691f2a4d764491e51310041d6488681fc1f56308e3dc613f0d19776354c8f
+size 31205552

runs/Mar11_14-39-47_MSI/events.out.tfevents.1710164392.MSI.11656.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:50401b29756c0e7e939a2e88415da556e1bef2f8dd6a7c52a45a8f87cdba4b8d
+size 28005

tokenizer.json CHANGED Viewed

@@ -112,77 +112,79 @@
       "7": 13,
       "8": 14,
       "9": 15,
-      "10": 16,
-      "99": 17,
       "11": 18,
       "98": 19,
       "97": 20,
       "12": 21,
-      "96": 22,
-      "13": 23,
       "95": 24,
       "14": 25,
-      "15": 26,
-      "94": 27,
-      "16": 28,
-      "93": 29,
       "17": 30,
       "92": 31,
-      "91": 32,
-      "18": 33,
-      "90": 34,
-      "19": 35,
       "20": 36,
       "89": 37,
       "21": 38,
       "88": 39,
       "87": 40,
       "22": 41,
-      "23": 42,
-      "86": 43,
       "24": 44,
       "85": 45,
       "25": 46,
       "84": 47,
-      "83": 48,
-      "26": 49,
-      "82": 50
     },
     "merges": [
-      "1 0",
       "9 9",
       "1 1",
       "9 8",
       "9 7",
       "1 2",
-      "9 6",
       "1 3",
       "9 5",
       "1 4",
-      "1 5",
       "9 4",
-      "1 6",
       "9 3",
       "1 7",
       "9 2",
-      "9 1",
       "1 8",
-      "9 0",
       "1 9",
       "2 0",
       "8 9",
       "2 1",
       "8 8",
       "8 7",
       "2 2",
-      "2 3",
       "8 6",
       "2 4",
       "8 5",
       "2 5",
       "8 4",
-      "8 3",
       "2 6",
       "8 2"
     ]
   }

       "7": 13,
       "8": 14,
       "9": 15,
+      "99": 16,
+      "10": 17,
       "11": 18,
       "98": 19,
       "97": 20,
       "12": 21,
+      "13": 22,
+      "96": 23,
       "95": 24,
       "14": 25,
+      "94": 26,
+      "15": 27,
+      "93": 28,
+      "16": 29,
       "17": 30,
       "92": 31,
+      "18": 32,
+      "91": 33,
+      "19": 34,
+      "90": 35,
       "20": 36,
       "89": 37,
       "21": 38,
       "88": 39,
       "87": 40,
       "22": 41,
+      "86": 42,
+      "23": 43,
       "24": 44,
       "85": 45,
       "25": 46,
       "84": 47,
+      "26": 48,
+      "83": 49,
+      "27": 50,
+      "82": 51
     },
     "merges": [
       "9 9",
+      "1 0",
       "1 1",
       "9 8",
       "9 7",
       "1 2",
       "1 3",
+      "9 6",
       "9 5",
       "1 4",
       "9 4",
+      "1 5",
       "9 3",
+      "1 6",
       "1 7",
       "9 2",
       "1 8",
+      "9 1",
       "1 9",
+      "9 0",
       "2 0",
       "8 9",
       "2 1",
       "8 8",
       "8 7",
       "2 2",
       "8 6",
+      "2 3",
       "2 4",
       "8 5",
       "2 5",
       "8 4",
       "2 6",
+      "8 3",
+      "2 7",
       "8 2"
     ]
   }

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3f75e54efb61940b1887367ab9401dfc1503f0cb31e8ddbd9f6b73ecbe867686
 size 5112

 version https://git-lfs.github.com/spec/v1
+oid sha256:ffb903b082f12ef3984019900e028e957ed048a41aee7d892b5f53d59456a24c
 size 5112