Training in progress, step 100

Files changed (6) hide show

config.json CHANGED Viewed

@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "princeton-nlp/Mistral-7B-Base-SFT-DPO",
   "architectures": [
     "MistralForCausalLM"
   ],
@@ -20,7 +20,7 @@
   "sliding_window": 4096,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.39.3",
   "use_cache": false,
   "vocab_size": 32000
 }

 {
+  "_name_or_path": "/mnt/bn/xuruijie-llm/checkpoints/simpo/round1",
   "architectures": [
     "MistralForCausalLM"
   ],
   "sliding_window": 4096,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
+  "transformers_version": "4.41.1",
   "use_cache": false,
   "vocab_size": 32000
 }

runs/Jun12_20-45-22_n136-082-130/events.out.tfevents.1718196590.n136-082-130.1146735.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:61b40d07be10216adf1275f96abfb22153562160ec5084a1a66fb44a926aa0b7
+size 5080

runs/Jun12_21-20-48_n136-082-130/events.out.tfevents.1718198468.n136-082-130.1162050.0 ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a4991fc07873bc093977d387d10378cd40e1e0e2c05f95f9d02362b13bd87e0
+size 12516

special_tokens_map.json CHANGED Viewed

@@ -13,7 +13,13 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": "</s>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

     "rstrip": false,
     "single_word": false
   },
+  "pad_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,

tokenizer.json CHANGED Viewed

@@ -134,6 +134,7 @@
     "end_of_word_suffix": null,
     "fuse_unk": true,
     "byte_fallback": true,
     "vocab": {
       "<unk>": 0,
       "<s>": 1,

     "end_of_word_suffix": null,
     "fuse_unk": true,
     "byte_fallback": true,
+    "ignore_merges": false,
     "vocab": {
       "<unk>": 0,
       "<s>": 1,

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:53e6d8a2a88e23d8c15c64bcbb88e5c1287466ea42275f3b80916cbe0058ac20
-size 6264

 version https://git-lfs.github.com/spec/v1
+oid sha256:b3c70facc10a0add57b3257c66a9ce0db4d390283c663cd0223999426592e397
+size 6456