RikkiXu committed on
Commit
20d8790
1 Parent(s): 6c57b0d

Training in progress, step 1500

Browse files
config.json CHANGED
@@ -12,7 +12,6 @@
12
  "initializer_range": 0.02,
13
  "intermediate_size": 11008,
14
  "max_position_embeddings": 4096,
15
- "mlp_bias": false,
16
  "model_type": "llama",
17
  "num_attention_heads": 32,
18
  "num_hidden_layers": 30,
@@ -23,7 +22,7 @@
23
  "rope_theta": 10000.0,
24
  "tie_word_embeddings": false,
25
  "torch_dtype": "bfloat16",
26
- "transformers_version": "4.41.1",
27
  "use_cache": false,
28
  "vocab_size": 102400
29
  }
 
12
  "initializer_range": 0.02,
13
  "intermediate_size": 11008,
14
  "max_position_embeddings": 4096,
 
15
  "model_type": "llama",
16
  "num_attention_heads": 32,
17
  "num_hidden_layers": 30,
 
22
  "rope_theta": 10000.0,
23
  "tie_word_embeddings": false,
24
  "torch_dtype": "bfloat16",
25
+ "transformers_version": "4.39.3",
26
  "use_cache": false,
27
  "vocab_size": 102400
28
  }
runs/Jun20_15-28-21_n136-129-074/events.out.tfevents.1718869497.n136-129-074.3627432.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7112485347e57fb2af2a3a9c488f2bb0dce3736515a9ce3e11c14288011f46aa
3
- size 47125
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a9d1b6fe4e780e40a642033dd9757524e0c72fd0f8f18463841696003b718ee
3
+ size 68225
tokenizer.json CHANGED
@@ -266,7 +266,6 @@
266
  "end_of_word_suffix": null,
267
  "fuse_unk": false,
268
  "byte_fallback": false,
269
- "ignore_merges": false,
270
  "vocab": {
271
  "!": 0,
272
  "\"": 1,
 
266
  "end_of_word_suffix": null,
267
  "fuse_unk": false,
268
  "byte_fallback": false,
 
269
  "vocab": {
270
  "!": 0,
271
  "\"": 1,
tokenizer_config.json CHANGED
@@ -124,7 +124,7 @@
124
  }
125
  },
126
  "bos_token": "<|begin▁of▁sentence|>",
127
- "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ 'User: '+ message['content'] }}\n{% elif message['role'] == 'assistant' %}\n{{ 'Assistant: ' + message['content'] + eos_token }}{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ 'Assistant: ' }}{% endif %}\n{% endfor %}",
128
  "clean_up_tokenization_spaces": false,
129
  "eos_token": "<|end▁of▁sentence|>",
130
  "legacy": true,
 
124
  }
125
  },
126
  "bos_token": "<|begin▁of▁sentence|>",
127
+ "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ 'User: '+ message['content'] }}\n{% elif message['role'] == 'assistant' %}\n{{ 'Assistant: ' + message['content'] + eos_token }}{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ 'Assistant: ' }}{% endif %}\n{% endfor %}",
128
  "clean_up_tokenization_spaces": false,
129
  "eos_token": "<|end▁of▁sentence|>",
130
  "legacy": true,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e84c095d194defa97204cd8057f40e6752f407dff0412d8066415e65bde4fba
3
- size 6328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99c954413038ae54893068f1be5a172e843dda5a64dbec190fdf1dfe888eb5bd
3
+ size 6136