stardust-coder committed on
Commit
551140b
1 Parent(s): c4ad639

Training in progress, step 84000

Browse files
Files changed (4) hide show
  1. config.json +1 -2
  2. model.safetensors +1 -1
  3. tokenizer.json +16 -7
  4. training_args.bin +2 -2
config.json CHANGED
@@ -16,7 +16,6 @@
16
  "initializer_range": 0.02,
17
  "intermediate_size": 1536,
18
  "max_position_embeddings": 1024,
19
- "mlp_bias": false,
20
  "model_type": "bit_llama",
21
  "n_ctx": 128,
22
  "num_attention_heads": 12,
@@ -28,7 +27,7 @@
28
  "rope_theta": 10000.0,
29
  "tie_word_embeddings": false,
30
  "torch_dtype": "float32",
31
- "transformers_version": "4.43.1",
32
  "use_cache": true,
33
  "vocab_size": 43176
34
  }
 
16
  "initializer_range": 0.02,
17
  "intermediate_size": 1536,
18
  "max_position_embeddings": 1024,
 
19
  "model_type": "bit_llama",
20
  "n_ctx": 128,
21
  "num_attention_heads": 12,
 
27
  "rope_theta": 10000.0,
28
  "tie_word_embeddings": false,
29
  "torch_dtype": "float32",
30
+ "transformers_version": "4.38.2",
31
  "use_cache": true,
32
  "vocab_size": 43176
33
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b54db5c0bd7c16b81d205546b0424371ca6c7f3921aff82b21fe49bc3a0f7a2
3
  size 510960712
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c0708c3f673e330c78b5930215d181a543796f5a4b18429cc9750498fe6e297
3
  size 510960712
tokenizer.json CHANGED
@@ -36,13 +36,23 @@
36
  "special": true
37
  }
38
  ],
39
- "normalizer": null,
40
- "pre_tokenizer": {
41
- "type": "Metaspace",
42
- "replacement": "▁",
43
- "prepend_scheme": "first",
44
- "split": false
 
 
 
 
 
 
 
 
 
45
  },
 
46
  "post_processor": {
47
  "type": "TemplateProcessing",
48
  "single": [
@@ -129,7 +139,6 @@
129
  "end_of_word_suffix": null,
130
  "fuse_unk": true,
131
  "byte_fallback": true,
132
- "ignore_merges": false,
133
  "vocab": {
134
  "<unk>": 0,
135
  "<s>": 1,
 
36
  "special": true
37
  }
38
  ],
39
+ "normalizer": {
40
+ "type": "Sequence",
41
+ "normalizers": [
42
+ {
43
+ "type": "Prepend",
44
+ "prepend": "▁"
45
+ },
46
+ {
47
+ "type": "Replace",
48
+ "pattern": {
49
+ "String": " "
50
+ },
51
+ "content": "▁"
52
+ }
53
+ ]
54
  },
55
+ "pre_tokenizer": null,
56
  "post_processor": {
57
  "type": "TemplateProcessing",
58
  "single": [
 
139
  "end_of_word_suffix": null,
140
  "fuse_unk": true,
141
  "byte_fallback": true,
 
142
  "vocab": {
143
  "<unk>": 0,
144
  "<s>": 1,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b424b2667b6ff1f95ac264726f10142e36ba9a36e85dd23b84f435ef94b9cc29
3
- size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d1245ad5795253debe58bcbfdd83b24f66ab3036e63cd3b66d342f5ad8f590c
3
+ size 4856