Xenova HF Staff committed on
Commit
1346878
·
verified ·
1 Parent(s): daa5831

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ onnx/onnx/model.onnx_data filter=lfs diff=lfs merge=lfs -text
37
+ onnx/onnx/model.onnx_data_1 filter=lfs diff=lfs merge=lfs -text
38
+ onnx/onnx/model_fp16.onnx_data filter=lfs diff=lfs merge=lfs -text
39
+ onnx/onnx/model_q4.onnx_data filter=lfs diff=lfs merge=lfs -text
40
+ onnx/onnx/model_q4f16.onnx_data filter=lfs diff=lfs merge=lfs -text
onnx/chat_template.jinja ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {% if messages[0]['role'] == 'system' %}<|bos|><|user_start|>{{ messages[0]['content'] }}
2
+
3
+ {{ messages[1]['content'] }}<|user_end|>{% set messages = messages[2:] %}{% else %}<|bos|>{% endif %}{% for message in messages %}{% if loop.index0 % 2 == 0 %}<|user_start|>{{ message['content'] }}<|user_end|>{% else %}<|assistant_start|>{{ message['content'] }}<|assistant_end|>{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant_start|>{% endif %}
onnx/config.json ADDED
@@ -0,0 +1,45 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "NanoGPTForCausalLM"
4
+ ],
5
+ "attention_dropout": 0.0,
6
+ "bos_token": "<|bos|>",
7
+ "bos_token_id": 65527,
8
+ "chat_template": "{% if messages[0]['role'] == 'system' %}<|bos|><|user_start|>{{ messages[0]['content'] }}\n\n{{ messages[1]['content'] }}<|user_end|>{% set messages = messages[2:] %}{% else %}<|bos|>{% endif %}{% for message in messages %}{% if loop.index0 % 2 == 0 %}<|user_start|>{{ message['content'] }}<|user_end|>{% else %}<|assistant_start|>{{ message['content'] }}<|assistant_end|>{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant_start|>{% endif %}",
9
+ "dtype": "bfloat16",
10
+ "eos_token": "<|assistant_end|>",
11
+ "eos_token_id": 65531,
12
+ "hidden_act": "relu2",
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 5120,
15
+ "logits_soft_cap": 15.0,
16
+ "max_position_embeddings": 2048,
17
+ "model_type": "nanochat",
18
+ "n_embd": 1280,
19
+ "n_head": 10,
20
+ "n_layer": 20,
21
+ "num_key_value_heads": 10,
22
+ "pad_token": "<|assistant_end|>",
23
+ "pad_token_id": 65531,
24
+ "qkv_bias": false,
25
+ "resid_dropout": 0.0,
26
+ "rms_norm_eps": 1e-06,
27
+ "rope_scaling": null,
28
+ "rope_theta": 10000.0,
29
+ "tie_word_embeddings": false,
30
+ "transformers_version": "4.57.0",
31
+ "use_cache": true,
32
+ "vocab_size": 65536,
33
+ "transformers.js_config": {
34
+ "use_external_data_format": {
35
+ "model.onnx": 2,
36
+ "model_fp16.onnx": 1,
37
+ "model_q4.onnx": 1,
38
+ "model_q4f16.onnx": 1
39
+ },
40
+ "kv_cache_dtype": {
41
+ "q4f16": "float16",
42
+ "fp16": "float16"
43
+ }
44
+ }
45
+ }
onnx/onnx/model.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5d888397a4f8afcf3c120d0b0071a5a0dd641040cd4782c0316f5a40f1be2b8
3
+ size 191419
onnx/onnx/model.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c58e65e672b04216a5e28286a8a45fa08e0d2bc86c6d407b2ea1827faf11b65
3
+ size 1909671936
onnx/onnx/model.onnx_data_1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:beb6cc27be5b7e85a93a11aa93cf89afc56c4c9049d3e521bf1611a2a524e657
3
+ size 335544320
onnx/onnx/model_fp16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1df67c56aab2b644ae38b0c667bd006835b15e13bcb3175dc4d5371a738eca8b
3
+ size 290893
onnx/onnx/model_fp16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3c4b1c14c3f6035f373d4d24e6e1973db6486768d1222d7a0de04d332525fab
3
+ size 1122715648
onnx/onnx/model_q4.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b81c840993bd104e39d6b333a4e42f63ce5749b6690796fb956ae431fcede8e
3
+ size 223545
onnx/onnx/model_q4.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:994c21b844cb03f673c9c40e1b7feedf301a2a0caa10915471f3b03640c56e1d
3
+ size 634996736
onnx/onnx/model_q4f16.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3f0043592f6cc9ccbfc2485ca958ba0d5c4259cda2d6045db402d0610a9f6b14
3
+ size 278295
onnx/onnx/model_q4f16.onnx_data ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ef9ab2b7b280b54beda19fb344c127107cd57e24134acaa2f506af1977d4a702
3
+ size 436881408
onnx/special_tokens_map.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {}
onnx/tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
onnx/tokenizer_config.json ADDED
@@ -0,0 +1,81 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "65527": {
4
+ "content": "<|bos|>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "65528": {
12
+ "content": "<|user_start|>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "65529": {
20
+ "content": "<|user_end|>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "65530": {
28
+ "content": "<|assistant_start|>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "65531": {
36
+ "content": "<|assistant_end|>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "65532": {
44
+ "content": "<|python_start|>",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "65533": {
52
+ "content": "<|python_end|>",
53
+ "lstrip": false,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "65534": {
60
+ "content": "<|output_start|>",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "65535": {
68
+ "content": "<|output_end|>",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ }
75
+ },
76
+ "clean_up_tokenization_spaces": false,
77
+ "extra_special_tokens": {},
78
+ "model_max_length": 1000000000000000019884624838656,
79
+ "tokenizer_class": "PreTrainedTokenizerFast",
80
+ "chat_template": "{% if messages[0]['role'] == 'system' %}<|bos|><|user_start|>{{ messages[0]['content'] }}\n\n{{ messages[1]['content'] }}<|user_end|>{% set messages = messages[2:] %}{% else %}<|bos|>{% endif %}{% for message in messages %}{% if loop.index0 % 2 == 0 %}<|user_start|>{{ message['content'] }}<|user_end|>{% else %}<|assistant_start|>{{ message['content'] }}<|assistant_end|>{% endif %}{% endfor %}{% if add_generation_prompt %}<|assistant_start|>{% endif %}"
81
+ }