Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +3 -0
- cal_data.safetensors +3 -0
- config.json +36 -0
- generation_config.json +7 -0
- hidden_states.safetensors +3 -0
- job_new.json +0 -0
- measurement.json +0 -0
- out_tensor/lm_head.safetensors +3 -0
- out_tensor/model.layers.0.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.0.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.0.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.0.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.0.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.0.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.0.self_attn.v_proj.safetensors +3 -0
- out_tensor/model.layers.1.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.1.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.1.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.1.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.1.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.1.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.1.self_attn.v_proj.safetensors +3 -0
- out_tensor/model.layers.10.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.10.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.10.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.10.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.10.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.10.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.10.self_attn.v_proj.safetensors +3 -0
- out_tensor/model.layers.11.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.11.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.11.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.11.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.11.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.11.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.11.self_attn.v_proj.safetensors +3 -0
- out_tensor/model.layers.12.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.12.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.12.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.12.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.12.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.12.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.12.self_attn.v_proj.safetensors +3 -0
- out_tensor/model.layers.13.mlp.down_proj.safetensors +3 -0
- out_tensor/model.layers.13.mlp.gate_proj.safetensors +3 -0
- out_tensor/model.layers.13.mlp.up_proj.safetensors +3 -0
- out_tensor/model.layers.13.self_attn.k_proj.safetensors +3 -0
- out_tensor/model.layers.13.self_attn.o_proj.safetensors +3 -0
- out_tensor/model.layers.13.self_attn.q_proj.safetensors +3 -0
- out_tensor/model.layers.13.self_attn.v_proj.safetensors +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<|extra_idx|>": 120073
|
3 |
+
}
|
cal_data.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9d9c9f447b588607ca4e53e973ab9e70d7daab6150b779913f2b625ae676a00e
|
3 |
+
size 1884248
|
config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "augmxnt/shisa-base-7b-v1",
|
3 |
+
"architectures": [
|
4 |
+
"MistralForCausalLM"
|
5 |
+
],
|
6 |
+
"bos_token_id": 1,
|
7 |
+
"eos_token_id": 2,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 4096,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 14336,
|
12 |
+
"max_position_embeddings": 32768,
|
13 |
+
"model_type": "mistral",
|
14 |
+
"num_attention_heads": 32,
|
15 |
+
"num_hidden_layers": 32,
|
16 |
+
"num_key_value_heads": 8,
|
17 |
+
"rms_norm_eps": 1e-05,
|
18 |
+
"rope_theta": 10000.0,
|
19 |
+
"sliding_window": 4096,
|
20 |
+
"tie_word_embeddings": false,
|
21 |
+
"torch_dtype": "bfloat16",
|
22 |
+
"transformers_version": "4.35.1",
|
23 |
+
"use_cache": false,
|
24 |
+
"vocab_size": 120074,
|
25 |
+
"quantization_config": {
|
26 |
+
"quant_method": "exl2",
|
27 |
+
"version": "0.0.17",
|
28 |
+
"bits": 4.0,
|
29 |
+
"head_bits": 6,
|
30 |
+
"calibration": {
|
31 |
+
"rows": 100,
|
32 |
+
"length": 2048,
|
33 |
+
"dataset": "(default)"
|
34 |
+
}
|
35 |
+
}
|
36 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.35.1",
|
6 |
+
"use_cache": false
|
7 |
+
}
|
hidden_states.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a23327fbf558f2dd61f661f806e805046fc1f41dc0340c8922efd3a55f9962fb
|
3 |
+
size 1929389952
|
job_new.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
measurement.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
out_tensor/lm_head.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58c170b6719adb640c05518a92163047f1d7dd84892f57dc54287f1f373bbc68
|
3 |
+
size 390088824
|
out_tensor/model.layers.0.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d736c895070fbcef949f718db7849901f4fafde0b0f7aae02fd46ed3621cabda
|
3 |
+
size 32582808
|
out_tensor/model.layers.0.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ed79118c9e6e7d5f92df8ce2b408889a501d82f3eb0f032a4a039f1c3d837ca
|
3 |
+
size 31040792
|
out_tensor/model.layers.0.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8d7d1c14fc393fafbeff13785d1500506e145ab90fa3bd46d09f2ba5bac4568
|
3 |
+
size 32130320
|
out_tensor/model.layers.0.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb36ee0cec0c2902beca9abf3dbf78b68c4ab2638269f65755df8e825ee9825a
|
3 |
+
size 2233632
|
out_tensor/model.layers.0.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20a6017a4b9693f61cfce1bae12f0b24f924d6c0b53c6e374013f8fba94696a6
|
3 |
+
size 8881440
|
out_tensor/model.layers.0.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cd68a2e4d2b7c8907017b7f86071ce6b6dcd53b4e98c1c46b816d5918abbedb9
|
3 |
+
size 8881440
|
out_tensor/model.layers.0.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b09e675a7d743b501aced5d8c033678734fa34703a19835c1a8ec3199d229dec
|
3 |
+
size 2704672
|
out_tensor/model.layers.1.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5a91630bc96dd8e5f71578b394d652fa87608aa1bcb0ce0fda52203b18db2d78
|
3 |
+
size 31192356
|
out_tensor/model.layers.1.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07d17646638f5acf7747c3cc83cfc7d613a6c2e6128ac984efb5b489cadb67dc
|
3 |
+
size 23700760
|
out_tensor/model.layers.1.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e526f1303754fc85a7344709891d0b5db0f55570dbb72c82bc2ffc7f19cb7495
|
3 |
+
size 24790288
|
out_tensor/model.layers.1.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e1fea1ca60fa0b89bbb7ee218e68d78132836dac770e3632d3c0ad03559f118
|
3 |
+
size 2757920
|
out_tensor/model.layers.1.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:55efa27039d01020a5ec611218be3c429dd5ceafe7e632ef1417c705a53b5bd0
|
3 |
+
size 10978600
|
out_tensor/model.layers.1.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6cb76964e481f9d98f59150755a8355d48190034ad0a8aa03e4808b3ed54a790
|
3 |
+
size 10978600
|
out_tensor/model.layers.1.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b1442d4f212fe3c8ee835eafa2ae033161d890b0b5c9c375afbf2e27674c75ca
|
3 |
+
size 3228960
|
out_tensor/model.layers.10.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e74b67c4197db92a0df85ac67484784b4049346caa5b892f12e8b5927b69b6d1
|
3 |
+
size 31192364
|
out_tensor/model.layers.10.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:284f451bc30c6a8b3dc39d70a8339642300a07c2b75c573da692bab1dd8c08e3
|
3 |
+
size 23700768
|
out_tensor/model.layers.10.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65d335c716277b5375943c40cd485665791f44a1bd763204544b6dd2ea0a5ed6
|
3 |
+
size 24790288
|
out_tensor/model.layers.10.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbb8aaf19403deda45ec5c6b2b73814cbaa0de03b0090f0f8f0d2adf5a7f842d
|
3 |
+
size 2233632
|
out_tensor/model.layers.10.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2fee1cb46c0ccfbfc64cb3d9354735fe5d0f06fb8cad296037ffcd63f16d3aff
|
3 |
+
size 8881448
|
out_tensor/model.layers.10.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93ca6f7ff6ac09fe67a89a50461c60fae510f5b8427e62b79bab578d4eef306c
|
3 |
+
size 8881448
|
out_tensor/model.layers.10.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d312283a26b57d479549e0e145964ed4fdf7598ee4cf5844dfd356ab7da1f6
|
3 |
+
size 2704672
|
out_tensor/model.layers.11.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d657c1c47394cba9111251f1e8dda038d443ecc0e67d5e4ac3c0ebce71f5600
|
3 |
+
size 25619616
|
out_tensor/model.layers.11.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2607af501f22c79f4928d0160f1a39a1151a4044ed7383c841b5c9c822a57fe
|
3 |
+
size 23700768
|
out_tensor/model.layers.11.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:33d611c40ad88bf1f0869a4a16aa649a7b8ba9566e8219e9acdced0381382431
|
3 |
+
size 24790288
|
out_tensor/model.layers.11.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d4f456e62ed9e581156a604f0389ae4eaa4b229fb046e62d4f7ab897efcced7e
|
3 |
+
size 2233632
|
out_tensor/model.layers.11.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:285075d2bb5ab28e65ce9253a06674f7e1e2373d2846470b301954c2ba8a76b0
|
3 |
+
size 8881448
|
out_tensor/model.layers.11.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c1a3f441b99d7e5f8d95cdce5727168a4962b2bcc9c319faac149c78c8b40ae
|
3 |
+
size 8881448
|
out_tensor/model.layers.11.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2ff492be80a1750b1fa40198d701bb4d5938ce9b71b8deeb3db5de6d62b9c67
|
3 |
+
size 2704672
|
out_tensor/model.layers.12.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b51ede6b8a6738d790870671823cf733235e0b22446ecf044f74f3447e57a0ea
|
3 |
+
size 25619616
|
out_tensor/model.layers.12.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98064d8f6220d112d253c35a32684d42f2b8a605a33720a6b8ef49caaa3b8d86
|
3 |
+
size 23700768
|
out_tensor/model.layers.12.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:464d517f3200708cd59a33595efe69a4231d5fe510dd5c812df09ead4157ca01
|
3 |
+
size 24790288
|
out_tensor/model.layers.12.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f3792ae134358876f5cc0a5f9fc0b94b9c79ed2d9b27d6e486f164bb0a25294
|
3 |
+
size 2233632
|
out_tensor/model.layers.12.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b73d1372b9f6c66c86fdd6706cec68b2a0368075d17eadb404f523dea2732202
|
3 |
+
size 8881448
|
out_tensor/model.layers.12.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89a590985a00a9fdd3a72044561d332f2d58b1c00f089c5e91a1b041652c5956
|
3 |
+
size 8881448
|
out_tensor/model.layers.12.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2503ded6abbdfd21cbb7b568e08ca1943afed1254c903b90c6395ad13068d184
|
3 |
+
size 2704672
|
out_tensor/model.layers.13.mlp.down_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a557b699c1c4dc03c3510fca6359cf85850d021a8f2c4541c6685a01787ee33
|
3 |
+
size 31192364
|
out_tensor/model.layers.13.mlp.gate_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b4da890933cc00b8b543d2de6dba441e547b3bc2dcfa8a2859b516f2a2a6aadb
|
3 |
+
size 23700768
|
out_tensor/model.layers.13.mlp.up_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3eb7b1a83059b8f7f2584f6693620b0f3f9c877e2197d2dc21f750b987d9b9b9
|
3 |
+
size 24790288
|
out_tensor/model.layers.13.self_attn.k_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc13612f8e67c41aee036e56c99cb48784e05b689967201603fe1eebc481eace
|
3 |
+
size 1671904
|
out_tensor/model.layers.13.self_attn.o_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:146c20431ac25435e3689225632fb30e2f007fbe0a1b6dcfe8f3981f43d1222f
|
3 |
+
size 6636256
|
out_tensor/model.layers.13.self_attn.q_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d45a8f1e2bea174f9a1f7b23294fb7b1ae930bb224b205bf01f7ecf437de73b
|
3 |
+
size 6636256
|
out_tensor/model.layers.13.self_attn.v_proj.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:331f1a839a1fcca6e171b8a29d0faa386f435b8148215dd8d75a4ce232052ea5
|
3 |
+
size 1680288
|