finnstrom3693 committed on
Commit
72425ae
1 Parent(s): 8aadb34

Upload MistralForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +1 -1
  2. model.safetensors +2 -2
config.json CHANGED
@@ -17,7 +17,7 @@
17
  "model_type": "mistral",
18
  "num_attention_heads": 18,
19
  "num_hidden_layers": 13,
20
- "num_key_value_heads": 8,
21
  "quantization_aware_training": true,
22
  "rms_norm_eps": 1e-05,
23
  "rope_theta": 10000.0,
 
17
  "model_type": "mistral",
18
  "num_attention_heads": 18,
19
  "num_hidden_layers": 13,
20
+ "num_key_value_heads": 18,
21
  "quantization_aware_training": true,
22
  "rms_norm_eps": 1e-05,
23
  "rope_theta": 10000.0,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:529822ecd38ef3ead5af0d3c42a9143b489bb52253ce162cc19dd08182843035
3
- size 761096120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f301ff74113b0761dcb085f8f8959436f3e0e881d6e06a0dc46687aa5d1a4169
3
+ size 837773240