wejoncy committed on
Commit
c578e69
1 Parent(s): 6335a38

update config

Browse files
Files changed (1) hide show
  1. config.json +19 -18
config.json CHANGED
@@ -23,7 +23,21 @@
23
  "num_hidden_layers": 126,
24
  "num_key_value_heads": 8,
25
  "pretraining_tp": 1,
26
- "quant_config": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
  "model.layers.0.mlp.down_proj": {
28
  "bias": null,
29
  "enable_norm": true,
@@ -21191,20 +21205,7 @@
21191
  -1,
21192
  8
21193
  ]
21194
- }
21195
- },
21196
- "rms_norm_eps": 1e-05,
21197
- "rope_scaling": {
21198
- "factor": 8.0,
21199
- "high_freq_factor": 4.0,
21200
- "low_freq_factor": 1.0,
21201
- "original_max_position_embeddings": 8192,
21202
- "rope_type": "llama3"
21203
- },
21204
- "rope_theta": 500000.0,
21205
- "tie_word_embeddings": false,
21206
- "torch_dtype": "bfloat16",
21207
- "transformers_version": "4.45.2",
21208
- "use_cache": true,
21209
- "vocab_size": 128256
21210
- }
 
23
  "num_hidden_layers": 126,
24
  "num_key_value_heads": 8,
25
  "pretraining_tp": 1,
26
+ "rms_norm_eps": 1e-05,
27
+ "rope_scaling": {
28
+ "factor": 8.0,
29
+ "high_freq_factor": 4.0,
30
+ "low_freq_factor": 1.0,
31
+ "original_max_position_embeddings": 8192,
32
+ "rope_type": "llama3"
33
+ },
34
+ "rope_theta": 500000.0,
35
+ "tie_word_embeddings": false,
36
+ "torch_dtype": "bfloat16",
37
+ "transformers_version": "4.45.2",
38
+ "use_cache": true,
39
+ "vocab_size": 128256,
40
+ "quantization_config": {
41
  "model.layers.0.mlp.down_proj": {
42
  "bias": null,
43
  "enable_norm": true,
 
21205
  -1,
21206
  8
21207
  ]
21208
+ },
21209
+ "quant_method": "vptq"
21210
+ }
21211
+ }