wejoncy committed
Commit ef005b7
1 Parent(s): 928ba43

update config

Files changed (1): config.json (+19, -18)
config.json CHANGED
@@ -22,7 +22,21 @@
   "num_hidden_layers": 32,
   "num_key_value_heads": 8,
   "pretraining_tp": 1,
-  "quant_config": {
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": {
+    "factor": 8.0,
+    "high_freq_factor": 4.0,
+    "low_freq_factor": 1.0,
+    "original_max_position_embeddings": 8192,
+    "rope_type": "llama3"
+  },
+  "rope_theta": 500000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.45.1",
+  "use_cache": true,
+  "vocab_size": 128256,
+  "quantization_config": {
     "model.layers.0.mlp.down_proj": {
       "bias": false,
       "enable_norm": true,
@@ -5398,20 +5412,7 @@
         -1,
         8
       ]
-    }
-  },
-  "rms_norm_eps": 1e-05,
-  "rope_scaling": {
-    "factor": 8.0,
-    "high_freq_factor": 4.0,
-    "low_freq_factor": 1.0,
-    "original_max_position_embeddings": 8192,
-    "rope_type": "llama3"
-  },
-  "rope_theta": 500000.0,
-  "tie_word_embeddings": false,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.45.1",
-  "use_cache": true,
-  "vocab_size": 128256
-}
+    },
+    "quant_method": "vptq"
+  }
+}
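In short, this commit moves the per-layer VPTQ settings out of the non-standard top-level "quant_config" key and into a "quantization_config" block placed after the regular model fields, tagging it with "quant_method": "vptq", presumably so that loaders that look for the conventional "quantization_config" key can discover the quantization scheme. A minimal sanity check of the new layout (a sketch, assuming the updated config.json has been downloaded locally; only the standard-library json module is used):

    # Verify the corrected nesting of config.json after this commit.
    import json

    with open("config.json") as f:
        cfg = json.load(f)

    # The old non-standard key is gone; settings now live under the
    # conventional "quantization_config" key.
    assert "quant_config" not in cfg
    qcfg = cfg["quantization_config"]

    # The method tag identifies which quantizer produced the weights.
    assert qcfg["quant_method"] == "vptq"

    # Model-level fields are siblings of quantization_config, not nested in it.
    for key in ("rms_norm_eps", "rope_scaling", "rope_theta", "vocab_size"):
        assert key in cfg and key not in qcfg

    print("config.json structure looks correct")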