zhaospei committed on
Commit
4be4e53
1 Parent(s): 9c69fb4

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +12 -10
config.json CHANGED
@@ -18,16 +18,18 @@
18
  "num_key_value_heads": 32,
19
  "pretraining_tp": 1,
20
  "quantization_config": {
21
- "backend": "llm-awq",
22
- "bits": 4,
23
- "do_fuse": false,
24
- "fuse_max_seq_len": null,
25
- "group_size": 128,
26
- "modules_to_fuse": null,
27
- "modules_to_not_convert": null,
28
- "quant_method": "awq",
29
- "version": "gemm",
30
- "zero_point": true
 
 
31
  },
32
  "rms_norm_eps": 1e-06,
33
  "rope_scaling": {
 
18
  "num_key_value_heads": 32,
19
  "pretraining_tp": 1,
20
  "quantization_config": {
21
+ "_load_in_4bit": false,
22
+ "_load_in_8bit": true,
23
+ "bnb_4bit_compute_dtype": "float32",
24
+ "bnb_4bit_quant_type": "nf4",
25
+ "bnb_4bit_use_double_quant": true,
26
+ "llm_int8_enable_fp32_cpu_offload": false,
27
+ "llm_int8_has_fp16_weight": false,
28
+ "llm_int8_skip_modules": null,
29
+ "llm_int8_threshold": 6.0,
30
+ "load_in_4bit": false,
31
+ "load_in_8bit": true,
32
+ "quant_method": "bitsandbytes"
33
  },
34
  "rms_norm_eps": 1e-06,
35
  "rope_scaling": {