reyvan committed on
Commit
82daa44
1 Parent(s): c92f0e2

Upload 3 files

Browse files
Files changed (3) hide show
  1. config.json +6 -6
  2. pytorch_model.bin +2 -2
  3. quantize_config.json +2 -2
config.json CHANGED
@@ -8,10 +8,10 @@
8
  "AutoConfig": "Qwen/Qwen-7B--configuration_qwen.QWenConfig",
9
  "AutoModelForCausalLM": "Qwen/Qwen-7B--modeling_qwen.QWenLMHeadModel"
10
  },
11
- "bf16": true,
12
  "emb_dropout_prob": 0.0,
13
  "fp16": false,
14
- "fp32": false,
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
17
  "intermediate_size": 22016,
@@ -29,8 +29,8 @@
29
  "desc_act": false,
30
  "group_size": 128,
31
  "is_marlin_format": false,
32
- "model_file_base_name": "gptq_model-4bit-128g",
33
- "model_name_or_path": "Qwen-7B-4bit",
34
  "quant_method": "gptq",
35
  "static_groups": false,
36
  "sym": true,
@@ -44,12 +44,12 @@
44
  "tie_word_embeddings": false,
45
  "tokenizer_class": "QWenTokenizer",
46
  "torch_dtype": "float16",
47
- "transformers_version": "4.37.2",
48
  "use_cache": true,
49
  "use_cache_kernel": false,
50
  "use_cache_quantization": false,
51
  "use_dynamic_ntk": true,
52
- "use_flash_attn": true,
53
  "use_logn_attn": true,
54
  "vocab_size": 151936
55
  }
 
8
  "AutoConfig": "Qwen/Qwen-7B--configuration_qwen.QWenConfig",
9
  "AutoModelForCausalLM": "Qwen/Qwen-7B--modeling_qwen.QWenLMHeadModel"
10
  },
11
+ "bf16": false,
12
  "emb_dropout_prob": 0.0,
13
  "fp16": false,
14
+ "fp32": true,
15
  "hidden_size": 4096,
16
  "initializer_range": 0.02,
17
  "intermediate_size": 22016,
 
29
  "desc_act": false,
30
  "group_size": 128,
31
  "is_marlin_format": false,
32
+ "model_file_base_name": null,
33
+ "model_name_or_path": null,
34
  "quant_method": "gptq",
35
  "static_groups": false,
36
  "sym": true,
 
44
  "tie_word_embeddings": false,
45
  "tokenizer_class": "QWenTokenizer",
46
  "torch_dtype": "float16",
47
+ "transformers_version": "4.38.1",
48
  "use_cache": true,
49
  "use_cache_kernel": false,
50
  "use_cache_quantization": false,
51
  "use_dynamic_ntk": true,
52
+ "use_flash_attn": false,
53
  "use_logn_attn": true,
54
  "vocab_size": 151936
55
  }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2393b2d40537456cd8cd8cd876999c6ef834e4edc9346e8b7be6e4fa0769a90f
3
- size 5860862723
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d606b03c92a7744aa3d9dc082b393526ba13badc35cdb01e2b470a59ebfa882f
3
+ size 8454625504
quantize_config.json CHANGED
@@ -6,8 +6,8 @@
6
  "static_groups": false,
7
  "sym": true,
8
  "true_sequential": true,
9
- "model_name_or_path": "Qwen-7B-4bit",
10
- "model_file_base_name": "gptq_model-4bit-128g",
11
  "is_marlin_format": false,
12
  "quant_method": "gptq"
13
  }
 
6
  "static_groups": false,
7
  "sym": true,
8
  "true_sequential": true,
9
+ "model_name_or_path": null,
10
+ "model_file_base_name": null,
11
  "is_marlin_format": false,
12
  "quant_method": "gptq"
13
  }