Haihao committed on
Commit
bd11ee4
1 Parent(s): 7b86016

Update README.md

Browse files

Use bf16 compute type

Files changed (1) hide show
  1. README.md +1 -1
README.md CHANGED
@@ -157,7 +157,7 @@ So, the sum of 100, 520, and 60 is 680.
157
  from transformers import AutoTokenizer, TextStreamer
158
  from intel_extension_for_transformers.transformers import AutoModelForCausalLM, WeightOnlyQuantConfig
159
  model_name = "Intel/neural-chat-7b-v3-3"
160
- config = WeightOnlyQuantConfig(compute_dtype="int8", weight_dtype="int4")
161
  prompt = "Once upon a time, there existed a little girl,"
162
 
163
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
 
157
  from transformers import AutoTokenizer, TextStreamer
158
  from intel_extension_for_transformers.transformers import AutoModelForCausalLM, WeightOnlyQuantConfig
159
  model_name = "Intel/neural-chat-7b-v3-3"
160
+ config = WeightOnlyQuantConfig(compute_dtype="bf16", weight_dtype="int4")
161
  prompt = "Once upon a time, there existed a little girl,"
162
 
163
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)