lvkaokao committed on
Commit
56bb9e3
1 Parent(s): 2c7e06a

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +3 -1
README.md CHANGED
@@ -202,7 +202,9 @@ outputs = model.generate(inputs, streamer=streamer, max_new_tokens=300)
202
  ```python
203
  from transformers import AutoTokenizer, TextStreamer
204
  from intel_extension_for_transformers.transformers import AutoModelForCausalLM, WeightOnlyQuantConfig
205
- model_name = "Intel/neural-chat-7b-v3-1"
 
 
206
  config = WeightOnlyQuantConfig(compute_dtype="bf16", weight_dtype="int4")
207
  prompt = "Once upon a time, there existed a little girl,"
208
 
 
202
  ```python
203
  from transformers import AutoTokenizer, TextStreamer
204
  from intel_extension_for_transformers.transformers import AutoModelForCausalLM, WeightOnlyQuantConfig
205
+ model_name = "Intel/neural-chat-7b-v3-1"
206
+
207
+ # For int8 weight-only quantization, set weight_dtype="int8" instead of "int4".
208
  config = WeightOnlyQuantConfig(compute_dtype="bf16", weight_dtype="int4")
209
  prompt = "Once upon a time, there existed a little girl,"
210