BAAI
/

AquilaChat2-34B

Text Generation

Model card Files Files and versions Community

Anhforth committed on Oct 20, 2023

Commit

17734e6

•

1 Parent(s): 5220fea

Update README.md

Files changed (1) hide show

README.md +11 -1

README.md CHANGED Viewed

@@ -24,11 +24,21 @@ The additional details of the Aquila model will be presented in the official tec
 ```python
 from transformers import AutoTokenizer, AutoModelForCausalLM
 import torch
 device = torch.device("cuda:0")
 model_info = "BAAI/AquilaChat2-34B"
 tokenizer = AutoTokenizer.from_pretrained(model_info, trust_remote_code=True)
-model = AutoModelForCausalLM.from_pretrained(model_info, trust_remote_code=True, torch_dtype=torch.bfloat16)
 model.eval()
 model.to(device)
 text = "请给出10个要到北京旅游的理由。"

 ```python
 from transformers import AutoTokenizer, AutoModelForCausalLM
+from transformers import BitsAndBytesConfig
 import torch
 device = torch.device("cuda:0")
 model_info = "BAAI/AquilaChat2-34B"
 tokenizer = AutoTokenizer.from_pretrained(model_info, trust_remote_code=True)
+quantization_config=BitsAndBytesConfig(
+                        load_in_4bit=True,
+                        bnb_4bit_use_double_quant=True,
+                        bnb_4bit_quant_type="nf4",
+                        bnb_4bit_compute_dtype=torch.bfloat16,
+                    )
+model = AutoModelForCausalLM.from_pretrained(model_info, trust_remote_code=True, torch_dtype=torch.bfloat16,
+                                                # quantization_config=quantization_config, # Uncomment this line for 4bit quantization
+                                                )
 model.eval()
 model.to(device)
 text = "请给出10个要到北京旅游的理由。"