BAAI
/

Bunny-Llama-3-8B-V

Text Generation

Model card Files Files and versions Community

BoyaWu10 committed on Apr 29

Commit

a65ec98

•

1 Parent(s): b0bb93e

Update README.md

Files changed (1) hide show

README.md +7 -4

README.md CHANGED Viewed

@@ -30,6 +30,9 @@ Before running the snippet, you need to install the following dependencies:
 pip install torch transformers accelerate pillow
 ```
 ```python
 import torch
 import transformers
@@ -43,12 +46,12 @@ transformers.logging.disable_progress_bar()
 warnings.filterwarnings('ignore')
 # set device
-torch.set_default_device('cpu')  # or 'cuda'
 # create model
 model = AutoModelForCausalLM.from_pretrained(
     'BAAI/Bunny-Llama-3-8B-V',
-    torch_dtype=torch.float16,
     device_map='auto',
     trust_remote_code=True)
 tokenizer = AutoTokenizer.from_pretrained(
@@ -59,11 +62,11 @@ tokenizer = AutoTokenizer.from_pretrained(
 prompt = 'Why is the image funny?'
 text = f"A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions. USER: <image>\n{prompt} ASSISTANT:"
 text_chunks = [tokenizer(chunk).input_ids for chunk in text.split('<image>')]
-input_ids = torch.tensor(text_chunks[0] + [-200] + text_chunks[1][1:], dtype=torch.long).unsqueeze(0)
 # image, sample images can be found in images folder
 image = Image.open('example_2.png')
-image_tensor = model.process_images([image], model.config).to(dtype=model.dtype)
 # generate
 output_ids = model.generate(

 pip install torch transformers accelerate pillow
 ```
+If there is enough CUDA memory, this snippet runs faster with `CUDA_VISIBLE_DEVICES=0` set.
 ```python
 import torch
 import transformers
 warnings.filterwarnings('ignore')
 # set device
+device = 'cuda'  # or cpu
 # create model
 model = AutoModelForCausalLM.from_pretrained(
     'BAAI/Bunny-Llama-3-8B-V',
+    torch_dtype=torch.float16, # float32 for cpu
     device_map='auto',
     trust_remote_code=True)
 tokenizer = AutoTokenizer.from_pretrained(
 prompt = 'Why is the image funny?'
 text = f"A chat between a curious user and an artificial intelligence assistant. The assistant gives helpful, detailed, and polite answers to the user's questions. USER: <image>\n{prompt} ASSISTANT:"
 text_chunks = [tokenizer(chunk).input_ids for chunk in text.split('<image>')]
+input_ids = torch.tensor(text_chunks[0] + [-200] + text_chunks[1][1:], dtype=torch.long).unsqueeze(0).to(device)
 # image, sample images can be found in images folder
 image = Image.open('example_2.png')
+image_tensor = model.process_images([image], model.config).to(dtype=model.dtype, device=device)
 # generate
 output_ids = model.generate(