nielsr committed
Commit 740fb26
1 Parent(s): 1c3da59

Update app.py

Files changed (1)
  1. app.py +4 -4
app.py CHANGED
@@ -18,10 +18,10 @@ blip_processor_large = AutoProcessor.from_pretrained("Salesforce/blip-image-capt
 blip_model_large = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-large").to(device)
 
 blip2_processor = AutoProcessor.from_pretrained("Salesforce/blip2-opt-6.7b")
-blip2_model = Blip2ForConditionalGeneration.from_pretrained("Salesforce/blip2-opt-6.7b", device_map="auto", torch_dtype=torch.float16)
+blip2_model = Blip2ForConditionalGeneration.from_pretrained("Salesforce/blip2-opt-6.7b", device_map="auto", load_in_4bit=True, torch_dtype=torch.float16)
 
 instructblip_processor = AutoProcessor.from_pretrained("Salesforce/instructblip-vicuna-7b")
-instructblip_model = InstructBlipForConditionalGeneration.from_pretrained("Salesforce/instructblip-vicuna-7b").to(device)
+instructblip_model = InstructBlipForConditionalGeneration.from_pretrained("Salesforce/instructblip-vicuna-7b", device_map="auto", load_in_4bit=True, torch_dtype=torch.float16)
 
 def generate_caption(processor, model, image, tokenizer=None, use_float_16=False):
     inputs = processor(images=image, return_tensors="pt").to(device)
@@ -42,7 +42,7 @@ def generate_caption(processor, model, image, tokenizer=None, use_float_16=False
 def generate_caption_blip2(processor, model, image, replace_token=False):
     prompt = "Generate a caption for the image:"
 
-    inputs = processor(images=image, text=prompt, return_tensors="pt").to(device=device, dtype=torch.float16)
+    inputs = processor(images=image, text=prompt, return_tensors="pt").to(device=model.device, dtype=torch.float16)
 
     generated_ids = model.generate(pixel_values=inputs.pixel_values,
                                    num_beams=5, max_length=50, min_length=1, top_p=0.9,
@@ -61,7 +61,7 @@ def generate_captions(image):
 
     caption_blip2 = generate_caption_blip2(blip2_processor, blip2_model, image).strip()
 
-    caption_instructblip = generate_caption_blip2(instructblip_processor, instructblip_model, image)
+    caption_instructblip = generate_caption_blip2(instructblip_processor, instructblip_model, image, replace_token=True)
 
     return caption_git_large_coco, caption_blip_large, caption_blip2, caption_instructblip
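
For context: the commit switches the two 7B-class checkpoints from full-precision loading to 4-bit quantized loading, and moves inputs to model.device instead of a hard-coded device, since device_map="auto" may place the weights elsewhere. Below is a minimal sketch (not part of the commit) of the same 4-bit load written with an explicit BitsAndBytesConfig, the more explicit equivalent of the load_in_4bit=True shortcut in recent transformers releases; it assumes the bitsandbytes package is installed and a CUDA GPU is available.

    import torch
    from transformers import AutoProcessor, Blip2ForConditionalGeneration, BitsAndBytesConfig

    # Sketch only: explicit-config form of load_in_4bit=True.
    # Assumes bitsandbytes is installed and a CUDA device exists.
    bnb_config = BitsAndBytesConfig(
        load_in_4bit=True,
        bnb_4bit_compute_dtype=torch.float16,  # compute in fp16, weights stay 4-bit
    )

    processor = AutoProcessor.from_pretrained("Salesforce/blip2-opt-6.7b")
    model = Blip2ForConditionalGeneration.from_pretrained(
        "Salesforce/blip2-opt-6.7b",
        device_map="auto",               # let accelerate decide placement
        quantization_config=bnb_config,
    )

    # Inputs then follow the model, matching the generate_caption_blip2 change:
    # processor(...).to(device=model.device, dtype=torch.float16)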