Commit bd67535
Parent(s): 33f9417
switch back to opt-2.7b
app.py CHANGED
@@ -7,12 +7,7 @@ from PIL import Image
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 
 
-
-processor = AutoProcessor.from_pretrained("Salesforce/blip-itm-large-coco")
-# Load model in int8 using bitsandbytes, and pass device_map='auto'
-model = Blip2ForConditionalGeneration.from_pretrained(
-    "Salesforce/blip-itm-large-coco", load_in_8bit=True, device_map='auto'
-)
+
 
 
 # Load the BLIP-2 model and processor (needs A10G)
@@ -22,14 +17,14 @@ model = Blip2ForConditionalGeneration.from_pretrained(
 # "Salesforce/blip2-opt-6.7b-coco", load_in_8bit=True, device_map='auto'
 #)
 
-# Uncomment lines 20, 22, 23, & 24 to begin using blip2-
+# Uncomment lines 20, 22, 23, & 24 to begin using blip2-opt-2.7b model (can run on T4 Medium)
 
 # Load the BLIP-2 model and processor
-
+processor = AutoProcessor.from_pretrained("Salesforce/blip2-opt-2.7b")
 # Load model in int8 using bitsandbytes, and pass device_map='auto'
-
-
-
+model = Blip2ForConditionalGeneration.from_pretrained(
+    "Salesforce/blip2-opt-2.7b", load_in_8bit=True, device_map='auto'
+)
 
 def blip2_interface(image, prompted_caption_text, vqa_question, chat_context):
     # Prepare image input
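
For context (not part of the commit), a minimal sketch of how the processor and 8-bit model loaded above are commonly used to caption an image with the transformers generate API; the image path "example.jpg" and the max_new_tokens value are illustrative assumptions, not taken from this repository.

import torch
from PIL import Image
from transformers import AutoProcessor, Blip2ForConditionalGeneration

device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Same loading pattern as in the commit: int8 weights via bitsandbytes,
# with device placement handled by device_map='auto'.
processor = AutoProcessor.from_pretrained("Salesforce/blip2-opt-2.7b")
model = Blip2ForConditionalGeneration.from_pretrained(
    "Salesforce/blip2-opt-2.7b", load_in_8bit=True, device_map='auto'
)

# Illustrative usage: caption a local image ("example.jpg" is an assumed path).
image = Image.open("example.jpg").convert("RGB")
inputs = processor(images=image, return_tensors="pt").to(device, torch.float16)
generated_ids = model.generate(**inputs, max_new_tokens=30)
caption = processor.batch_decode(generated_ids, skip_special_tokens=True)[0].strip()
print(caption)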