Spaces:

KwabsHug
/

Moondream1cputest

Sleeping

App Files Files Community

kwabs22 committed on Feb 18

Commit

37f1dd5

•

1 Parent(s): 032673b

remove unneeded comments

Browse files

Files changed (1) hide show

app.py +3 -13

app.py CHANGED Viewed

@@ -9,15 +9,7 @@ def clear_model(model):
     del model
     gc.collect()
 def process_image_and_question(image, question):
-    # Placeholder for your image processing and question answering
-    # Replace this with your actual model processing
-    # For example:
-    # enc_image = model.encode_image(image)
-    # answer = model.answer_question(enc_image, question, tokenizer)
-    # return answer
     FinalOutput = ""
     model_id = "vikhyatk/moondream1"
@@ -32,15 +24,13 @@ def process_image_and_question(image, question):
         model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
         tokenizer = Tokenizer.from_pretrained(model_id)
-    # Assuming you have a correct way to process the image
-    #image = Image.open('/content/_57e22ed5-217c-4004-a279-eeecc18cbd55.jpg') #/content/Bard_Generated_Image (3).jpg')
-    # This part of the code is incorrect for a standard transformers model
     enc_image = model.encode_image(image)
     FinalOutput += model.answer_question(enc_image, "how many people are there? also explain if the image is weird?", tokenizer)
     model_size = asizeof.asizeof(model)
     tokenizer_size = asizeof.asizeof(tokenizer)
-    FinalOutput += f"\nModel size in RAM: {model_size} bytes, Tokenizer size in RAM: {tokenizer_size} bytes"
     #model load and set-up = 1 min and inference on CPU = 2 min
     return FinalOutput
@@ -50,7 +40,7 @@ iface = gr.Interface(fn=process_image_and_question,
                      inputs=[gr.Image(type="pil"), gr.Textbox(lines=2, placeholder="Ask a question about the image...")],
                      outputs="text",
                      title="Image Question Answering",
-                     description="Upload an image and ask a question about it. ( 2 - 3 min response time expected )")
 # Launch the interface
 iface.launch()

     del model
     gc.collect()
 def process_image_and_question(image, question):
     FinalOutput = ""
     model_id = "vikhyatk/moondream1"
         model = AutoModelForCausalLM.from_pretrained(model_id, trust_remote_code=True)
         tokenizer = Tokenizer.from_pretrained(model_id)
     enc_image = model.encode_image(image)
     FinalOutput += model.answer_question(enc_image, "how many people are there? also explain if the image is weird?", tokenizer)
     model_size = asizeof.asizeof(model)
     tokenizer_size = asizeof.asizeof(tokenizer)
+    FinalOutput += f"\n\nExpected Ram usage: +- 9.5 gb \nModel size in RAM: {model_size} bytes, Tokenizer size in RAM: {tokenizer_size} bytes"
+    #clear_model(model) #Not needed due to try except check
     #model load and set-up = 1 min and inference on CPU = 2 min
     return FinalOutput
                      inputs=[gr.Image(type="pil"), gr.Textbox(lines=2, placeholder="Ask a question about the image...")],
                      outputs="text",
                      title="Image Question Answering",
+                     description="Upload an image and ask a question about it. ( 3 - 4 min response time expected )")
 # Launch the interface
 iface.launch()