Add files.
- README.md +10 -5
- app.py +90 -0
- images/example-01-two-cats.jpg +0 -0
- images/example-02-two-cats.jpg +0 -0
- images/example-03-woman-with-pink-shirt-and-a-printer.jpg +0 -0
- images/example-04-printer-in-the-left.jpg +0 -0
- images/example-05-car-in-the-left-and-motorbike-in-the-right.jpg +0 -0
- requirements.txt +2 -0
README.md
CHANGED
```diff
@@ -1,13 +1,18 @@
 ---
-title:
-emoji:
-colorFrom:
-colorTo:
+title: Gradio Openai Clip Vit Large Patch14
+emoji: 🏢
+colorFrom: blue
+colorTo: yellow
 sdk: gradio
 sdk_version: 3.39.0
 app_file: app.py
 pinned: false
-license: openrail
+license: creativeml-openrail-m
 ---

 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+
+# Examples:
+
+## A. Input example:
+the photo contains one cat, the photo contains an animal, the photo contains two cats, the photo contains something else
```
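For reference, a minimal sketch of what the Space does with an input string like the one above: the text is split on commas into candidate labels and passed to a `transformers` zero-shot image classification pipeline (the image path is one of the example files added in this commit):

```python
from transformers import pipeline

# Zero-shot image classification with one of the CLIP checkpoints this Space uses.
pipe = pipeline(task="zero-shot-image-classification",
                model="openai/clip-vit-large-patch14")

labels = ("the photo contains one cat, the photo contains an animal,"
          " the photo contains two cats, the photo contains something else")

# The app splits the free-text input on commas to build the candidate labels.
predictions = pipe("images/example-01-two-cats.jpg",
                   candidate_labels=labels.split(","))
print(predictions)  # a list of {"score", "label"} dicts, sorted by score
```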
app.py
ADDED
@@ -0,0 +1,90 @@
```python
import os

import gradio as gr
from transformers import pipeline

# OpenAI CLIP ViT checkpoints offered in the model dropdown.
MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14 = "openai/clip-vit-large-patch14"
MODEL_OPENAI_CLIP_VIT_BASE_PATCH_16 = "openai/clip-vit-base-patch16"
MODEL_OPENAI_CLIP_VIT_BASE_PATCH_32 = "openai/clip-vit-base-patch32"

# Each example is [image path, comma-separated candidate labels, model name].
input_examples = [
    [
        os.path.join(os.path.dirname(__file__), "images/example-01-two-cats.jpg"),
        "the photo contains one cat,"
        "the photo contains an animal,"
        "the photo contains two cats,"
        "the photo contains something else",
        MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14,
    ],
    [
        os.path.join(os.path.dirname(__file__), "images/example-02-two-cats.jpg"),
        "the photo contains one cat,"
        "the photo contains an animal,"
        "the photo contains two cats,"
        "the photo contains something else",
        MODEL_OPENAI_CLIP_VIT_BASE_PATCH_16,
    ],
    [
        os.path.join(os.path.dirname(__file__), "images/example-03-woman-with-pink-shirt-and-a-printer.jpg"),
        "the photo contains a man and a printer,"
        "the photo contains a woman with blue shirt and a printer,"
        "the photo contains a woman and a printer,"
        "the photo contains a printer,"
        "the photo contains a woman with pink shirt and a printer,"
        "the photo contains something else",
        MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14,
    ],
    [
        os.path.join(os.path.dirname(__file__), "images/example-04-printer-in-the-left.jpg"),
        "the photo contains a printer in the left,"
        "the photo contains a printer in the right,"
        "the photo contains a printer in the middle,"
        "the photo contains something else",
        MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14,
    ],
    [
        os.path.join(os.path.dirname(__file__), "images/example-05-car-in-the-left-and-motorbike-in-the-right.jpg"),
        "the photo contains a car in the left and a motorbike in the right,"
        "the photo contains a car in the right and a motorbike in the left",
        MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14,
    ],
]


def launch(image_input, labels_input, dropdown_input):
    return predict(image_input, labels_input, dropdown_input)


def predict(image_input, labels_input, dropdown_input):
    # The free-text input is split on commas into candidate labels.
    labels_candidate = labels_input.split(",")

    # Build a zero-shot image classification pipeline for the selected model.
    pipe = pipeline(task="zero-shot-image-classification", model=dropdown_input)

    predictions = pipe(image_input, candidate_labels=labels_candidate)

    return {p["label"]: p["score"] for p in predictions}


# SYSTEM INPUTS
image_input = gr.Image(label="Upload image candidate", type="filepath")
text_input = gr.Textbox(type="text", label="Possible classes to detect.")
dropdown_input = gr.Dropdown(
    [
        MODEL_OPENAI_CLIP_VIT_LARGE_PATCH_14,
        MODEL_OPENAI_CLIP_VIT_BASE_PATCH_16,
        MODEL_OPENAI_CLIP_VIT_BASE_PATCH_32,
    ],
    label="OpenAI ClipVit Model",
)

# SYSTEM OUTPUTS
output_label = gr.Label()

demo = gr.Interface(
    launch,
    inputs=[image_input, text_input, dropdown_input],
    outputs=output_label,
    title="Demo about zero-shot-image-classification",
    examples=input_examples,
)

if __name__ == "__main__":
    demo.launch()
```
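One design note on `predict`: it rebuilds the `pipeline` on every call, so the selected model's weights are reloaded for each prediction. A minimal sketch of a per-model cache that avoids this (the `get_pipe` helper is hypothetical, not part of the committed app):

```python
from functools import lru_cache

from transformers import pipeline


@lru_cache(maxsize=3)  # at most one cached pipeline per CLIP variant
def get_pipe(model_name: str):
    return pipeline(task="zero-shot-image-classification", model=model_name)


def predict(image_input, labels_input, dropdown_input):
    labels_candidate = labels_input.split(",")
    pipe = get_pipe(dropdown_input)  # reuses the pipeline after the first call
    predictions = pipe(image_input, candidate_labels=labels_candidate)
    return {p["label"]: p["score"] for p in predictions}
```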
images/example-01-two-cats.jpg
ADDED
images/example-02-two-cats.jpg
ADDED
images/example-03-woman-with-pink-shirt-and-a-printer.jpg
ADDED
images/example-04-printer-in-the-left.jpg
ADDED
images/example-05-car-in-the-left-and-motorbike-in-the-right.jpg
ADDED
requirements.txt
ADDED
@@ -0,0 +1,2 @@
```text
transformers
torch
```
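Note that `gradio` itself is not listed: Spaces installs it from the `sdk` and `sdk_version` fields in the README front matter, so only the inference dependencies belong here. Pinning them is optional but makes rebuilds reproducible, for example (versions below are illustrative, not ones this Space was tested against):

```text
transformers==4.31.0
torch==2.0.1
```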