ydshieh committed
Commit 9a6a97f
1 Parent(s): 943681e

upload more samples

app.py CHANGED
@@ -21,34 +21,24 @@ st.sidebar.title("Select a sample image")
 
 sample_name = st.sidebar.selectbox(
     "Please Choose the Model",
-    (
-        "sample 1",
-        "sample 2",
-        "sample 3",
-        "sample 4"
-    )
+    sample_fns
 )
 
-sample_name = f'sample_{sample_name.split()[-1].zfill(2)}.jpg'
-sample_path = f'samples/{sample_name}'
+sample_name = f"COCO_val2014_{sample_name.replace('.jpg', '').zfill(12)}.jpg"
+sample_path = os.path.join(sample_dir, sample_name)
 
 image = Image.open(sample_path)
 show = st.image(image, use_column_width=True)
-show.image(image, 'Uploaded Image', use_column_width=True)
-
+show.image(image, 'Selected Image', use_column_width=True)
 
 # For newline
 st.sidebar.write('\n')
 
-# if st.sidebar.button("Click here to get image caption"):
-
 with st.spinner('Generating image caption ...'):
 
-    caption, tokens, token_ids = predict_dummy(image)
-
+    caption = predict_dummy(image)
+    image.close()
     st.success(f'caption: {caption}')
-    st.success(f'tokens: {tokens}')
-    st.success(f'token ids: {token_ids}')
 
 st.sidebar.header("ViT-GPT2 predicts:")
 st.sidebar.write(f"caption: {caption}", '\n')
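For reference, a minimal standalone sketch (not part of the commit) of the filename round-trip the new selectbox relies on: model.py strips the 'COCO_val2014_' prefix and leading zeros to build short labels, and app.py pads the chosen label back to twelve digits to recover the file on disk. The names short_label, stem and full_name are hypothetical, used only for illustration.

# Hypothetical round-trip between the sidebar label and the COCO filename.
short_label = '581632.jpg'                        # label as built in model.py
stem = short_label.replace('.jpg', '')            # '581632'
full_name = f"COCO_val2014_{stem.zfill(12)}.jpg"  # pad back to 12 digits
assert full_name == 'COCO_val2014_000000581632.jpg'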
model.py CHANGED
@@ -53,18 +53,21 @@ def predict(image):
     token_ids = np.array(generation.sequences)[0]
     caption = tokenizer.decode(token_ids)
 
-    return caption, token_ids
+    return caption
 
-def init():
+def compile():
 
     image_path = 'samples/val_000000039769.jpg'
     image = Image.open(image_path)
 
-    caption, token_ids = predict(image)
+    caption = predict(image)
     image.close()
 
 def predict_dummy(image):
 
-    return 'dummy caption!', ['dummy', 'caption', '!'], [1, 2, 3]
+    return 'dummy caption!'
 
-init()
+compile()
+
+sample_dir = './samples/'
+sample_fns = tuple([f"{int(f.replace('COCO_val2014_', '').replace('.jpg', ''))}.jpg" for f in os.listdir(sample_dir) if f.startswith('COCO_val2014_')])
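As a quick illustration of the new sample_fns listing, here is a hedged standalone reproduction of the construction added at the bottom of model.py. It assumes a local ./samples/ directory containing the COCO files added in this commit; it is a sketch, not the Space's code.

# Standalone reproduction of the sample_fns construction in model.py.
import os

sample_dir = './samples/'
sample_fns = tuple(
    f"{int(f.replace('COCO_val2014_', '').replace('.jpg', ''))}.jpg"
    for f in os.listdir(sample_dir)
    if f.startswith('COCO_val2014_')
)
# e.g. 'COCO_val2014_000000581632.jpg' -> '581632.jpg'; app.py zero-pads the
# selected label back to twelve digits to recover the original filename.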
samples/COCO_val2014_000000581632.jpg ADDED
samples/COCO_val2014_000000581654.jpg ADDED
samples/COCO_val2014_000000581655.jpg ADDED
samples/COCO_val2014_000000581683.jpg ADDED
samples/COCO_val2014_000000581702.jpg ADDED
samples/COCO_val2014_000000581717.jpg ADDED
samples/COCO_val2014_000000581726.jpg ADDED
samples/COCO_val2014_000000581731.jpg ADDED
samples/COCO_val2014_000000581736.jpg ADDED
samples/COCO_val2014_000000581749.jpg ADDED
samples/COCO_val2014_000000581781.jpg ADDED
samples/COCO_val2014_000000581827.jpg ADDED
samples/COCO_val2014_000000581829.jpg ADDED
samples/COCO_val2014_000000581831.jpg ADDED
samples/COCO_val2014_000000581863.jpg ADDED
samples/COCO_val2014_000000581886.jpg ADDED
samples/COCO_val2014_000000581887.jpg ADDED
samples/COCO_val2014_000000581899.jpg ADDED
samples/COCO_val2014_000000581913.jpg ADDED
samples/COCO_val2014_000000581929.jpg ADDED