Vivien committed
Commit c81898a • 1 parent: 59898ea

Initial commit
Files changed (7)
  1. .gitattributes +1 -0
  2. README.md +4 -4
  3. app.py +78 -0
  4. data.csv +0 -0
  5. data2.csv +0 -0
  6. embeddings.npy +3 -0
  7. embeddings2.npy +3 -0
.gitattributes CHANGED
@@ -25,3 +25,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zstandard filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
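
This new rule routes the .npy embedding files through Git LFS, so the repository stores short text pointers (shown at the bottom of this commit) rather than the ~51 MB and ~16 MB binaries. A minimal sketch, illustrative rather than part of this commit, for checking whether a checkout holds the real array or still an unresolved pointer:

def is_lfs_pointer(path):
    # Real LFS pointers are tiny text files starting with the spec line
    # visible in the embeddings.npy diff below.
    with open(path, "rb") as f:
        return f.read(64).startswith(b"version https://git-lfs.github.com/spec/v1")

# If this prints True, run `git lfs pull` before launching the app.
print(is_lfs_pointer("embeddings.npy"))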
README.md CHANGED
@@ -1,11 +1,11 @@
 ---
-title: Clip
+title: Clip Demo
 emoji: 👍
-colorFrom: yellow
-colorTo: yellow
+colorFrom: indigo
+colorTo: blue
 sdk: streamlit
 app_file: app.py
-pinned: false
+pinned: true
 ---
 
 # Configuration
app.py ADDED
import numpy as np
import pandas as pd
import streamlit as st
from transformers import CLIPModel, CLIPProcessor, CLIPTextModel

# Cache the heavyweight objects across reruns; the hash_funcs entries tell
# Streamlit not to attempt hashing the model, processor, or data dictionaries.
@st.cache(show_spinner=False,
          hash_funcs={CLIPModel: lambda _: None,
                      CLIPTextModel: lambda _: None,
                      CLIPProcessor: lambda _: None,
                      dict: lambda _: None})
def load():
    model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
    text_model = CLIPTextModel.from_pretrained("openai/clip-vit-base-patch32")
    processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")
    # Corpus 0 is Unsplash, corpus 1 is TMDB: per-image metadata plus
    # precomputed image embeddings.
    df = {0: pd.read_csv('data.csv'), 1: pd.read_csv('data2.csv')}
    embeddings = {0: np.load('embeddings.npy'), 1: np.load('embeddings2.npy')}
    # L2-normalize the rows so that a dot product is a cosine similarity.
    for k in [0, 1]:
        embeddings[k] = embeddings[k] / np.linalg.norm(embeddings[k], axis=1, keepdims=True)
    return model, text_model, processor, df, embeddings

model, text_model, processor, df, embeddings = load()

source = {0: '\nSource: Unsplash', 1: '\nSource: The Movie Database (TMDB)'}

def get_html(url_list, height=200):
    # Render the results as a wrapping flexbox of thumbnails; each image is
    # wrapped in a link when one is available.
    html = "<div style='margin-top: 20px; max-width: 1200px; display: flex; flex-wrap: wrap; justify-content: space-evenly'>"
    for url, title, link in url_list:
        html2 = f"<img title='{title}' style='height: {height}px; margin: 5px' src='{url}'>"
        if len(link) > 0:
            html2 = f"<a href='{link}' target='_blank'>" + html2 + "</a>"
        html = html + html2
    html += "</div>"
    return html

def compute_text_embeddings(list_of_strings):
    inputs = processor(text=list_of_strings, return_tensors="pt", padding=True)
    # Project the pooled text features into CLIP's shared image-text space.
    return model.text_projection(text_model(**inputs).pooler_output)

@st.cache(show_spinner=False)
def image_search(query, corpus, n_results=24):
    text_embeddings = compute_text_embeddings([query]).detach().numpy()
    k = 0 if corpus == 'Unsplash' else 1
    # Score every image against the query and keep the top n_results indices.
    results = np.argsort((embeddings[k] @ text_embeddings.T)[:, 0])[-1:-n_results - 1:-1]
    return [(df[k].iloc[i]['path'],
             df[k].iloc[i]['tooltip'] + source[k],
             df[k].iloc[i]['link']) for i in results]

description = '''
# Semantic image search
Built with OpenAI's [CLIP](https://openai.com/blog/clip/) model, 🤗 Hugging Face's [transformers library](https://huggingface.co/transformers/), [Streamlit](https://streamlit.io/), and images from [Unsplash](https://unsplash.com/) and [The Movie Database (TMDB)](https://www.themoviedb.org/).
'''

def main():
    # Widen the layout, cap the text input width, and hide Streamlit chrome.
    st.markdown('''
                <style>
                .block-container{
                  max-width: 1200px;
                }
                .stTextInput{
                  max-width: 600px;
                }
                #MainMenu {
                  visibility: hidden;
                }
                footer {
                  visibility: hidden;
                }
                </style>''',
                unsafe_allow_html=True)
    st.sidebar.markdown(description)
    _, col1, col2, _ = st.columns([2, 10, 2, 2])
    query = col1.text_input('')
    corpus = col2.radio('', ["Unsplash", "Movies"])
    if len(query) > 0:
        results = image_search(query, corpus)
        st.markdown(get_html(results), unsafe_allow_html=True)

if __name__ == '__main__':
    main()
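
app.py only consumes embeddings.npy and embeddings2.npy; the commit does not show how they were produced. A plausible sketch of that precomputation, assuming local copies of the corpus images and the same checkpoint the app loads (the embed_images helper and the path list are hypothetical):

import numpy as np
from PIL import Image
from transformers import CLIPModel, CLIPProcessor

model = CLIPModel.from_pretrained("openai/clip-vit-base-patch32")
processor = CLIPProcessor.from_pretrained("openai/clip-vit-base-patch32")

def embed_images(image_paths, batch_size=32):
    chunks = []
    for i in range(0, len(image_paths), batch_size):
        images = [Image.open(p).convert("RGB") for p in image_paths[i:i + batch_size]]
        inputs = processor(images=images, return_tensors="pt")
        # get_image_features runs the vision tower plus CLIP's visual projection,
        # the image-side counterpart of compute_text_embeddings in app.py.
        chunks.append(model.get_image_features(**inputs).detach().numpy())
    return np.concatenate(chunks)

# np.save("embeddings.npy", embed_images(unsplash_paths))  # hypothetical path list

The app re-normalizes the rows at load time, so the precomputation would not need to.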
data.csv ADDED
The diff for this file is too large to render.
data2.csv ADDED
The diff for this file is too large to render.
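
Neither CSV renders here, but image_search fixes their minimum schema: each row must provide a path (the image URL rendered by get_html), a tooltip (hover text, suffixed with the corpus source), and a link (click-through target; an empty string disables the link). A purely illustrative row, since the real file contents are not shown:

import pandas as pd

row = pd.DataFrame([{
    "path": "https://example.com/thumb.jpg",  # hypothetical image URL
    "tooltip": "A dog catching a frisbee",    # hypothetical caption
    "link": "",                               # empty string = no <a> wrapper
}])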
embeddings.npy ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:9f8c171e32276739be6b020592edc8a2c06e029ff6505a9d1d4efe3cafa073bd
+size 51200128
embeddings2.npy ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:389f1012d8980c48d3e193dbed13435bbf249adc842c9e67c2ab1e3c5292cb76
+size 15739008
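
Both pointer sizes are consistent with float32 vectors of dimension 512 (the projection width of CLIP ViT-B/32) plus the usual 128-byte .npy version-1 header: (51200128 - 128) / (512 * 4) = 25,000 rows for the Unsplash corpus and (15739008 - 128) / (512 * 4) = 7,685 for TMDB. These row counts are inferred from that arithmetic, not stated anywhere in the commit; a quick check:

HEADER = 128   # typical .npy v1 header size (assumption)
ROW = 512 * 4  # one 512-dim float32 vector

for name, size in [("embeddings.npy", 51200128), ("embeddings2.npy", 15739008)]:
    rows, rem = divmod(size - HEADER, ROW)
    print(name, rows, "rows, exact" if rem == 0 else "rows, inexact")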