Fix app.py
Browse files
app.py
CHANGED
@@ -14,7 +14,7 @@ import pyminizip
|
|
14 |
import transformers
|
15 |
from transformers import AutoModel, AutoTokenizer
|
16 |
from huggingface_hub import hf_hub_download, snapshot_download
|
17 |
-
from PIL import Image
|
18 |
|
19 |
|
20 |
def unicode_normalize(cls, s):
|
@@ -150,7 +150,7 @@ class ClipTextModel(nn.Module):
|
|
150 |
|
151 |
@torch.no_grad()
|
152 |
def encode_text(self, texts, batch_size=8, max_length=64):
|
153 |
-
|
154 |
all_embeddings = []
|
155 |
iterator = range(0, len(texts), batch_size)
|
156 |
for batch_idx in iterator:
|
@@ -222,6 +222,7 @@ class ClipTextModel(nn.Module):
|
|
222 |
|
223 |
# @torch.no_grad()
|
224 |
# def encode_image(self, images, batch_size=8):
|
|
|
225 |
# all_embeddings = []
|
226 |
# iterator = range(0, len(images), batch_size)
|
227 |
# for batch_idx in iterator:
|
@@ -327,11 +328,11 @@ if "model" not in st.session_state:
|
|
327 |
|
328 |
print("extract dataset")
|
329 |
pyminizip.uncompress(
|
330 |
-
"
|
331 |
)
|
332 |
|
333 |
print("loading dataset")
|
334 |
-
df = pq.read_table("
|
335 |
columns=["page", "description", "image_url", "image_vector"]).to_pandas()
|
336 |
st.session_state.df = df
|
337 |
|
|
|
14 |
import transformers
|
15 |
from transformers import AutoModel, AutoTokenizer
|
16 |
from huggingface_hub import hf_hub_download, snapshot_download
|
17 |
+
# from PIL import Image
|
18 |
|
19 |
|
20 |
def unicode_normalize(cls, s):
|
|
|
150 |
|
151 |
@torch.no_grad()
|
152 |
def encode_text(self, texts, batch_size=8, max_length=64):
|
153 |
+
self.eval()
|
154 |
all_embeddings = []
|
155 |
iterator = range(0, len(texts), batch_size)
|
156 |
for batch_idx in iterator:
|
|
|
222 |
|
223 |
# @torch.no_grad()
|
224 |
# def encode_image(self, images, batch_size=8):
|
225 |
+
# self.eval()
|
226 |
# all_embeddings = []
|
227 |
# iterator = range(0, len(images), batch_size)
|
228 |
# for batch_idx in iterator:
|
|
|
328 |
|
329 |
print("extract dataset")
|
330 |
pyminizip.uncompress(
|
331 |
+
"clip_zeroshot_irasuto_image_items_20210224.pq.zip", st.secrets["ZIP_PASSWORD"], None, 1
|
332 |
)
|
333 |
|
334 |
print("loading dataset")
|
335 |
+
df = pq.read_table("clip_zeroshot_irasuto_image_items_20210224.parquet",
|
336 |
columns=["page", "description", "image_url", "image_vector"]).to_pandas()
|
337 |
st.session_state.df = df
|
338 |
|