Spaces:

marinap
/

multilingual-image-search

Runtime error

marinap committed on May 11, 2023

Commit

bb5ec6d

1 Parent(s): 848a638

added resizing

Files changed (1) hide show

app.py CHANGED Viewed

@@ -21,9 +21,18 @@ embeddings = torch.tensor(embeddings)
 img_df = pd.read_csv('image_data.csv')
-def url2img(url):
     data = requests.get(url, allow_redirects = True).content
-    return Image.open(io.BytesIO(data))
 def find_topk(text):
@@ -34,10 +43,11 @@ def find_topk(text):
     text_data = model_multi.preprocess_text(text)
     text_features, text_embedding = model_multi.encode_text(text_data, return_features=True)
     sims = F.cosine_similarity(text_embedding, embeddings)
     vals, inds = sims.topk(top_k)
-    print(img_df)
     top_k_urls = img_df.iloc[inds]['photo_image_url'].values
     print('top_k_urls', top_k_urls)

 img_df = pd.read_csv('image_data.csv')
def url2img(url, resize=False, fix_height=200, timeout=10):
    """Download an image from *url* and return it as a PIL image.

    Args:
        url: Address of the image; redirects are followed.
        resize: When true, scale the image to ``fix_height`` pixels high,
            using the width that ``resize_wh`` computes from the original
            width and height.
        fix_height: Target height in pixels; only used when ``resize`` is set.
        timeout: Seconds to wait for the server before giving up.

    Returns:
        The opened image, resized if requested.
    """
    # requests has no default timeout; bounding the wait keeps a single
    # unresponsive host from stalling the caller forever.
    data = requests.get(url, allow_redirects=True, timeout=timeout).content
    img = Image.open(io.BytesIO(data))
    if resize:
        width, height = img.size
        new_w, new_h = resize_wh(width, height, fix_height)
        # Very narrow images can truncate to a width of 0, which is not a
        # usable target size, so keep at least one pixel.
        img = img.resize((max(1, new_w), new_h))
    return img
def resize_wh(w, h, fix_height):
    """Return the ``(width, height)`` that scales a ``w`` x ``h`` image to ``fix_height``.

    The width is ``fix_height`` times the original ``w / h`` ratio, truncated
    to an integer and never smaller than 1.

    Args:
        w: Original width.
        h: Original height; a value of 0 raises ``ZeroDivisionError``.
        fix_height: Desired height of the result.

    Returns:
        A ``(new_width, fix_height)`` tuple.
    """
    ratio = w / h
    # Truncation would yield 0 for very tall, narrow inputs (e.g. 1 x 1000
    # scaled to height 200); clamp so the size stays usable for resizing.
    w_n = max(1, int(fix_height * ratio))
    return w_n, fix_height
 def find_topk(text):
     text_data = model_multi.preprocess_text(text)
     text_features, text_embedding = model_multi.encode_text(text_data, return_features=True)
+    print('Got features', datetime.now().strftime("%H:%M:%S"))
     sims = F.cosine_similarity(text_embedding, embeddings)
     vals, inds = sims.topk(top_k)
     top_k_urls = img_df.iloc[inds]['photo_image_url'].values
     print('top_k_urls', top_k_urls)