Spaces:

junyangwang0410
/

Mobile-Agent

Running

App Files Community

junyangwang0410 committed on Jun 27, 2024

Commit

b4af017

verified ·

1 Parent(s): 43c0e1c

Update MobileAgent/crop.py

Browse files

Files changed (1) hide show

MobileAgent/crop.py +0 -52

MobileAgent/crop.py CHANGED Viewed

@@ -2,8 +2,6 @@ import math
 import cv2
 import numpy as np
 from PIL import Image, ImageDraw, ImageFont
-import clip
-import torch
 def crop_image(img, position):
@@ -89,53 +87,3 @@ def in_box(box, target):
         return True
     else:
         return False
-def crop_for_clip(image, box, i, position):
-    image = Image.open(image)
-    w, h = image.size
-    if position == "left":
-        bound = [0, 0, w/2, h]
-    elif position == "right":
-        bound = [w/2, 0, w, h]
-    elif position == "top":
-        bound = [0, 0, w, h/2]
-    elif position == "bottom":
-        bound = [0, h/2, w, h]
-    elif position == "top left":
-        bound = [0, 0, w/2, h/2]
-    elif position == "top right":
-        bound = [w/2, 0, w, h/2]
-    elif position == "bottom left":
-        bound = [0, h/2, w/2, h]
-    elif position == "bottom right":
-        bound = [w/2, h/2, w, h]
-    else:
-        bound = [0, 0, w, h]
-    if in_box(box, bound):
-        cropped_image = image.crop(box)
-        cropped_image.save(f"./temp/{i}.jpg")
-        return True
-    else:
-        return False
-def clip_for_icon(clip_model, clip_preprocess, images, prompt):
-    image_features = []
-    for image_file in images:
-        image = clip_preprocess(Image.open(image_file)).unsqueeze(0).to(next(clip_model.parameters()).device)
-        image_feature = clip_model.encode_image(image)
-        image_features.append(image_feature)
-    image_features = torch.cat(image_features)
-    text = clip.tokenize([prompt]).to(next(clip_model.parameters()).device)
-    text_features = clip_model.encode_text(text)
-    image_features /= image_features.norm(dim=-1, keepdim=True)
-    text_features /= text_features.norm(dim=-1, keepdim=True)
-    similarity = (100.0 * image_features @ text_features.T).softmax(dim=0).squeeze(0)
-    _, max_pos = torch.max(similarity, dim=0)
-    pos = max_pos.item()
-    return pos

 import cv2
 import numpy as np
 from PIL import Image, ImageDraw, ImageFont
 def crop_image(img, position):
         return True
     else:
         return False