Spaces:

Tonic
/

GOT-OCR

Running on Zero

Tonic committed on Sep 13, 2024

Commit

1a87a19

unverified ·

1 Parent(s): 40d5755

do it normally

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,8 +5,10 @@ import os
 import base64
 import spaces
 import io
-from PIL import Image
 import numpy as np
 title = """# 🙋🏻‍♂️Welcome to Tonic's🫴🏻📸GOT-OCR"""
 description = """"
@@ -52,12 +54,24 @@ model.config.pad_token_id = tokenizer.eos_token_id
 #     image.save(buffered, format="PNG")
 #     return base64.b64encode(buffered.getvalue()).decode()
 @spaces.GPU
-def process_image(image, task, ocr_type=None, ocr_box=None, ocr_color=None):
     try:
-        if image is None:
             return "No image provided", None
         if task == "Plain Text OCR":
             res = model.chat(tokenizer, image, ocr_type='ocr')
         elif task == "Format Text OCR":
@@ -74,6 +88,8 @@ def process_image(image, task, ocr_type=None, ocr_box=None, ocr_color=None):
                 html_content = f.read()
             return res, html_content
         return res, None
     except Exception as e:
         return str(e), None

 import base64
 import spaces
 import io
 import numpy as np
+from PIL import Image
+import io
 title = """# 🙋🏻‍♂️Welcome to Tonic's🫴🏻📸GOT-OCR"""
 description = """"
 #     image.save(buffered, format="PNG")
 #     return base64.b64encode(buffered.getvalue()).decode()
+def numpy_to_pil(image_np):
+    return Image.fromarray(image_np.astype('uint8'), 'RGB')
 @spaces.GPU
+def process_image(image_np, task, ocr_type=None, ocr_box=None, ocr_color=None):
     try:
+        if image_np is None:
             return "No image provided", None
+        image = numpy_to_pil(image_np)
+        with io.BytesIO() as buffer:
+            image.save(buffer, format="PNG")
+            image_path = "/tmp/temp_image.png"
+            with open(image_path, "wb") as f:
+                f.write(buffer.getvalue())
         if task == "Plain Text OCR":
             res = model.chat(tokenizer, image, ocr_type='ocr')
         elif task == "Format Text OCR":
                 html_content = f.read()
             return res, html_content
+        os.remove(image_path)
         return res, None
     except Exception as e:
         return str(e), None