Spaces:

tungedng2710
/

TonAI-OCR

Sleeping

App Files Files Community

tungedng2710 committed on Sep 19, 2024

Commit

db5ea6e

verified ·

1 Parent(s): 7a253ad

Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

README.md +58 -9
app.py +65 -0
requirements.txt +92 -0

README.md CHANGED Viewed

@@ -1,13 +1,62 @@
 ---
-title: TonAI OCR
-emoji: 📉
-colorFrom: green
-colorTo: green
-sdk: gradio
-sdk_version: 4.44.0
 app_file: app.py
-pinned: false
-license: apache-2.0
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: TonAI-OCR
 app_file: app.py
+sdk: gradio
+colorTo: purple
+sdk_version: 4.31.2
 ---
+# TonAI Text Recognition
+### A simple OCR Python library
+![ONNX](https://a11ybadges.com/badge?logo=onnx) ![Python](https://a11ybadges.com/badge?logo=python) ![PyPI](https://a11ybadges.com/badge?logo=pypi)
+Text detection with text recognition
+![](stuffs/demo2.jpg)
+Vietnam military vehicle license plate
+![](stuffs/ocr_plate.jpg)
+## Installation
+Install via PyPI
+```
+pip install ton-ocr
+```
+## Usage example
+```
+# Minimal end-to-end example: run the OCR pipeline on one image, draw every
+# detected text polygon and its recognized string, then display the result.
+import cv2
+import numpy as np
+from ton_ocr import TonOCRPipeline
+image_path = "stuffs/example.jpg"
+image = cv2.imread(image_path)
+# Build the pipeline once; the same instance serves the predict() call below.
+ocr = TonOCRPipeline()
+results = ocr.predict(image)
+for result in results:
+    # Each result exposes the four attributes read below.
+    bbox = result.box           # text bounding box
+    text = result.text          # text string
+    score = result.score        # OCR's confidence
+    img = result.img            # cropped text image
+    # Draw the bounding polygon
+    points = np.array(bbox, np.int32)
+    # cv2.polylines takes the vertices as an (N, 1, 2) int32 array.
+    points = points.reshape((-1, 1, 2))
+    color = (0, 255, 255)
+    is_closed = True
+    thickness = 2
+    cv2.polylines(image, [points], is_closed, color, thickness)
+    # Add OCR text to the image
+    font = cv2.FONT_HERSHEY_SIMPLEX
+    font_scale = 1
+    text_color = (0, 0, 255)
+    text_thickness = 2
+    # Anchor the label at the first vertex of the polygon.
+    first_point = tuple(points[0][0])
+    cv2.putText(image, text, first_point, font, font_scale, text_color, text_thickness)
+# Show the annotated image and block until a key is pressed.
+cv2.imshow('Image Window', image)
+cv2.waitKey(0)
+cv2.destroyAllWindows()
+```

app.py ADDED Viewed

	@@ -0,0 +1,65 @@

+import cv2
+import numpy as np
+import gradio as gr
+import warnings
+from ton_ocr import TonOCRPipeline
+# Suppress all warnings
+warnings.filterwarnings("ignore")
+def clear_image():
+        return None, None
+def ocr_image(image):
+    ocr = TonOCRPipeline()
+    image = cv2.cvtColor(image, cv2.COLOR_RGB2BGR)
+    results = ocr.predict(image)
+    for result in results:
+        bbox = result.box           # text bounding box
+        text = result.text          # text string
+        score = result.score        # OCR's confidence
+        img = result.img            # cropped text image
+        # Draw the bounding polygon
+        points = np.array(bbox, np.int32)
+        points = points.reshape((-1, 1, 2))
+        color = (0, 255, 255)
+        is_closed = True
+        thickness = 2
+        cv2.polylines(image, [points], is_closed, color, thickness)
+        # Add OCR text to the image
+        font = cv2.FONT_HERSHEY_SIMPLEX
+        font_scale = 1
+        text_color = (0, 0, 255)
+        text_thickness = 2
+        first_point = tuple(points[0][0])
+        cv2.putText(image, text, first_point, font, font_scale, text_color, text_thickness)
+    # Convert image from BGR to RGB for Gradio
+    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+    return image
+# Create the Gradio Blocks interface: a two-column layout with the input
+# image and its buttons in the first column and the result in the second.
+with gr.Blocks(theme=gr.Theme.from_hub("ParityError/Interstellar")) as demo:
+    gr.Markdown("# TonAI OCR - Nhận diện chữ trong ảnh")
+    with gr.Row():
+        # First column: image input (file upload or clipboard paste only)
+        # with the Submit and Clear buttons side by side below it.
+        with gr.Column():
+            image_input = gr.Image(sources = ['upload', 'clipboard'],
+                                   label="Input Image")
+            with gr.Row():
+                with gr.Column():
+                    submit_button = gr.Button("Submit")
+                with gr.Column():
+                    clear_button = gr.Button("Clear")
+        # Second column: annotated output image.
+        with gr.Column():
+            image_output = gr.Image(type="numpy", label="Output Image")
+            # Submit runs ocr_image on the input and shows its return value.
+            submit_button.click(fn=ocr_image, inputs=image_input, outputs=image_output)
+            # Clear takes no inputs; clear_image returns one None per
+            # component listed in outputs.
+            clear_button.click(fn=clear_image, outputs=[image_input, image_output])
+# Launch the interface, listening on all interfaces at a fixed port.
+# NOTE(review): hosted Gradio Spaces are usually served on port 7860;
+# confirm that the hard-coded 7862 is reachable in the target deployment.
+# NOTE(review): favicon_path is relative to the working directory; confirm
+# that stuffs/favicon.png is shipped with the app.
+demo.launch(server_name="0.0.0.0",
+            server_port=7862,
+            favicon_path="stuffs/favicon.png",
+            max_threads=99)

requirements.txt ADDED Viewed

	@@ -0,0 +1,92 @@

+aiofiles==23.2.1
+annotated-types==0.7.0
+anyio==4.4.0
+backports.tarfile==1.2.0
+build==1.2.2
+certifi==2024.8.30
+cffi==1.17.1
+charset-normalizer==3.3.2
+click==8.1.7
+coloredlogs==15.0.1
+contourpy==1.3.0
+cryptography==43.0.1
+cycler==0.12.1
+docutils==0.21.2
+exceptiongroup==1.2.2
+fastapi==0.115.0
+ffmpy==0.4.0
+filelock==3.16.1
+flatbuffers==24.3.25
+fonttools==4.53.1
+fsspec==2024.9.0
+gradio==4.44.0
+gradio_client==1.3.0
+h11==0.14.0
+httpcore==1.0.5
+httpx==0.27.2
+huggingface-hub==0.25.0
+humanfriendly==10.0
+idna==3.10
+importlib_metadata==8.5.0
+importlib_resources==6.4.5
+jaraco.classes==3.4.0
+jaraco.context==6.0.1
+jaraco.functools==4.0.2
+jeepney==0.8.0
+Jinja2==3.1.4
+keyring==25.3.0
+kiwisolver==1.4.7
+markdown-it-py==3.0.0
+MarkupSafe==2.1.5
+matplotlib==3.9.2
+mdurl==0.1.2
+more-itertools==10.5.0
+mpmath==1.3.0
+nh3==0.2.18
+numpy==2.1.1
+onnxruntime-gpu==1.19.2
+opencv-python==4.10.0.84
+orjson==3.10.7
+packaging==24.1
+pandas==2.2.2
+pillow==10.4.0
+pkginfo==1.10.0
+protobuf==5.28.1
+pyclipper==1.3.0.post5
+pycparser==2.22
+pydantic==2.9.2
+pydantic_core==2.23.4
+pydub==0.25.1
+Pygments==2.18.0
+pyparsing==3.1.4
+pyproject_hooks==1.1.0
+python-dateutil==2.9.0.post0
+python-multipart==0.0.9
+pytz==2024.2
+PyYAML==6.0.2
+readme_renderer==44.0
+requests==2.32.3
+requests-toolbelt==1.0.0
+rfc3986==2.0.0
+rich==13.8.1
+ruff==0.6.5
+SecretStorage==3.3.3
+semantic-version==2.10.0
+shapely==2.0.6
+shellingham==1.5.4
+six==1.16.0
+sniffio==1.3.1
+starlette==0.38.5
+sympy==1.13.2
+tomli==2.0.1
+tomlkit==0.12.0
+ton_ocr==0.2.1
+tqdm==4.66.5
+twine==5.1.1
+typer==0.12.5
+typing_extensions==4.12.2
+tzdata==2024.1
+urllib3==2.2.3
+uvicorn==0.30.6
+websockets==12.0
+zipp==3.20.2