Spaces:

eagle0504
/

ocr-basics

Sleeping

App Files Files Community

eagle0504 committed on Oct 18, 2024

Commit

28e97a7

verified ·

1 Parent(s): 629124e

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -8

app.py CHANGED Viewed

@@ -2,13 +2,12 @@ import streamlit as st
 from PIL import Image
 import os
 import base64
 from helper import (
     custom_file_uploader, resize_image, convert_image_to_base64, post_request_and_parse_response,
     draw_bounding_boxes_for_textract, extract_text_from_textract_blocks, ChatGPTClient
 )
-import tempfile
-import shutil
-from pdf2image import convert_from_bytes
 # Load OpenAI API Key from environment variable
 OPENAI_API_KEY = os.environ["OPENAI_API_KEY"]
@@ -26,20 +25,26 @@ with st.sidebar:
     # Display a placeholder for uploaded image
     st.warning("Please upload an image or a single-page PDF file!")
-    uploaded_file = st.file_uploader("Upload an Image or PDF", type=['TXT', 'PDF'], label_visibility="collapsed")
     pil_image = None
     if uploaded_file:
         # Handle PDF file
         if uploaded_file.type == "application/pdf":
             try:
-                # Read PDF as bytes and convert to image directly
                 pdf_bytes = uploaded_file.read()
-                pages = convert_from_bytes(pdf_bytes, dpi=200)
-                if len(pages) != 1:
                     st.warning("Please upload a PDF with only one page!")
                 else:
-                    pil_image = pages[0]
             except Exception as e:
                 st.error(f"Failed to convert PDF to image: {e}")
         else:

 from PIL import Image
 import os
 import base64
+import fitz  # PyMuPDF
 from helper import (
     custom_file_uploader, resize_image, convert_image_to_base64, post_request_and_parse_response,
     draw_bounding_boxes_for_textract, extract_text_from_textract_blocks, ChatGPTClient
 )
+import io
 # Load OpenAI API Key from environment variable
 OPENAI_API_KEY = os.environ["OPENAI_API_KEY"]
     # Display a placeholder for uploaded image
     st.warning("Please upload an image or a single-page PDF file!")
+    uploaded_file = st.file_uploader("Upload an Image or PDF", type=['PDF'], label_visibility="collapsed")
     pil_image = None
     if uploaded_file:
         # Handle PDF file
         if uploaded_file.type == "application/pdf":
             try:
+                # Read PDF as bytes
                 pdf_bytes = uploaded_file.read()
+                pdf_document = fitz.open(stream=pdf_bytes, filetype="pdf")
+                # Check if the PDF has only one page
+                if pdf_document.page_count != 1:
                     st.warning("Please upload a PDF with only one page!")
                 else:
+                    # Convert the first page to an image
+                    page = pdf_document.load_page(0)
+                    pix = page.get_pixmap()
+                    image_bytes = pix.tobytes()
+                    pil_image = Image.open(io.BytesIO(image_bytes))
             except Exception as e:
                 st.error(f"Failed to convert PDF to image: {e}")
         else: