Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -2,13 +2,12 @@ import streamlit as st
|
|
2 |
from PIL import Image
|
3 |
import os
|
4 |
import base64
|
|
|
5 |
from helper import (
|
6 |
custom_file_uploader, resize_image, convert_image_to_base64, post_request_and_parse_response,
|
7 |
draw_bounding_boxes_for_textract, extract_text_from_textract_blocks, ChatGPTClient
|
8 |
)
|
9 |
-
import
|
10 |
-
import shutil
|
11 |
-
from pdf2image import convert_from_bytes
|
12 |
|
13 |
# Load OpenAI API Key from environment variable
|
14 |
OPENAI_API_KEY = os.environ["OPENAI_API_KEY"]
|
@@ -26,20 +25,26 @@ with st.sidebar:
|
|
26 |
|
27 |
# Display a placeholder for uploaded image
|
28 |
st.warning("Please upload an image or a single-page PDF file!")
|
29 |
-
uploaded_file = st.file_uploader("Upload an Image or PDF", type=['
|
30 |
|
31 |
pil_image = None
|
32 |
if uploaded_file:
|
33 |
# Handle PDF file
|
34 |
if uploaded_file.type == "application/pdf":
|
35 |
try:
|
36 |
-
# Read PDF as bytes
|
37 |
pdf_bytes = uploaded_file.read()
|
38 |
-
|
39 |
-
|
|
|
|
|
40 |
st.warning("Please upload a PDF with only one page!")
|
41 |
else:
|
42 |
-
|
|
|
|
|
|
|
|
|
43 |
except Exception as e:
|
44 |
st.error(f"Failed to convert PDF to image: {e}")
|
45 |
else:
|
|
|
2 |
from PIL import Image
|
3 |
import os
|
4 |
import base64
|
5 |
+
import fitz # PyMuPDF
|
6 |
from helper import (
|
7 |
custom_file_uploader, resize_image, convert_image_to_base64, post_request_and_parse_response,
|
8 |
draw_bounding_boxes_for_textract, extract_text_from_textract_blocks, ChatGPTClient
|
9 |
)
|
10 |
+
import io
|
|
|
|
|
11 |
|
12 |
# Load OpenAI API Key from environment variable
|
13 |
OPENAI_API_KEY = os.environ["OPENAI_API_KEY"]
|
|
|
25 |
|
26 |
# Display a placeholder for uploaded image
|
27 |
st.warning("Please upload an image or a single-page PDF file!")
|
28 |
+
uploaded_file = st.file_uploader("Upload an Image or PDF", type=['PDF'], label_visibility="collapsed")
|
29 |
|
30 |
pil_image = None
|
31 |
if uploaded_file:
|
32 |
# Handle PDF file
|
33 |
if uploaded_file.type == "application/pdf":
|
34 |
try:
|
35 |
+
# Read PDF as bytes
|
36 |
pdf_bytes = uploaded_file.read()
|
37 |
+
pdf_document = fitz.open(stream=pdf_bytes, filetype="pdf")
|
38 |
+
|
39 |
+
# Check if the PDF has only one page
|
40 |
+
if pdf_document.page_count != 1:
|
41 |
st.warning("Please upload a PDF with only one page!")
|
42 |
else:
|
43 |
+
# Convert the first page to an image
|
44 |
+
page = pdf_document.load_page(0)
|
45 |
+
pix = page.get_pixmap()
|
46 |
+
image_bytes = pix.tobytes()
|
47 |
+
pil_image = Image.open(io.BytesIO(image_bytes))
|
48 |
except Exception as e:
|
49 |
st.error(f"Failed to convert PDF to image: {e}")
|
50 |
else:
|