Spaces:

mangalathkedar
/

image_recog

Sleeping

App Files Community

mangalathkedar committed on Nov 29, 2024

Commit

c313d0c

verified ·

1 Parent(s): f7dd71a

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -21

app.py CHANGED Viewed

@@ -1,17 +1,14 @@
 import base64
 import streamlit as st
-from openai import OpenAI
-import pdf2image
 from PIL import Image
 import io
 import tempfile
-# Load environment variables
-# Initialize OpenAI client
-client = OpenAI()
 def convert_pdf_to_images(pdf_file):
     """Convert PDF to list of images"""
@@ -19,9 +16,13 @@ def convert_pdf_to_images(pdf_file):
         tmp_file.write(pdf_file.getvalue())
         pdf_path = tmp_file.name
-    images = pdf2image.convert_from_path(pdf_path)
-    os.unlink(pdf_path)
-    return images
 def format_response(text):
     """Format the analysis response with clean styling"""
@@ -38,7 +39,7 @@ def format_response(text):
     # Split into pages
     pages = text.split("Page")
-    for page_num, page_content in enumerate(pages[1:], 1):  # Skip first empty split
         # Add page header
         formatted_text += f'<div style="margin-bottom: 30px;">'
         formatted_text += f'<h3 style="color: #2c3e50; margin-bottom: 15px;">Page {page_num}</h3>'
@@ -46,9 +47,7 @@ def format_response(text):
         # Process each line
         lines = page_content.split('\n')
         for line in lines:
-            # Skip empty lines and lines with asterisks
             if line.strip() and not line.strip().startswith('*') and not line.strip().startswith('Here'):
-                # Remove asterisks and dashes
                 line = line.replace('**', '').replace('- ', '')
                 if ':' in line:
@@ -60,7 +59,6 @@ def format_response(text):
         formatted_text += '</div>'
-        # Add separator between pages except for the last page
         if page_num < len(pages) - 1:
             formatted_text += '<hr style="border: 1px solid #eee; margin: 20px 0;">'
@@ -76,8 +74,8 @@ def analyze_image(image):
         base64_image = base64.b64encode(img_byte_arr).decode("utf-8")
-        response = client.chat.completions.create(
-            model="gpt-4o-mini",
             messages=[
                 {
                     "role": "user",
@@ -106,14 +104,14 @@ def analyze_image(image):
             max_tokens=1000
         )
-        return response.choices[0].message.content
     except Exception as e:
         return f"An error occurred: {str(e)}"
 def main():
     st.set_page_config(page_title="Document Analysis App", layout="wide")
-    # Custom CSS to set light background and improve button styling
     st.markdown("""
         <style>
         .stApp {
@@ -146,7 +144,6 @@ def main():
         if uploaded_file is not None:
             if uploaded_file.type == "application/pdf":
-                # Handle PDF
                 with st.spinner("Processing PDF..."):
                     images = convert_pdf_to_images(uploaded_file)
@@ -161,7 +158,6 @@ def main():
                             st.markdown(format_response(combined_results), unsafe_allow_html=True)
             else:
-                # Handle single image
                 image = Image.open(uploaded_file)
                 if st.button("Extract Information"):

 import base64
 import streamlit as st
+import openai
+import os
 from PIL import Image
 import io
 import tempfile
+import pdf2image
+# Set OpenAI API key from Streamlit secrets
+openai.api_key = st.secrets["OPENAI_API_KEY"]
 def convert_pdf_to_images(pdf_file):
     """Convert PDF to list of images"""
         tmp_file.write(pdf_file.getvalue())
         pdf_path = tmp_file.name
+    try:
+        images = pdf2image.convert_from_path(pdf_path)
+        os.unlink(pdf_path)
+        return images
+    except Exception as e:
+        st.error(f"Error converting PDF: {str(e)}")
+        return []
 def format_response(text):
     """Format the analysis response with clean styling"""
     # Split into pages
     pages = text.split("Page")
+    for page_num, page_content in enumerate(pages[1:], 1):
         # Add page header
         formatted_text += f'<div style="margin-bottom: 30px;">'
         formatted_text += f'<h3 style="color: #2c3e50; margin-bottom: 15px;">Page {page_num}</h3>'
         # Process each line
         lines = page_content.split('\n')
         for line in lines:
             if line.strip() and not line.strip().startswith('*') and not line.strip().startswith('Here'):
                 line = line.replace('**', '').replace('- ', '')
                 if ':' in line:
         formatted_text += '</div>'
         if page_num < len(pages) - 1:
             formatted_text += '<hr style="border: 1px solid #eee; margin: 20px 0;">'
         base64_image = base64.b64encode(img_byte_arr).decode("utf-8")
+        response = openai.ChatCompletion.create(
+            model="gpt-4-vision-preview",
             messages=[
                 {
                     "role": "user",
             max_tokens=1000
         )
+        return response.choices[0].message['content']
     except Exception as e:
+        st.error(f"API Error: {str(e)}")
         return f"An error occurred: {str(e)}"
 def main():
     st.set_page_config(page_title="Document Analysis App", layout="wide")
     st.markdown("""
         <style>
         .stApp {
         if uploaded_file is not None:
             if uploaded_file.type == "application/pdf":
                 with st.spinner("Processing PDF..."):
                     images = convert_pdf_to_images(uploaded_file)
                             st.markdown(format_response(combined_results), unsafe_allow_html=True)
             else:
                 image = Image.open(uploaded_file)
                 if st.button("Extract Information"):