GOT_official_online_demo

Sleeping

App Files Files Community

acharyaaditya26 committed on Nov 25, 2024

Commit

3c5823e

verified ·

1 Parent(s): 6101e9e

Update app.py

Browse files

Files changed (1) hide show

app.py +35 -16

app.py CHANGED Viewed

@@ -12,6 +12,11 @@ import time
 import shutil
 from pathlib import Path
 import json
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained('ucaslcl/GOT-OCR2_0', trust_remote_code=True)
@@ -45,40 +50,53 @@ def run_GOT(pdf_file):
     unique_id = str(uuid.uuid4())
     pdf_path = os.path.join(UPLOAD_FOLDER, f"{unique_id}.pdf")
     shutil.copy(pdf_file, pdf_path)
     images = pdf_to_images(pdf_path)
     results = []
     try:
         for i, image in enumerate(images):
             image_path = os.path.join(UPLOAD_FOLDER, f"{unique_id}_page_{i+1}.png")
             image.save(image_path)
             result_path = os.path.join(RESULTS_FOLDER, f"{unique_id}_page_{i+1}.html")
             res = model.chat_crop(tokenizer, image_path, ocr_type='format', render=True, save_render_file=result_path)
             # Read the rendered HTML content
-            with open(result_path, 'r') as f:
-                html_content = f.read()
             results.append({
                 "page_number": i + 1,
                 "text": res,
-                "html": html_content
             })
             if os.path.exists(image_path):
                 os.remove(image_path)
             if os.path.exists(result_path):
                 os.remove(result_path)
     except Exception as e:
         return f"Error: {str(e)}", None
     finally:
         if os.path.exists(pdf_path):
             os.remove(pdf_path)
-    return json.dumps(results, indent=4)
 def cleanup_old_files():
     current_time = time.time()
@@ -92,16 +110,17 @@ with gr.Blocks() as demo:
         with gr.Column():
             pdf_input = gr.File(type="filepath", label="Upload your PDF")
             submit_button = gr.Button("Submit")
         with gr.Column():
-            ocr_result = gr.JSON(label="GOT output")
     submit_button.click(
         run_GOT,
         inputs=[pdf_input],
-        outputs=[ocr_result]
     )
 if __name__ == "__main__":
     cleanup_old_files()
-    demo.launch()

 import shutil
 from pathlib import Path
 import json
+import logging
+# Set up logging
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained('ucaslcl/GOT-OCR2_0', trust_remote_code=True)
     unique_id = str(uuid.uuid4())
     pdf_path = os.path.join(UPLOAD_FOLDER, f"{unique_id}.pdf")
     shutil.copy(pdf_file, pdf_path)
     images = pdf_to_images(pdf_path)
     results = []
+    html_content = "<html><body>"
     try:
         for i, image in enumerate(images):
             image_path = os.path.join(UPLOAD_FOLDER, f"{unique_id}_page_{i+1}.png")
             image.save(image_path)
             result_path = os.path.join(RESULTS_FOLDER, f"{unique_id}_page_{i+1}.html")
+            logger.info(f"Processing page {i+1}...")
             res = model.chat_crop(tokenizer, image_path, ocr_type='format', render=True, save_render_file=result_path)
             # Read the rendered HTML content
+            if os.path.exists(result_path):
+                with open(result_path, 'r') as f:
+                    page_html_content = f.read()
+                logger.info(f"HTML content for page {i+1} read successfully.")
+            else:
+                logger.error(f"HTML file for page {i+1} not found at {result_path}.")
+                page_html_content = ""
             results.append({
                 "page_number": i + 1,
                 "text": res,
+                "html": page_html_content
             })
+            html_content += f"<h2>Page {i + 1}</h2>"
+            html_content += page_html_content + "<br><hr><br>"  # Add a separator between pages
             if os.path.exists(image_path):
                 os.remove(image_path)
             if os.path.exists(result_path):
                 os.remove(result_path)
     except Exception as e:
+        logger.error(f"Error occurred: {str(e)}")
         return f"Error: {str(e)}", None
     finally:
         if os.path.exists(pdf_path):
             os.remove(pdf_path)
+    html_content += "</body></html>"
+    logger.info(f"Final HTML content: {html_content}")  # Log the final HTML content for debugging
+    return json.dumps(results, indent=4), html_content
 def cleanup_old_files():
     current_time = time.time()
         with gr.Column():
             pdf_input = gr.File(type="filepath", label="Upload your PDF")
             submit_button = gr.Button("Submit")
         with gr.Column():
+            ocr_result = gr.JSON(label="GOT output (JSON)")
+            html_result = gr.HTML(label="GOT output (HTML)")
     submit_button.click(
         run_GOT,
         inputs=[pdf_input],
+        outputs=[ocr_result, html_result]
     )
 if __name__ == "__main__":
     cleanup_old_files()
+    demo.launch()