Spaces:

MJobe
/

document-vqa-v2

Sleeping

App Files Files Community

MJobe commited on Dec 12, 2023

Commit

f8ec4b3

•

1 Parent(s): 6bbd3ca

Update main.py

Browse files

Files changed (1) hide show

main.py +35 -4

main.py CHANGED Viewed

@@ -3,20 +3,23 @@ from io import BytesIO
 from PIL import Image
 from fastapi import FastAPI, File, UploadFile, Form
 from fastapi.responses import JSONResponse
-from pytesseract import pytesseract
 from transformers import pipeline
 app = FastAPI()
 # Load a BERT-based question answering pipeline
-nlp = pipeline('question-answering', model='bert-large-uncased-whole-word-masking-finetuned-squad')
 description = """
 ## Image-based Document QA
 This API extracts text from an uploaded image using OCR and performs document question answering using a BERT-based model.
-### Endpoint:
 - **POST /uploadfile/:** Upload an image file to extract text and answer provided questions.
 """
 app = FastAPI(docs_url="/", description=description)
@@ -42,7 +45,35 @@ async def perform_document_qa(
         # Perform document question answering for each question using BERT-based model
         answers_dict = {}
         for question in question_list:
-            result = nlp({
                 'question': question,
                 'context': text_content
             })

 from PIL import Image
 from fastapi import FastAPI, File, UploadFile, Form
 from fastapi.responses import JSONResponse
+import fitz
 from transformers import pipeline
+import requests
+from typing import List
 app = FastAPI()
 # Load a BERT-based question answering pipeline
+nlp_qa = pipeline('question-answering', model='bert-large-uncased-whole-word-masking-finetuned-squad')
 description = """
 ## Image-based Document QA
 This API extracts text from an uploaded image using OCR and performs document question answering using a BERT-based model.
+### Endpoints:
 - **POST /uploadfile/:** Upload an image file to extract text and answer provided questions.
+- **POST /pdfUpload/:** Provide a file to extract text and answer provided questions.
 """
 app = FastAPI(docs_url="/", description=description)
         # Perform document question answering for each question using BERT-based model
         answers_dict = {}
         for question in question_list:
+            result = nlp_qa({
+                'question': question,
+                'context': text_content
+            })
+            answers_dict[question] = result['answer']
+        return answers_dict
+    except Exception as e:
+        return JSONResponse(content=f"Error processing file: {str(e)}", status_code=500)
+@app.post("/pdfUpload/", description=description)
+async def load_file(
+    file: UploadFile = File(...),
+    questions: str = Form(...),
+):
+    try:
+        # Read the uploaded file
+        contents = await file.read()
+        # Convert binary content to text
+        text_content = contents.decode('utf-8')
+        # Split the questions string into a list
+        question_list = [q.strip() for q in questions.split(',')]
+        # Perform document question answering for each question using BERT-based model
+        answers_dict = {}
+        for question in question_list:
+            result = nlp_qa({
                 'question': question,
                 'context': text_content
             })