Spaces:

Cachoups
/

FinanceReport

Running

App Files Community

Cachoups committed on Sep 25, 2024

Commit

12cfba7

verified ·

1 Parent(s): 8fd6111

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -4

app.py CHANGED Viewed

@@ -12,7 +12,8 @@ import io
 # Initialize spaCy model
 nlp = spacy.load('en_core_web_sm')
 nlp.add_pipe('sentencizer')
 def split_in_sentences(text):
     doc = nlp(text)
     return [str(sent).strip() for sent in doc.sents]
@@ -44,6 +45,19 @@ def fin_ext_bis(text):
     results = fin_model_bis(split_in_sentences(text))
     return make_spans(text, results)
 def extract_and_paragraph(pdf1, pdf2, paragraph):
     if not pdf1 or not pdf2:
         return [], []
@@ -68,8 +82,6 @@ def extract_and_paragraph(pdf1, pdf2, paragraph):
     return paragraphs_1, paragraphs_2
-# Gradio interface setup
-PDF_FOLDER = "data"
 def process_paragraph_1_sum(paragraph):
                 try:
                     paragraph_index = int(paragraph.split(':')[0].replace('Paragraph ', '')) - 1
@@ -445,9 +457,10 @@ with gr.Blocks(theme='gradio/soft',js=js_func) as demo:
             # Upload PDFs
             with gr.Column():
                 gr.Markdown("### Step 1: Upload PDF Files")
                 pdf1 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 1")
                 pdf2 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 2")
             with gr.Column():
                 gr.Markdown("### Step 2: Extract and Display Paragraphs")
                 b1 = gr.Button("Extract and Display Paragraphs")

 # Initialize spaCy model
 nlp = spacy.load('en_core_web_sm')
 nlp.add_pipe('sentencizer')
+# Gradio interface setup
+PDF_FOLDER = "data"
 def split_in_sentences(text):
     doc = nlp(text)
     return [str(sent).strip() for sent in doc.sents]
     results = fin_model_bis(split_in_sentences(text))
     return make_spans(text, results)
+def upload_file_and_update_dropdown(file):
+    if file is not None:
+        # Save the file to the upload directory
+        file_path = os.path.join(PDF_FOLDER, file.name)
+        with open(file_path, "wb") as f:
+            f.write(file.read())
+        # Get the updated list of files
+        files = os.listdir(PDF_FOLDER)
+        return gr.Dropdown.update(choices=files), gr.Dropdown.update(choices=files)
+    return gr.Dropdown.update(choices=[]),gr.Dropdown.update(choices=[])
 def extract_and_paragraph(pdf1, pdf2, paragraph):
     if not pdf1 or not pdf2:
         return [], []
     return paragraphs_1, paragraphs_2
 def process_paragraph_1_sum(paragraph):
                 try:
                     paragraph_index = int(paragraph.split(':')[0].replace('Paragraph ', '')) - 1
             # Upload PDFs
             with gr.Column():
                 gr.Markdown("### Step 1: Upload PDF Files")
+                upload_button = gr.File(label="Upload files", file_types=[".pdf"])
                 pdf1 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 1")
                 pdf2 = gr.Dropdown(choices=get_pdf_files(PDF_FOLDER), label="Select PDF 2")
+                upload_button.upload(upload_file_and_update_dropdown, upload_button, [pdf1, pdf2])
             with gr.Column():
                 gr.Markdown("### Step 2: Extract and Display Paragraphs")
                 b1 = gr.Button("Extract and Display Paragraphs")