not-lain committed on
Commit
5d2e8ec
·
1 Parent(s): 0772fb4

separate doc and docx

Browse files
Files changed (1) hide show
  1. app.py +19 -6
app.py CHANGED
@@ -405,11 +405,23 @@ pdf_to_text = gr.Interface(
405
  api_name="pdf_to_text",
406
  )
407
 
408
- doc_or_docx_to_text = gr.Interface(
409
- extract_text_from_doc_or_docx,
 
 
 
 
 
 
 
 
 
 
 
 
410
  gr.File(),
411
- gr.Textbox(placeholder="Extracted text from DOC or DOCX will appear here"),
412
- api_name="doc_or_docx_to_text",
413
  )
414
 
415
  # pptx_or_ppt_to_text = gr.Interface(
@@ -458,11 +470,12 @@ url_parser = gr.Interface(
458
  api_name="url_to_text",
459
  )
460
  demo = gr.TabbedInterface(
461
- [pdf_to_img, pdf_to_text, doc_or_docx_to_text, ppt_to_text, pptx_to_text, url_parser, str_to_json],
462
  [
463
  "PDF to Image",
464
  "Extract PDF Text",
465
- "Extract DOC/DOCX Text",
 
466
  "Extract PPT Text",
467
  "Extract PPTX Text",
468
  "Extract text from URL",
 
405
  api_name="pdf_to_text",
406
  )
407
 
408
+ # doc_or_docx_to_text = gr.Interface(
409
+ # extract_text_from_doc_or_docx,
410
+ # gr.File(),
411
+ # gr.Textbox(placeholder="Extracted text from DOC or DOCX will appear here"),
412
+ # api_name="doc_or_docx_to_text",
413
+ # )
414
+ doc_to_txt = gr.Interface(
415
+ convert_doc_to_text,
416
+ gr.File(),
417
+ gr.Textbox(),
418
+ api_name="doc_to_txt"
419
+ )
420
+ docx_to_txt = gr.Interface(
421
+ extract_text_from_docx,
422
  gr.File(),
423
+ gr.Textbox(),
424
+ api_name="docx_to_txt"
425
  )
426
 
427
  # pptx_or_ppt_to_text = gr.Interface(
 
470
  api_name="url_to_text",
471
  )
472
  demo = gr.TabbedInterface(
473
+ [pdf_to_img, pdf_to_text, doc_to_txt, docx_to_txt , ppt_to_text, pptx_to_text, url_parser, str_to_json],
474
  [
475
  "PDF to Image",
476
  "Extract PDF Text",
477
+ "Extract DOC Text",
478
+ "Extract DOCX Text",
479
  "Extract PPT Text",
480
  "Extract PPTX Text",
481
  "Extract text from URL",