Spaces:

not-lain
/

utils

Sleeping

utils / app.py

add pdf to text

c982cf8 about 2 months ago

692 Bytes

	import gradio as gr
	from pdf2image import convert_from_path
	import pdfplumber

	def convert_pdf_to_image(file):
	images = convert_from_path(file)
	return images

	def extract_text_from_pdf(file):
	text = ""
	with pdfplumber.open(file) as pdf:
	for page in pdf.pages:
	text += page.extract_text()
	return text

	pdf_to_img = gr.Interface(convert_pdf_to_image, gr.File(), gr.Gallery(), api_name="pdf_to_img")
	pdf_to_text = gr.Interface(extract_text_from_pdf, gr.File(), gr.Textbox(placeholder="Extracted text will appear here"), api_name="pdf_to_text")

	demo = gr.TabbedInterface([pdf_to_img, pdf_to_text], ["PDF to Image", "Extract Text"])
	demo.launch(debug=True)