Spaces:
Sleeping
Sleeping
File size: 457 Bytes
5f81bcf |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 |
import PyPDF2
import re
def extract_text_from_pdf(pdf_file):
    """Return the concatenated text of every page in a PDF.

    Args:
        pdf_file: The PDF source, passed unchanged to ``PyPDF2.PdfReader``.

    Returns:
        The text of all pages joined in page order with no separator.
        An empty string is returned when the document has no pages or
        no page yields any text.
    """
    reader = PyPDF2.PdfReader(pdf_file)
    # Treat a page that yields nothing (None or "") as empty so that one
    # text-less page cannot abort the whole extraction, and build the
    # result with a single join instead of repeated ``+=``.
    return "".join(page.extract_text() or "" for page in reader.pages)
def clean_text(text):
    """Normalize whitespace in *text*.

    Every run of whitespace characters is collapsed into a single space,
    then leading and trailing whitespace is removed.
    """
    return re.sub(r'\s+', ' ', text).strip()
def parse_resume(pdf_file):
    """Extract the text of a PDF and return it whitespace-normalized.

    The file is first passed to ``extract_text_from_pdf``; the resulting
    raw text is then run through ``clean_text`` and returned.
    """
    return clean_text(extract_text_from_pdf(pdf_file))
|