PirateXX committed on
Commit
c6a55b0
·
1 Parent(s): 94abe9f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +13 -1
app.py CHANGED
@@ -60,7 +60,19 @@ def findRealProb(text):
60
  realProb = ans/len(text)
61
  return {"Real": realProb, "Fake": 1-realProb, "results": results, "text": text}
62
 
63
- def upload_file():
 
 
 
 
 
 
 
 
 
 
 
 
64
  if 'pdfFile' in request.files:
65
  pdf_file = request.files['pdfFile']
66
  text = ""
 
60
  realProb = ans/len(text)
61
  return {"Real": realProb, "Fake": 1-realProb, "results": results, "text": text}
62
 
63
+ def upload_file(file):
64
+ if file:
65
+ pdf_file = file
66
+ text = ""
67
+ with pdfplumber.open(pdf_file) as pdf:
68
+ cnt = 0
69
+ for page in pdf.pages:
70
+ cnt+=1
71
+ text+=(page.extract_text(x_tolerance = 1))
72
+ print(text)
73
+ if cnt>5:
74
+ break
75
+ return findRealProb(text)
76
  if 'pdfFile' in request.files:
77
  pdf_file = request.files['pdfFile']
78
  text = ""