PirateXX committed on
Commit
c43109e
·
1 Parent(s): 8eae465

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +25 -25
app.py CHANGED
@@ -67,21 +67,21 @@ def findRealProb(text):
67
 
68
  def upload_file(file):
69
 
70
- if 'pdfFile' in request.files:
71
- pdf_file = request.files['pdfFile']
72
- text = ""
73
- with pdfplumber.open(pdf_file) as pdf:
74
- cnt = 0
75
- for page in pdf.pages:
76
- cnt+=1
77
- text+=(page.extract_text(x_tolerance = 1))
78
- print(text)
79
- if cnt>5:
80
- break
81
- text = text.replace('\n', ' ')
82
- return findRealProb(text)
83
  # return jsonify({'text': text})
84
- # if file:
85
 
86
  # with open(file.name, 'rb') as pdf_file:
87
  # pdf_reader = PyPDF2.PdfReader(pdf_file)
@@ -91,17 +91,17 @@ def upload_file(file):
91
  # text += page.extract_text()
92
  # text = text.replace('\n', ' ')
93
  # return findRealProb(text)
94
- # pdf_file = file.name
95
- # print(file, pdf_file)
96
- # text = ""
97
- # with pdfplumber.open(pdf_file) as pdf:
98
- # cnt = 0
99
- # for page in pdf.pages:
100
- # cnt+=1
101
- # text+=(page.extract_text(x_tolerance = 1))
102
- # if cnt>5:
103
- # break
104
- # return findRealProb(text)
105
  else:
106
  return {"error":'No PDF file found in request'}
107
 
 
67
 
68
  def upload_file(file):
69
 
70
+ # if 'pdfFile' in request.files:
71
+ # pdf_file = request.files['pdfFile']
72
+ # text = ""
73
+ # with pdfplumber.open(pdf_file) as pdf:
74
+ # cnt = 0
75
+ # for page in pdf.pages:
76
+ # cnt+=1
77
+ # text+=(page.extract_text(x_tolerance = 1))
78
+ # print(text)
79
+ # if cnt>5:
80
+ # break
81
+ # text = text.replace('\n', ' ')
82
+ # return findRealProb(text)
83
  # return jsonify({'text': text})
84
+ if file:
85
 
86
  # with open(file.name, 'rb') as pdf_file:
87
  # pdf_reader = PyPDF2.PdfReader(pdf_file)
 
91
  # text += page.extract_text()
92
  # text = text.replace('\n', ' ')
93
  # return findRealProb(text)
94
+ pdf_file = file.name
95
+ print(file, pdf_file)
96
+ text = ""
97
+ with pdfplumber.open(pdf_file) as pdf:
98
+ cnt = 0
99
+ for page in pdf.pages:
100
+ cnt+=1
101
+ text+=(page.extract_text(x_tolerance = 1))
102
+ if cnt>5:
103
+ break
104
+ return findRealProb(text)
105
  else:
106
  return {"error":'No PDF file found in request'}
107