acrowth committed on
Commit
ca594bc
·
1 Parent(s): 7531e94

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +8 -4
app.py CHANGED
@@ -1,12 +1,11 @@
1
  from pdf2image import convert_from_path
2
  import pandas as pd, numpy as np
3
- from PIL import Image
4
- import pickle
5
  import gradio as gr
6
  from transformers import pipeline
7
  import pandas as pd
8
- from sentence_transformers import SentenceTransformer, util
9
- import pickle
10
  import pytesseract
11
  from transformers import pipeline
12
  pipe = pipeline("text-classification",model="acrowth/autotrain-preesmetextclassifier-2437575785")
@@ -16,6 +15,11 @@ pipe = pipeline("text-classification",model="acrowth/autotrain-preesmetextclassi
16
  # pipe=pickle.load(file)
17
 
18
  def findpdftype(file):
 
 
 
 
 
19
  images = convert_from_path(file.name)
20
  results=[]
21
  for image in images:
 
1
  from pdf2image import convert_from_path
2
  import pandas as pd, numpy as np
3
+ #from PIL import Image
4
+ #import pickle
5
  import gradio as gr
6
  from transformers import pipeline
7
  import pandas as pd
8
+ #from sentence_transformers import SentenceTransformer, util
 
9
  import pytesseract
10
  from transformers import pipeline
11
  pipe = pipeline("text-classification",model="acrowth/autotrain-preesmetextclassifier-2437575785")
 
15
  # pipe=pickle.load(file)
16
 
17
  def findpdftype(file):
18
+ images = convert_from_path(file.name, first_page=1,last_page=1)
19
+ images[0].save('test.jpg')
20
+ return pipe('test.jpg')[0]['label']
21
+
22
+ def findpdftypeold2(file):
23
  images = convert_from_path(file.name)
24
  results=[]
25
  for image in images: