DevBM committed on
Commit
a71879c
·
verified ·
1 Parent(s): e79f627

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +49 -48
app.py CHANGED
@@ -1,49 +1,50 @@
1
- import streamlit as st
2
- from transformers import pipeline
3
- from PyPDF2 import PdfReader
4
- import PyPDF2
5
- import fitz
6
- import os
7
- import nltk
8
-
9
-
10
- def get_pdf_text(pdf_docs):
11
- text = ""
12
- for pdf in pdf_docs:
13
- pdf_reader = PdfReader(pdf)
14
- for page in pdf_reader.pages:
15
- text += page.extract_text()
16
- return text
17
-
18
- def main():
19
- st.title('Question Generator from PDFs')
20
- pipe = pipeline(
21
- task = 'text2text-generation',
22
- model = 'ramsrigouthamg/t5_squad_v1'
23
- )
24
- file = st.file_uploader(label='Upload',accept_multiple_files=True)
25
- pr = st.button(label='Start')
26
- if pr:
27
- st.write('Hi')
28
- raw_text = get_pdf_text(file)
29
- sentences = nltk.sent_tokenize(text=raw_text)
30
- # st.write(sts)
31
- # for i in sentences:
32
- # st.write(i)
33
- questions = []
34
- st.subheader("Generated Questions are: ")
35
- s = pipe(sentences)
36
- for i in s:
37
- questions.append(i['generated_text'][10:])
38
- st.write(i['generated_text'][10:])
39
- if st.toggle(label='Show Pipeline Output'):
40
- st.write(s)
41
- if st.toggle(label='Show Questions list'):
42
- st.write(questions)
43
- # for i in sts:
44
- # x = pipe(i)
45
- # questions.append(x)
46
- # st.write(x)
47
-
48
- if __name__ == '__main__':
 
49
  main()
 
1
+ import streamlit as st
2
+ from transformers import pipeline
3
+ from PyPDF2 import PdfReader
4
+ import PyPDF2
5
+ import fitz
6
+ import os
7
+ import nltk
8
+
9
+ nltk.download('punkt')
10
+
11
+ def get_pdf_text(pdf_docs):
12
+ text = ""
13
+ for pdf in pdf_docs:
14
+ pdf_reader = PdfReader(pdf)
15
+ for page in pdf_reader.pages:
16
+ text += page.extract_text()
17
+ return text
18
+
19
+ def main():
20
+ st.title('Question Generator from PDFs')
21
+ pipe = pipeline(
22
+ task = 'text2text-generation',
23
+ model = 'ramsrigouthamg/t5_squad_v1'
24
+ )
25
+ file = st.file_uploader(label='Upload',accept_multiple_files=True)
26
+ pr = st.button(label='Start')
27
+ if pr:
28
+ st.write('Hi')
29
+ raw_text = get_pdf_text(file)
30
+ sentences = nltk.sent_tokenize(text=raw_text)
31
+ # st.write(sts)
32
+ # for i in sentences:
33
+ # st.write(i)
34
+ questions = []
35
+ st.subheader("Generated Questions are: ")
36
+ s = pipe(sentences)
37
+ for i in s:
38
+ questions.append(i['generated_text'][10:])
39
+ st.write(i['generated_text'][10:])
40
+ if st.toggle(label='Show Pipeline Output'):
41
+ st.write(s)
42
+ if st.toggle(label='Show Questions list'):
43
+ st.write(questions)
44
+ # for i in sts:
45
+ # x = pipe(i)
46
+ # questions.append(x)
47
+ # st.write(x)
48
+
49
+ if __name__ == '__main__':
50
  main()