Spaces:
Running
Running
import html
import io
from urllib.parse import quote

import gradio as gr
import requests
from pypdf import PdfReader
def scrape(instring):
    """Build an embedded Google Docs viewer for the PDF at ``instring``.

    Args:
        instring: URL of the PDF to display, as typed by the user.

    Returns:
        The value returned by ``gr.HTML.update`` for the viewer markup.
    """
    target = (instring or "").strip()
    # Percent-encode the whole target so that its own '&', '?', '#' etc. stay
    # inside the ``url`` parameter instead of being parsed as viewer arguments.
    viewer_url = (
        "https://docs.google.com/viewer?url="
        f"{quote(target, safe='')}&embedded=true"
    )
    # Escape for the attribute context: user input must not be able to close
    # the src="..." attribute and inject markup.
    safe_src = html.escape(viewer_url, quote=True)
    html_src = f'''
<div style="text-align:center">
<h4>PDF Viewer</h4>
<iframe src="{safe_src}" frameborder="0" height="1200px" width="100%"></iframe>
</div>'''
    return gr.HTML.update(html_src)
def scrape00(instring):
    """Download a PDF, extract the text of its first page and summarize it.

    Args:
        instring: URL of the PDF to download.

    Returns:
        A ``(text, summary)`` tuple. ``text`` is the extracted text of the
        first page, or an ``"Error: ..."`` message when the download fails or
        the document has no pages. ``summary`` is the summarizer output,
        ``"Error"`` when summarization fails, or ``""`` when there was no text
        to summarize.
    """
    try:
        # A timeout keeps a stalled server from blocking a queue worker forever.
        response = requests.get(instring, timeout=30)
    except requests.RequestException as err:
        print(err)
        return f"Error: could not download PDF ({err})", ""

    if response.status_code != 200:
        print(response.status_code)
        # Stop here: there is no fresh document to parse for this request.
        return f"Error: download failed with HTTP status {response.status_code}", ""

    # Parse from memory rather than a shared "data.pdf" on disk, so that
    # concurrent requests cannot overwrite each other's download.
    reader = PdfReader(io.BytesIO(response.content))
    if len(reader.pages) == 0:
        return "Error: PDF contains no pages", ""
    text = reader.pages[0].extract_text()

    try:
        summarizer = gr.Interface.load("huggingface/facebook/bart-large-cnn")
        sum_out = summarizer(text)
    except Exception as err:
        # Best effort: keep returning the extracted text, but log the cause.
        print(f"Summarization failed: {err}")
        sum_out = "Error"
    return text, sum_out
# UI layout: a URL box, two action buttons, the embedded viewer, and a row
# holding the extracted text next to its summary.
with gr.Blocks() as app:
    gr.Markdown('''<h1>PDF Viewer''')
    inp = gr.Textbox()

    with gr.Row():
        go_btn = gr.Button("Load PDF")
        sum_btn = gr.Button("Summarize")

    outp = gr.HTML()

    with gr.Row():
        text_out = gr.Textbox()
        sum_out = gr.Textbox()

    # "Load PDF" renders the viewer; "Summarize" fills both text boxes.
    go_btn.click(fn=scrape, inputs=inp, outputs=outp)
    sum_btn.click(fn=scrape00, inputs=inp, outputs=[text_out, sum_out])

# Enable the request queue with 10 concurrent workers, then start the server.
queued_app = app.queue(concurrency_count=10)
queued_app.launch()