File size: 1,303 Bytes
7a3d3ad c306bb9 7a3d3ad c306bb9 8c96cb8 a0ecce1 c306bb9 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 |
# https://huggingface.co/spaces/Antoniskaraolis/AI_Audio_Processing
# Here are the imports
import gradio as gr
from PyPDF2 import PdfReader
from transformers import pipeline
from gtts import gTTS
import tempfile
import os
# Here is the code
def extract_abstract_from_pdf(file):
reader = PdfReader(file.name)
first_page = reader.pages[0]
text = first_page.extract_text()
return text
def summarize_text(text, model_name='sshleifer/distilbart-cnn-12-6'):
summarizer = pipeline("summarization", model=model_name)
summary = summarizer(text, max_length=75, min_length=20, do_sample=False)
first_sentence = summary[0]['summary_text'].split('.')[0] + '.'
return first_sentence
def process_pdf_to_speech(file):
abstract = extract_abstract_from_pdf(file)
summary = summarize_text(abstract)
tts = gTTS(text=summary, lang='en')
with tempfile.NamedTemporaryFile(delete=False, suffix='.mp3') as fp:
tts.save(fp.name)
return fp.name
iface = gr.Interface(
fn=process_pdf_to_speech,
inputs=gr.File(label="Upload PDF"),
outputs=gr.Audio(label="Play Summary"),
title="PDF Abstract to Speech",
description="This app summarizes the abstract from a PDF and converts it to speech. Please upload a PDF with an abstract."
)
iface.launch() |