Spaces:
Sleeping
Sleeping
File size: 1,590 Bytes
8efe659 5777a9a 2fe2a42 13ac7c2 2fe2a42 3fd92e9 13ac7c2 5777a9a 28ca0f2 1efe83d 5777a9a 13ac7c2 56c79b1 5777a9a 56c79b1 1efe83d 3fd92e9 5777a9a 3fd92e9 56c79b1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 |
import gradio as gr
import re
from mailparser import parse_from_string
from bs4 import BeautifulSoup
def accept_mail(email_content):
email = parse_from_string(email_content)
return email
def clean_email(email):
soup = BeautifulSoup(email.body, 'html.parser')
for tag in soup.find_all(['style', 'link']):
tag.decompose()
cleaned_text = ' '.join(soup.get_text(separator=' ').split())
return cleaned_text
def remove_special_characters(text):
pattern = r'[=_-]+'
cleaned_text = re.sub(pattern, '', text)
return cleaned_text
def present(email_content):
email = accept_mail(email_content)
cleaned_text = clean_email(email)
further_cleaned_text = remove_special_characters(cleaned_text)
email_info = {
"Subject": email.subject,
"From": email.from_,
"To": email.to,
"Date": email.date,
# "Message ID": email.message_id,
# "Headers": str(email.headers),
"Cleaned Body": further_cleaned_text
}
return [email_info[key] for key in email_info]
demo = gr.Interface(
fn=present,
inputs="text",
outputs=[
gr.components.Textbox(label="Subject"),
gr.components.Textbox(label="From"),
gr.components.Textbox(label="To"),
gr.components.Textbox(label="Date"),
# gr.components.Textbox(label="Message ID"),
# gr.components.Textbox(label="Headers"),
gr.components.Textbox(label="Cleaned Body")
],
title="Email Info",
description="Enter the email content below to view its details."
)
demo.launch()
|