Spaces:
Sleeping
Sleeping
Nikhil Singh
committed on
Commit
·
d90af9d
1
Parent(s):
a02ed2b
email upload
Browse files
app.py
CHANGED
@@ -65,15 +65,18 @@ def present(email_file, labels, multilingual=False):
|
|
65 |
sentence_list = get_sentences(further_cleaned_text)
|
66 |
|
67 |
entities = parse_query(sentence_list, labels, threshold=0.3, nested_ner=False, model_name="urchade/gliner_base", multilingual=multilingual)
|
|
|
|
|
|
|
68 |
|
69 |
email_info = {
|
70 |
"Subject": email.subject,
|
71 |
"From": email.from_,
|
72 |
"To": email.to,
|
73 |
"Date": email.date,
|
74 |
-
"Extracted Entities":
|
75 |
}
|
76 |
-
return [email_info[key] for key in ["Subject", "From", "To", "Date"]] + [
|
77 |
|
78 |
labels = ["PERSON", "PRODUCT", "DEAL", "ORDER", "ORDER PAYMENT METHOD", "STORE", "LEGAL ENTITY", "MERCHANT", "FINANCIAL TRANSACTION", "UNCATEGORIZED", "DATE"]
|
79 |
|
@@ -93,7 +96,7 @@ demo = gr.Interface(
|
|
93 |
gr.components.Textbox(label="From"),
|
94 |
gr.components.Textbox(label="To"),
|
95 |
gr.components.Textbox(label="Date"),
|
96 |
-
gr.components.Dataframe(label="Extracted Entities")
|
97 |
],
|
98 |
title="Email Info Extractor",
|
99 |
description="Upload an email file (.eml) to extract its details and detected entities."
|
|
|
65 |
sentence_list = get_sentences(further_cleaned_text)
|
66 |
|
67 |
entities = parse_query(sentence_list, labels, threshold=0.3, nested_ner=False, model_name="urchade/gliner_base", multilingual=multilingual)
|
68 |
+
|
69 |
+
# Format entities for DataFrame: Convert list of dicts to list of lists
|
70 |
+
entities_data = [[entity['text'], entity['label']] for entity in entities]
|
71 |
|
72 |
email_info = {
|
73 |
"Subject": email.subject,
|
74 |
"From": email.from_,
|
75 |
"To": email.to,
|
76 |
"Date": email.date,
|
77 |
+
"Extracted Entities": entities_data # Adjusted for DataFrame
|
78 |
}
|
79 |
+
return [email_info[key] for key in ["Subject", "From", "To", "Date"]] + [entities_data]
|
80 |
|
81 |
labels = ["PERSON", "PRODUCT", "DEAL", "ORDER", "ORDER PAYMENT METHOD", "STORE", "LEGAL ENTITY", "MERCHANT", "FINANCIAL TRANSACTION", "UNCATEGORIZED", "DATE"]
|
82 |
|
|
|
96 |
gr.components.Textbox(label="From"),
|
97 |
gr.components.Textbox(label="To"),
|
98 |
gr.components.Textbox(label="Date"),
|
99 |
+
gr.components.Dataframe(headers=["Text", "Label"], label="Extracted Entities")
|
100 |
],
|
101 |
title="Email Info Extractor",
|
102 |
description="Upload an email file (.eml) to extract its details and detected entities."
|