tommasobaldi committed
Commit 6e3a821 · 1 parent: 795ee13

working on text splitting

Files changed (1): app.py (+3 -3)
app.py CHANGED
@@ -6,7 +6,6 @@ from transformers import pipeline, AutoTokenizer
 
 
 def main() -> None:
-    nltk.download("punkt")
     # header
     st.title(":bookmark_tabs: Terms Of Service Summarizer :bookmark_tabs:")
     st.markdown("The app aims to extract the main information from Terms Of Conditions, which are often too long and "
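The download removed here is re-added by the next hunk, next to the other setup calls. For context, `nltk.sent_tokenize` (used later in this file) depends on the Punkt model and raises a `LookupError` when it has not been downloaded, so the call only has to run before the first tokenization. A minimal sketch of that dependency (the sample text is invented):

```python
# Minimal sketch (sample text invented): sent_tokenize needs the Punkt
# model; without a prior nltk.download("punkt") it raises a LookupError.
import nltk

nltk.download("punkt")  # fetch the Punkt sentence-boundary models
sentences = nltk.sent_tokenize("First sentence. Second one.", language="english")
print(sentences)  # ['First sentence.', 'Second one.']
```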
@@ -70,6 +69,7 @@ def main() -> None:
             accumulated_lists.append(join_sentences(result_list))
         return accumulated_lists
 
+    nltk.download("punkt")
     pipe = create_pipeline()
     tokenizer = AutoTokenizer.from_pretrained("ML-unipi/bart-large-tos")
 
 
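The context lines above close a splitter whose body is not shown in this diff. As a rough sketch only: the diff exposes just the names `split_sentences_by_token_length`, `join_sentences`, and the `accumulated_lists` return, so the greedy packing and the parameter names below are guesses at the intent (chunking sentences to fit the model's token budget):

```python
# Hypothetical reconstruction: only the function names and the
# accumulated_lists return appear in the diff; the rest is a guess.
def join_sentences(sentences: list[str]) -> str:
    return " ".join(sentences)

def split_sentences_by_token_length(sentences: list[str], tokenizer, max_tokens: int = 512) -> list[str]:
    accumulated_lists: list[str] = []
    result_list: list[str] = []
    used = 0
    for sentence in sentences:
        n = len(tokenizer.encode(sentence))  # token count for this sentence
        if result_list and used + n > max_tokens:
            # current chunk is full: flush it and start a new one
            accumulated_lists.append(join_sentences(result_list))
            result_list, used = [], 0
        result_list.append(sentence)
        used += n
    if result_list:
        accumulated_lists.append(join_sentences(result_list))
    return accumulated_lists

# Assumed usage with the tokenizer loaded above:
# chunks = split_sentences_by_token_length(nltk.sent_tokenize(text), tokenizer, 512)
```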
@@ -94,7 +94,7 @@ def main() -> None:
     summarize_button = st.button(label="Try it!")
 
     if summarize_button:
-        if target_text_input is not "":
+        if target_text_input != "":
             summary_sentences = []
             with st.spinner("Summarizing in progress..."):
                 sentences = split_sentences_by_token_length(nltk.sent_tokenize(target_text_input, language="english"),
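The fix in this hunk matters because `is not` compares object identity, not value: `target_text_input is not ""` only behaved as intended thanks to CPython interning the empty string, and Python 3.8+ flags the pattern with a `SyntaxWarning`. A quick illustration (strings invented):

```python
# "is" tests identity, "==" tests value; comparing to a literal with "is"
# triggers on Python 3.8+: SyntaxWarning: "is not" with a literal.
a = "".join(["py", "thon"])  # builds a new "python" object at runtime
print(a == "python")  # True:  equal values
print(a is "python")  # False: distinct objects, despite equal values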
@@ -106,7 +106,7 @@ def main() -> None:
                     # st.markdown(str(len(token_list)))
                     output = pipe(sentence)
                     summary = output[0]["summary_text"]
-                    for line in summary.split("."):
+                    for line in summary.split(". "):
                         if line != "":
                             summary_sentences.append(line)
             display_summary(summary_sentences)
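Splitting on `". "` instead of `"."` keeps periods inside tokens such as prices or abbreviations from cutting a sentence apart, and the summary's trailing period no longer yields an empty last element. A comparison on invented sample text:

```python
# Invented sample: "." splits inside the price and leaves a trailing
# empty string; ". " only splits at sentence boundaries.
summary = "Fees may reach $1.50. No refunds."
print(summary.split("."))   # ['Fees may reach $1', '50', ' No refunds', '']
print(summary.split(". "))  # ['Fees may reach $1.50', 'No refunds.']
```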
 