PosterDemoSequenceClassificationBinary

Sleeping

AlGe committed on Jun 28, 2024

Commit

0659cc6

verified ·

1 Parent(s): 02f2078

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -106,7 +106,6 @@ def generate_charts(ner_output_bin: dict) -> Tuple[go.Figure, np.ndarray]:
     return fig2, wordcloud_image
 def generate_wordcloud(entities: List[Dict], color_map: Dict[str, str]) -> np.ndarray:
     token_texts = []
     token_scores = []
@@ -114,10 +113,11 @@ def generate_wordcloud(entities: List[Dict], color_map: Dict[str, str]) -> np.nd
     for entity in entities:
         for token in entity['tokens']:
-            token_texts.append(token)
             token_scores.append(entity['score'])
             token_types.append(entity['entity'])
-            print(f"{token} ({entity['entity']}): {entity['score']}")
     # Create a dictionary for word cloud
     word_freq = {text: score for text, score in zip(token_texts, token_scores)}
@@ -143,6 +143,7 @@ def generate_wordcloud(entities: List[Dict], color_map: Dict[str, str]) -> np.nd
     return image_array
 @spaces.GPU
 def all(text: str):
     ner_output_bin = process_ner(text, pipe_bin)

     return fig2, wordcloud_image
 def generate_wordcloud(entities: List[Dict], color_map: Dict[str, str]) -> np.ndarray:
     token_texts = []
     token_scores = []
     for entity in entities:
         for token in entity['tokens']:
+            cleaned_token = token.lstrip('_')
+            token_texts.append(cleaned_token)
             token_scores.append(entity['score'])
             token_types.append(entity['entity'])
+            print(f"{cleaned_token} ({entity['entity']}): {entity['score']}")
     # Create a dictionary for word cloud
     word_freq = {text: score for text, score in zip(token_texts, token_scores)}
     return image_array
 @spaces.GPU
 def all(text: str):
     ner_output_bin = process_ner(text, pipe_bin)