Spaces:

sabaridsnfuji
/

JP_NER

Running

App Files Community

sabarinathan committed on Sep 17, 2024

Commit

d67f838

verified ·

1 Parent(s): 39bccfa

Update app.py

Browse files

Files changed (1) hide show

app.py +7 -5

app.py CHANGED Viewed

@@ -1,4 +1,3 @@
 # -*- coding: utf-8 -*-
 """
 Created on Tue Sep 17 19:03:17 2024
@@ -53,7 +52,7 @@ class JapaneseNER():
         sample_encoding = self.tokenizer([
           "鈴木は4月の陽気の良い日に、鈴をつけて熊本県の阿蘇山に登った",
           "中国では、中国共産党による一党統治が続く",
-        ], truncation=True,padding=True,  # Ensure all sequences are of the same length
                                     max_length=512, return_tensors="pt")
         sample_encoding = {k: v.to(device) for k, v in sample_encoding.items()}
@@ -66,7 +65,7 @@ class JapaneseNER():
         print("Predicted labels:", predicted_label_id)
     def predict(self, text):
-        encoding = self.tokenizer([text], truncation=True,padding=True, max_length=512, return_tensors="pt")
         encoding = {k: v.to(device) for k, v in encoding.items()}
         # Perform prediction
@@ -106,16 +105,19 @@ def ner_inference(text):
         start_idx += 1
     doc.ents = ents  # Set the entities in the Doc
-    # Render using spacy displacy
     html = displacy.render(doc, style="ent", jupyter=False)  # Generate HTML for entities
     return html
 # Create Gradio interface
 import gradio as gr
 iface = gr.Interface(
     fn=ner_inference,  # The function to call for prediction
-    inputs=gr.Textbox(lines=5, placeholder="Enter Japanese text for NER..."),  # Input widget
     outputs="html",  # Output will be in HTML format using displacy
     title="Japanese Named Entity Recognition (NER)",
     description="Enter Japanese text and see the named entities highlighted in the output."

 # -*- coding: utf-8 -*-
 """
 Created on Tue Sep 17 19:03:17 2024
         sample_encoding = self.tokenizer([
           "鈴木は4月の陽気の良い日に、鈴をつけて熊本県の阿蘇山に登った",
           "中国では、中国共産党による一党統治が続く",
+        ], truncation=True, padding=True,  # Ensure all sequences are of the same length
                                     max_length=512, return_tensors="pt")
         sample_encoding = {k: v.to(device) for k, v in sample_encoding.items()}
         print("Predicted labels:", predicted_label_id)
     def predict(self, text):
+        encoding = self.tokenizer([text], truncation=True, padding=True, max_length=512, return_tensors="pt")
         encoding = {k: v.to(device) for k, v in encoding.items()}
         # Perform prediction
         start_idx += 1
     doc.ents = ents  # Set the entities in the Doc
+    # Render using spaCy displacy
     html = displacy.render(doc, style="ent", jupyter=False)  # Generate HTML for entities
     return html
+# Sample text for demonstration
+sample_text = "鈴木一朗は2020年に引退した。女優の石原さとみは多くの映画で主演している。"
 # Create Gradio interface
 import gradio as gr
 iface = gr.Interface(
     fn=ner_inference,  # The function to call for prediction
+    inputs=gr.Textbox(lines=5, placeholder="Enter Japanese text for NER...", default=sample_text),  # Input widget with sample text
     outputs="html",  # Output will be in HTML format using displacy
     title="Japanese Named Entity Recognition (NER)",
     description="Enter Japanese text and see the named entities highlighted in the output."