Spaces:

andrewgleave
/

note-ner-demo

Running

andrewgleave committed on Oct 10, 2022

Commit

32eb862

1 Parent(s): 9631ab8

WP

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,13 +1,11 @@
 import json
 import gradio as gr
-def ner(text):
-    api = gr.Interface.load("d4data/biomedical-ner-all", src="models")
-    result = api(text)
-    return result
 EXAMPLE_TEXTS = []
 with open("examples.json", "r") as f:
@@ -15,10 +13,31 @@ with open("examples.json", "r") as f:
     EXAMPLE_TEXTS = [x["text"] for x in example_json]
 interface = gr.Interface(
     ner,
     inputs=gr.Textbox(label="Input", value=""),
-    outputs=["json"],
     examples=EXAMPLE_TEXTS,
 )

 import json
 import gradio as gr
+from transformers import pipeline
+from transformers import AutoTokenizer, AutoModelForTokenClassification
+tokenizer = AutoTokenizer.from_pretrained("d4data/biomedical-ner-all")
+model = AutoModelForTokenClassification.from_pretrained("d4data/biomedical-ner-all")
 EXAMPLE_TEXTS = []
 with open("examples.json", "r") as f:
     EXAMPLE_TEXTS = [x["text"] for x in example_json]
+pipe = pipeline("ner", model=model, tokenizer=tokenizer, aggregation_strategy="simple")
+def ner(text):
+    raw = pipe(text)
+    result = {
+        "text": text,
+        "entities": [
+            {
+                "entity": x["entity_group"],
+                "word": x["word"],
+                "score": x["score"],
+                "start": x["start"],
+                "end": x["end"],
+            }
+            for x in raw
+        ],
+    }
+    return result, {}
 interface = gr.Interface(
     ner,
     inputs=gr.Textbox(label="Input", value=""),
+    outputs=[gr.HighlightedText(combine_adjacent=True), "json"],
     examples=EXAMPLE_TEXTS,
 )