ghomasHudson committed on
Commit
e568ca3
·
1 Parent(s): 9a19160

Basic coref

Browse files
Files changed (1) hide show
  1. app.py +11 -0
app.py CHANGED
@@ -16,6 +16,7 @@ st.title('Entity Linking Demo')
16
  article = st.text_area('Article to analyze:', value=open("example.txt").read())
17
 
18
  seen_entities = []
 
19
  if st.button('Submit'):
20
  good_ents = []
21
 
@@ -24,6 +25,16 @@ if st.button('Submit'):
24
  for ent in doc.ents:
25
  if ent._.kb_qid is None or ent.label_ not in ["ORG", "PERSON", "GPE"] or ent.text in seen_entities:
26
  continue
 
 
 
 
 
 
 
 
 
 
27
  seen_entities.append(ent.text)
28
  print((ent.text, ent.label_, ent._.kb_qid, ent._.url_wikidata, ent._.nerd_score))
29
  r = requests.get("https://www.wikidata.org/w/api.php?action=wbgetclaims&format=json&property=P18&entity=" + ent._.kb_qid)
 
16
  article = st.text_area('Article to analyze:', value=open("example.txt").read())
17
 
18
  seen_entities = []
19
+ seen_surnames = []
20
  if st.button('Submit'):
21
  good_ents = []
22
 
 
25
  for ent in doc.ents:
26
  if ent._.kb_qid is None or ent.label_ not in ["ORG", "PERSON", "GPE"] or ent.text in seen_entities:
27
  continue
28
+
29
+ if ent.label_ == "PERSON":
30
+ if len(ent.text.split()) == 1:
31
+ # Single name
32
+ if ent.text in seen_surnames:
33
+ continue
34
+ else:
35
+ # Multipart name
36
+ seen_surnames.append(ent.text.split()[-1])
37
+
38
  seen_entities.append(ent.text)
39
  print((ent.text, ent.label_, ent._.kb_qid, ent._.url_wikidata, ent._.nerd_score))
40
  r = requests.get("https://www.wikidata.org/w/api.php?action=wbgetclaims&format=json&property=P18&entity=" + ent._.kb_qid)