umarigan committed on
Commit
861ad26
·
verified ·
1 Parent(s): f436055

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -4
app.py CHANGED
@@ -105,11 +105,11 @@ def create_mask_dict(entities):
105
  entity_counters[entity['entity_group']] += 1
106
  mask_dict[entity['word']] = f"{entity['entity_group']}_{entity_counters[entity['entity_group']]}"
107
  return mask_dict
108
-
109
- def create_masked_text(input_text, mask_dict):
110
  masked_text = input_text
111
- for word, mask in sorted(mask_dict.items(), key=lambda x: len(x[0]), reverse=True):
112
- masked_text = re.sub(r'\b' + re.escape(word) + r'\b', mask, masked_text)
 
113
  return masked_text
114
 
115
 
 
105
  entity_counters[entity['entity_group']] += 1
106
  mask_dict[entity['word']] = f"{entity['entity_group']}_{entity_counters[entity['entity_group']]}"
107
  return mask_dict
108
def create_masked_text(input_text, entities, mask_dict, *, excluded_groups=("CARDINAL", "EVENT")):
    """Return *input_text* with each detected entity span replaced by its mask.

    Spans are located by the ``start``/``end`` character offsets carried by
    each entity, so only the exact occurrence that was detected is replaced.

    Args:
        input_text: The original, unmasked text the offsets refer to.
        entities: Iterable of dicts with the keys ``entity_group``, ``word``,
            ``start`` and ``end``.
        mask_dict: Mapping from an entity's ``word`` to its mask label.
        excluded_groups: Entity groups that are left unmasked. Defaults to
            ``("CARDINAL", "EVENT")``.

    Returns:
        The masked text. With no maskable entities, *input_text* is returned
        unchanged.

    Raises:
        KeyError: If a maskable entity's ``word`` has no entry in *mask_dict*.
    """
    skipped_groups = frozenset(excluded_groups)

    # Walk the spans left to right; at an equal start the longer span comes
    # first so that the outermost entity wins when spans are nested.
    maskable = sorted(
        (entity for entity in entities if entity['entity_group'] not in skipped_groups),
        key=lambda entity: (entity['start'], -entity['end']),
    )

    pieces = []
    cursor = 0  # Offset in input_text up to which output has been emitted.
    for entity in maskable:
        # A span starting before the cursor overlaps (or duplicates) one that
        # was already masked; replacing it too would corrupt the output.
        if entity['start'] < cursor:
            continue
        pieces.append(input_text[cursor:entity['start']])
        pieces.append(mask_dict[entity['word']])
        cursor = entity['end']
    pieces.append(input_text[cursor:])

    return "".join(pieces)
114
 
115