File size: 642 Bytes
f11b302
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
import re
import streamlit as st
import nlpaug.augmenter.word as naw

import os
os.environ["TOKENIZERS_PARALLELISM"] = "false"

@st.cache(allow_output_mutation=True, ttl=48*3600)
def load_model():
    aug = naw.ContextualWordEmbsAug(
        model_path='bert-base-uncased', action="insert")
    return aug

aug = load_model()

def parphrase(passage):
    sen = []
    for i in passage:
        res = len(re.findall(r'\w+', i))
        if res == 2:
            pass
        else:
            res = i.replace('"', "'").replace("\n", "")
            sen.append(res)

    pas = " ".join(sen)
    para_text = aug.augment(pas)
    return para_text