songhai2022 committed on
Commit
8902c6f
·
1 Parent(s): 6d87ffc

Create get_bert_keywords.py

Browse files
Files changed (1) hide show
  1. get_bert_keywords.py +12 -0
get_bert_keywords.py ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # import keyword-extraction dependencies (NLTK stop words, KeyBERT)
2
+ from nltk.corpus import stopwords
3
+ from keybert import KeyBERT
4
+ from collections import Counter
5
+ # KeyBERT model, created once at module level and reused by get_bert_keywords
6
+ keybert_model = KeyBERT(model='all-MiniLM-L6-v2')
7
+
8
def get_bert_keywords(text, num_keywords, ignorewords=None):
    """Return the top single-word keywords that KeyBERT extracts from *text*.

    Args:
        text: Document handed to ``keybert_model.extract_keywords``.
            NOTE(review): the unpacking below assumes a single document
            (a flat list of ``(keyword, score)`` pairs comes back) -- confirm
            callers never pass a list of documents.
        num_keywords: Maximum number of keywords to request (``top_n``).
        ignorewords: Optional extra words to exclude on top of NLTK's English
            stop words. May be ``None`` (no extra words), a single string, or
            any iterable of strings.

    Returns:
        A list of keyword strings in the order KeyBERT returned them, with
        the scores discarded.
    """
    # Normalise the extra stop words to a list so the concatenation below
    # works for None, tuples, sets and generators, not only for lists.
    if ignorewords is None:
        extra_stop_words = []
    elif isinstance(ignorewords, str):
        # A bare string is one word, not an iterable of characters.
        extra_stop_words = [ignorewords]
    else:
        extra_stop_words = list(ignorewords)

    stop_words = stopwords.words('english') + extra_stop_words

    ranked = keybert_model.extract_keywords(
        text,
        keyphrase_ngram_range=(1, 1),  # unigrams only
        top_n=num_keywords,
        stop_words=stop_words,
    )
    return [keyword for keyword, _score in ranked]