yitingliii committed on
Commit
bfe44e3
·
verified ·
1 Parent(s): d4e4e9a

Update data_cleaning.py

Browse files
Files changed (1) hide show
  1. data_cleaning.py +4 -0
data_cleaning.py CHANGED
@@ -1,3 +1,7 @@
 
 
 
 
1
  def clean(df):
2
  stop_words = set(stopwords.words('english'))
3
  lemmatizer = WordNetLemmatizer()
 
1
+ from nltk.corpus import stopwords
2
+ from nltk.stem import WordNetLemmatizer
3
+ from bs4 import BeautifulSoup
4
+ import re
5
  def clean(df):
6
  stop_words = set(stopwords.words('english'))
7
  lemmatizer = WordNetLemmatizer()