Update data_cleaning.py
Browse files
- data_cleaning.py +4 -0
data_cleaning.py
CHANGED
|
@@ -1,3 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
def clean(df):
|
| 2 |
stop_words = set(stopwords.words('english'))
|
| 3 |
lemmatizer = WordNetLemmatizer()
|
|
|
|
| 1 |
+
from nltk.corpus import stopwords
|
| 2 |
+
from nltk.stem import WordNetLemmatizer
|
| 3 |
+
from bs4 import BeautifulSoup
|
| 4 |
+
import re
|
| 5 |
def clean(df):
|
| 6 |
stop_words = set(stopwords.words('english'))
|
| 7 |
lemmatizer = WordNetLemmatizer()
|