yitingliii committed on
Commit
f7ba0f9
·
verified ·
1 Parent(s): 719567a

Update tfidf.py

Browse files
Files changed (1) hide show
  1. tfidf.py +4 -1
tfidf.py CHANGED
@@ -1,4 +1,7 @@
1
-
 
 
 
2
  from sklearn.feature_extraction.text import TfidfVectorizer
3
  tfidf = TfidfVectorizer(max_features=5000, ngram_range=(1, 2), stop_words='english')
4
  X_train_tfidf = tfidf.fit_transform(X_train)
 
1
+ from sklearn.model_selection import train_test_split
2
+ X = df['title']
3
+ y = df['labels']
4
+ X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
5
  from sklearn.feature_extraction.text import TfidfVectorizer
6
  tfidf = TfidfVectorizer(max_features=5000, ngram_range=(1, 2), stop_words='english')
7
  X_train_tfidf = tfidf.fit_transform(X_train)