# Configure the TF-IDF vectorizer: lowercase the text, drop English stop
# words, and use unigrams, bigrams and trigrams as features.
tfidf = TfidfVectorizer(
    lowercase=True,
    stop_words="english",
    ngram_range=(1, 3),
)

# Fit the vectorizer on the training text in train_v4["content"] and, in the
# same call, encode that text as the training feature matrix.
X_train_vec_v4 = tfidf.fit_transform(train_v4["content"])