# Let's create a dummy dataset data = [' '.join(tokens)]
from sklearn.feature_extraction.text import CountVectorizer, TfidfTransformer in3x,net,watch,14zwhrd6,dildo,18
# Vectorizer to convert text into a matrix of token counts vectorizer = CountVectorizer() count_features = vectorizer.fit_transform(data) # Let's create a dummy dataset data = [' '