Text Feature Extraction: The Hashing Trick

Reminder: bag of words

The hashing trick


In [ ]:
# Toy corpus of two short documents; the vectorizer cells below transform it.
X = [
    "Some say the world will end in fire,",
    "Some say in ice.",
]

In [ ]:
from sklearn.feature_extraction.text import HashingVectorizer

# Build a vectorizer with all-default settings.
hashing_vectorizer = HashingVectorizer()

# transform() is called directly on the corpus, with no fit step beforehand
# (scikit-learn documents HashingVectorizer as stateless).
X_hashed = hashing_vectorizer.transform(X)

In [ ]:
# Show the repr of the transformed corpus as this cell's output.
X_hashed

In [ ]:
# Rebuild the vectorizer with ngram_range=(1, 2); per the scikit-learn docs this
# extracts both single words and two-word sequences. Note that this rebinds
# the `hashing_vectorizer` and `X_hashed` names defined in the earlier cell.
hashing_vectorizer = HashingVectorizer(
    ngram_range=(1, 2),
)
X_hashed = hashing_vectorizer.transform(X)

# Last expression of the cell: display the new transformed result.
X_hashed