In [1]:
import nltk
# Sample sentence that feeds the tokenize -> tag -> chunk cells of this notebook.
sentence = "Hello my name is joe."
# Split the sentence into tokens; `tokens` is the input to nltk.pos_tag in the next cell.
# NOTE(review): word_tokenize relies on NLTK tokenizer data being installed locally —
# confirm it has been fetched (nltk.download) before running on a fresh environment.
tokens = nltk.word_tokenize(sentence)
# Bare last expression so the notebook displays the token list.
tokens
Out[1]:
In [2]:
# Part-of-speech tag the tokens from the tokenization cell; `tagged` is later passed to ne_chunk.
tagged = nltk.pos_tag(tokens)
In [3]:
# Display the result of nltk.pos_tag for inspection.
tagged
Out[3]:
In [4]:
# Run NLTK's named-entity chunker over the POS-tagged tokens.
entities = nltk.chunk.ne_chunk(tagged)
In [5]:
# Inspect what kind of object ne_chunk returned
# (presumably an nltk Tree — confirm against the cell output).
type(entities)
Out[5]:
In [6]:
%pylab inline
In [7]:
from nltk.corpus import treebank
In [8]:
# Take the first parsed sentence that the treebank corpus reader returns for 'wsj_0001.mrg';
# `t` is the object rendered by the following cell.
t = treebank.parsed_sents('wsj_0001.mrg')[0]
In [9]:
# Render the parse tree as text directly in the cell output. Tree.draw() instead opens a
# separate Tk window, which blocks the kernel until the window is closed and fails on
# kernels without a display, so the notebook could not be re-run end to end.
t.pretty_print()
In [ ]: