notebook.community

Edit and run



In [1]:

    
# Tokenize a sample sentence with NLTK. As the displayed result shows,
# the trailing period becomes its own token.
# NOTE(review): word_tokenize presumably needs NLTK tokenizer data to be
# downloaded beforehand (nltk.download) - confirm for the installed version.
import nltk
sentence = "Hello my name is joe."
tokens = nltk.word_tokenize(sentence)
# Bare expression on the last line so the notebook displays the token list.
tokens









    Out[1]:





['Hello', 'my', 'name', 'is', 'joe', '.']



In [2]:

    
# Attach a part-of-speech tag to every token from the tokenization cell;
# the result is a list of (token, tag) pairs.
tagged = nltk.pos_tag(tokens)



In [3]:

    
# Display the (token, tag) pairs. Note in the output that lowercase 'joe'
# is tagged 'NN' while the capitalized 'Hello' is tagged 'NNP'.
tagged









    Out[3]:





[('Hello', 'NNP'),
 ('my', 'PRP$'),
 ('name', 'NN'),
 ('is', 'VBZ'),
 ('joe', 'NN'),
 ('.', '.')]



In [4]:

    
# Run NLTK's named-entity chunker over the POS-tagged tokens.
# NOTE(review): ne_chunk presumably requires extra NLTK model data to be
# installed - confirm which resources the installed version needs.
entities = nltk.chunk.ne_chunk(tagged)



In [5]:

    
# Inspect what the chunker returned: the result is an nltk.tree.Tree.
type(entities)









    Out[5]:





nltk.tree.Tree



In [6]:

    
# NOTE(review): %pylab populates the interactive namespace from numpy and
# matplotlib (see this cell's output), yet no cell visible in this notebook
# uses those names. Consider `%matplotlib inline` or dropping the cell -
# confirm nothing else relies on the injected names first.
%pylab inline









    



Populating the interactive namespace from numpy and matplotlib



In [7]:

    
# Corpus reader for NLTK's treebank corpus, used below to fetch a parsed sentence.
# NOTE(review): this import sits mid-notebook; consider moving it next to
# `import nltk` in the first cell so all dependencies are visible up front.
from nltk.corpus import treebank



In [8]:

    
# Take the first parsed sentence from the treebank file 'wsj_0001.mrg'.
# NOTE(review): presumably requires the treebank corpus data to be
# downloaded locally - confirm.
t = treebank.parsed_sents('wsj_0001.mrg')[0]



In [9]:

    
# Draw the parse tree of the sentence loaded above.
# NOTE(review): this presumably opens a separate GUI window rather than
# rendering inline in the notebook (no output is recorded for this cell) -
# confirm, and consider ending the cell with a bare `t` if inline display
# is wanted.
t.draw()



In [ ]: