Creating Word Vectors with word2vec

N.B.: run "git pull" anywhere inside the nyc-ds-academy directory to update to the latest notebooks

Load dependencies


In [1]:
import os

import nltk
from nltk import word_tokenize, sent_tokenize
import gensim
from gensim.models.word2vec import Word2Vec
from sklearn.manifold import TSNE
import pandas as pd
from bokeh.io import output_notebook
from bokeh.plotting import show, figure
%matplotlib inline


Using TensorFlow backend.

In [2]:
# Download the Punkt tokenizer models: an English-language sentence tokenizer that
# copes with the fact that not all periods end sentences and not all sentences
# start with a capital letter.
nltk.download('punkt')


[nltk_data] Downloading package punkt to /home/jovyan/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.
Out[2]:
True

Load data


In [3]:
# Download NLTK's Gutenberg corpus (the 18 text files listed by gutenberg.fileids() below).
nltk.download('gutenberg')


[nltk_data] Downloading package gutenberg to /home/jovyan/nltk_data...
[nltk_data]   Unzipping corpora/gutenberg.zip.
Out[3]:
True

In [4]:
from nltk.corpus import gutenberg

In [5]:
# File ids of the texts bundled in the corpus.
gutenberg.fileids()


Out[5]:
['austen-emma.txt',
 'austen-persuasion.txt',
 'austen-sense.txt',
 'bible-kjv.txt',
 'blake-poems.txt',
 'bryant-stories.txt',
 'burgess-busterbrown.txt',
 'carroll-alice.txt',
 'chesterton-ball.txt',
 'chesterton-brown.txt',
 'chesterton-thursday.txt',
 'edgeworth-parents.txt',
 'melville-moby_dick.txt',
 'milton-paradise.txt',
 'shakespeare-caesar.txt',
 'shakespeare-hamlet.txt',
 'shakespeare-macbeth.txt',
 'whitman-leaves.txt']

In [6]:
# Number of texts in the corpus.
len(gutenberg.fileids())


Out[6]:
18

Tokenize text


In [7]:
# Split the raw text returned by gutenberg.raw() (called without file ids) into
# sentence strings. Newlines embedded in the text are kept inside each sentence,
# as the output of the next cell shows.
gberg_sent_tokens = sent_tokenize(gutenberg.raw())

In [8]:
# Peek at the first five sentence strings.
gberg_sent_tokens[:5]


Out[8]:
['[Emma by Jane Austen 1816]\n\nVOLUME I\n\nCHAPTER I\n\n\nEmma Woodhouse, handsome, clever, and rich, with a comfortable home\nand happy disposition, seemed to unite some of the best blessings\nof existence; and had lived nearly twenty-one years in the world\nwith very little to distress or vex her.',
 "She was the youngest of the two daughters of a most affectionate,\nindulgent father; and had, in consequence of her sister's marriage,\nbeen mistress of his house from a very early period.",
 'Her mother\nhad died too long ago for her to have more than an indistinct\nremembrance of her caresses; and her place had been supplied\nby an excellent woman as governess, who had fallen little short\nof a mother in affection.',
 "Sixteen years had Miss Taylor been in Mr. Woodhouse's family,\nless as a governess than a friend, very fond of both daughters,\nbut particularly of Emma.",
 'Between _them_ it was more the intimacy\nof sisters.']

In [9]:
# Look at a single sentence string (index 1).
gberg_sent_tokens[1]


Out[9]:
"She was the youngest of the two daughters of a most affectionate,\nindulgent father; and had, in consequence of her sister's marriage,\nbeen mistress of his house from a very early period."

In [10]:
# Break that sentence into word and punctuation tokens; note that the possessive
# is kept as a single "'s" token.
word_tokenize(gberg_sent_tokens[1])


Out[10]:
['She',
 'was',
 'the',
 'youngest',
 'of',
 'the',
 'two',
 'daughters',
 'of',
 'a',
 'most',
 'affectionate',
 ',',
 'indulgent',
 'father',
 ';',
 'and',
 'had',
 ',',
 'in',
 'consequence',
 'of',
 'her',
 'sister',
 "'s",
 'marriage',
 ',',
 'been',
 'mistress',
 'of',
 'his',
 'house',
 'from',
 'a',
 'very',
 'early',
 'period',
 '.']

In [11]:
# Index into the token list: position 14 is 'father'.
word_tokenize(gberg_sent_tokens[1])[14]


Out[11]:
'father'

In [12]:
# A convenient corpus method that handles newlines and tokenizes into sentences
# and words in one shot. Its tokenization differs from sent_tokenize/word_tokenize
# above: the title and headings come out as separate sentences, and the possessive
# is split into "'" and "s" (compare the outputs below with the earlier ones).
gberg_sents = gutenberg.sents()

In [13]:
# First five tokenized sentences: each one is a list of word/punctuation tokens.
gberg_sents[0:5]


Out[13]:
[['[', 'Emma', 'by', 'Jane', 'Austen', '1816', ']'],
 ['VOLUME', 'I'],
 ['CHAPTER', 'I'],
 ['Emma',
  'Woodhouse',
  ',',
  'handsome',
  ',',
  'clever',
  ',',
  'and',
  'rich',
  ',',
  'with',
  'a',
  'comfortable',
  'home',
  'and',
  'happy',
  'disposition',
  ',',
  'seemed',
  'to',
  'unite',
  'some',
  'of',
  'the',
  'best',
  'blessings',
  'of',
  'existence',
  ';',
  'and',
  'had',
  'lived',
  'nearly',
  'twenty',
  '-',
  'one',
  'years',
  'in',
  'the',
  'world',
  'with',
  'very',
  'little',
  'to',
  'distress',
  'or',
  'vex',
  'her',
  '.'],
 ['She',
  'was',
  'the',
  'youngest',
  'of',
  'the',
  'two',
  'daughters',
  'of',
  'a',
  'most',
  'affectionate',
  ',',
  'indulgent',
  'father',
  ';',
  'and',
  'had',
  ',',
  'in',
  'consequence',
  'of',
  'her',
  'sister',
  "'",
  's',
  'marriage',
  ',',
  'been',
  'mistress',
  'of',
  'his',
  'house',
  'from',
  'a',
  'very',
  'early',
  'period',
  '.']]

In [14]:
# The same Emma sentence inspected earlier, now at index 4 because the title and
# the two headings are counted as sentences of their own.
gberg_sents[4]


Out[14]:
['She',
 'was',
 'the',
 'youngest',
 'of',
 'the',
 'two',
 'daughters',
 'of',
 'a',
 'most',
 'affectionate',
 ',',
 'indulgent',
 'father',
 ';',
 'and',
 'had',
 ',',
 'in',
 'consequence',
 'of',
 'her',
 'sister',
 "'",
 's',
 'marriage',
 ',',
 'been',
 'mistress',
 'of',
 'his',
 'house',
 'from',
 'a',
 'very',
 'early',
 'period',
 '.']

In [15]:
# Token 14 of that sentence is again 'father'.
gberg_sents[4][14]


Out[15]:
'father'

Run word2vec


In [17]:
# Training is commented out because a previously saved model is loaded further down;
# uncomment to (re)train on the tokenized sentences.
# Settings: 64-dimensional vectors (size), skip-gram (sg=1), context window of 10,
# words seen fewer than 5 times dropped (min_count), fixed seed, 8 worker threads.
# model = Word2Vec(sentences=gberg_sents, size=64, sg=1, window=10, min_count=5, seed=42, workers=8)

In [18]:
# Uncomment (after training) to persist the model to the path that is loaded below.
# model.save('../raw_gutenberg_model.w2v')

Explore model


In [19]:
# Reuse the saved model when it exists (this skips re-training). Otherwise train
# with the notebook's hyperparameters and save the result, so that a fresh
# "Restart & Run All" works even when no model file has been written yet.
model_path = '../raw_gutenberg_model.w2v'
if os.path.exists(model_path):
    model = gensim.models.Word2Vec.load(model_path)
else:
    model = Word2Vec(sentences=gberg_sents, size=64, sg=1, window=10, min_count=5, seed=42, workers=8)
    model.save(model_path)

In [20]:
# Look up the learned vector for 'dog' through the model's KeyedVectors (model.wv);
# indexing the Word2Vec object directly is deprecated.
model.wv['dog']


Out[20]:
array([ 0.26904255, -0.1621359 ,  0.3750256 , -0.45720032,  0.11301365,
        0.38777879,  0.07985851, -0.41821676,  0.25089404,  0.33926705,
       -0.080161  , -0.41848078, -0.11926382,  0.05567036,  0.17746113,
        0.48711824, -0.07987826,  0.24794155,  0.51635629,  0.28091279,
       -0.02160198, -0.21664959, -0.16267581, -0.30657738, -0.05135779,
       -0.0717189 , -0.23059118,  0.39070779, -0.02148601, -0.02437739,
       -0.24497117, -0.21258108, -0.04940053,  0.47320694, -0.29593673,
       -0.3120383 , -0.16338396, -0.11775671,  0.09429431, -0.62936276,
        0.56831205, -0.04018871,  0.05976823,  0.29181743, -0.01939399,
        0.06972519, -0.29290241, -0.05240246,  0.26122624,  0.04284862,
       -0.10525419, -0.24352749,  0.34333584, -0.46437535,  0.81177765,
       -0.00473523, -0.38881841, -0.02673459, -0.40746167,  0.11519276,
        0.26032686,  0.12146576, -0.41793686,  0.24636635], dtype=float32)

In [21]:
# Length of a word vector, i.e. the dimensionality of the embedding space.
len(model.wv['dog'])


Out[21]:
64

In [22]:
# Nearest neighbours of 'dog'. Each score is a cosine similarity
# (higher = more similar), not a distance.
model.wv.most_similar('dog')


Out[22]:
[('puppy', 0.8137584328651428),
 ('broth', 0.7907859683036804),
 ('cage', 0.7828431725502014),
 ('sweeper', 0.7751598358154297),
 ('pig', 0.7609682679176331),
 ('pet', 0.7605292797088623),
 ('boy', 0.7512097358703613),
 ('cow', 0.7502828240394592),
 ('fox', 0.745104968547821),
 ('Truck', 0.7432427406311035)]

In [23]:
# Nearest neighbours of a verb.
model.wv.most_similar('think')


Out[23]:
[('manage', 0.849516749382019),
 ('suppose', 0.8426423072814941),
 ('know', 0.8389058709144592),
 ('contradict', 0.8207963705062866),
 ('NOW', 0.8158916234970093),
 ('Mamma', 0.8147774934768677),
 ('interfere', 0.8047748804092407),
 ('imagine', 0.8041163682937622),
 ('anyhow', 0.8036106824874878),
 ('believe', 0.8022602796554565)]

In [24]:
# Nearest neighbours of a time-related noun.
model.wv.most_similar('day')


Out[24]:
[('morning', 0.7969126105308533),
 ('night', 0.7783966064453125),
 ('time', 0.7478375434875488),
 ('month', 0.7393653392791748),
 ('week', 0.7346140742301941),
 ('evening', 0.704649806022644),
 ('feasting', 0.7016774415969849),
 ('Saturday', 0.6912297606468201),
 ('Adar', 0.6819364428520203),
 ('seventh', 0.675483226776123)]

In [25]:
# Nearest neighbours of a kinship term.
model.wv.most_similar('father')


Out[25]:
[('mother', 0.8784882426261902),
 ('brother', 0.8613675236701965),
 ('wife', 0.7934472560882568),
 ('sister', 0.7911010980606079),
 ('daughter', 0.785748302936554),
 ('Amnon', 0.776392936706543),
 ('Tamar', 0.7663865089416504),
 ('servant', 0.7563588619232178),
 ('uncle', 0.7395140528678894),
 ('bondwoman', 0.7374235391616821)]

In [26]:
# Follow up on 'broth', which appeared among the neighbours of 'dog'.
model.wv.most_similar('broth')


Out[26]:
[('poisoned', 0.8916468024253845),
 ('slice', 0.8743618130683899),
 ('basin', 0.8612580299377441),
 ('pepper', 0.8564265966415405),
 ('shell', 0.8563050031661987),
 ('shure', 0.8496631383895874),
 ('bun', 0.8453623056411743),
 ('Lightfoot', 0.8451728820800781),
 ('mandarin', 0.8446893095970154),
 ('cowslip', 0.8435923457145691)]

In [27]:
# Analogy by vector arithmetic: father - man + woman.
# Close, but not quite: the neighbours lean distinctly female, yet 'mother' is only fifth.
model.wv.most_similar(positive=['father', 'woman'], negative=['man'])


Out[27]:
[('sister', 0.7926232218742371),
 ('daughter', 0.7917730808258057),
 ('wife', 0.7815544605255127),
 ('husband', 0.7808158993721008),
 ('mother', 0.7753645181655884),
 ('brother', 0.7328757047653198),
 ('Tamar', 0.732427716255188),
 ('conceived', 0.717141330242157),
 ('Sarah', 0.7118659019470215),
 ('Rachel', 0.7106494903564453)]

In [29]:
# Analogy: king - man + woman. 'queen' does appear, but only at rank 31 of the top 50.
model.wv.most_similar(positive=['king', 'woman'], negative=['man'], topn=50)


Out[29]:
[('Rachel', 0.7507852911949158),
 ('Pharaoh', 0.7350609302520752),
 ('Sarah', 0.7345616817474365),
 ('Leah', 0.7254290580749512),
 ('Laban', 0.7232168912887573),
 ('Rebekah', 0.7184093594551086),
 ('Hagar', 0.7087153792381287),
 ('Padanaram', 0.7086805105209351),
 ('Abram', 0.7034566402435303),
 ('Bilhah', 0.6920945644378662),
 ('Solomon', 0.6878252029418945),
 ('Abimelech', 0.6848732233047485),
 ('Hamor', 0.6816117763519287),
 ('Esau', 0.6815595626831055),
 ('Zilpah', 0.6792290210723877),
 ('Jerubbaal', 0.6787564754486084),
 ('conceived', 0.6777492761611938),
 ('Onan', 0.674083411693573),
 ('daughter', 0.6740672588348389),
 ('Bethuel', 0.6726176142692566),
 ('Ephron', 0.6718195080757141),
 ('Sarai', 0.6691693067550659),
 ('damsel', 0.6690042018890381),
 ('Judah', 0.6685984134674072),
 ('Shechem', 0.6679830551147461),
 ('birthright', 0.6656962037086487),
 ('Lot', 0.6613132953643799),
 ('household', 0.6583735346794128),
 ('Mephibosheth', 0.6569991707801819),
 ('Babylon', 0.6507256031036377),
 ('queen', 0.6497037410736084),
 ('Heth', 0.6490903496742249),
 ('Tamar', 0.6490516662597656),
 ('Jerusalem', 0.6476879119873047),
 ('Hanun', 0.644147515296936),
 ('Samaria', 0.6416412591934204),
 ('kindred', 0.6413353681564331),
 ('Jethro', 0.6407186985015869),
 ('Benhadad', 0.640671968460083),
 ('Rahab', 0.6401610374450684),
 ('Gerar', 0.6396584510803223),
 ('Hittite', 0.6393617391586304),
 ('Canaan', 0.6370488405227661),
 ('David', 0.6362689733505249),
 ('Caleb', 0.6357195377349854),
 ('Esther', 0.6332159042358398),
 ('Jephunneh', 0.6326543688774109),
 ('concubine', 0.6308900713920593),
 ('Naboth', 0.6306082010269165),
 ('Asa', 0.6302342414855957)]

In [ ]:
# Impressive for such a small data set, especially with no cleaning at all
# (e.g., no lower-casing, which is covered next).

Reduce word vector dimensionality with t-SNE


In [30]:
# Vocabulary mapping: token -> gensim Vocab entry.
# NOTE(review): this displays the entire dict, one line per token; consider
# len(model.wv.vocab) or a small sample if the output gets unwieldy.
model.wv.vocab


Out[30]:
{'[': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84a58>,
 'Emma': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84278>,
 'by': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84978>,
 'Jane': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84550>,
 ']': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84860>,
 'I': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac84940>,
 'CHAPTER': <gensim.models.keyedvectors.Vocab at 0x7f4c1bf62048>,
 'Woodhouse': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57be0>,
 ',': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57518>,
 'handsome': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab570b8>,
 'clever': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57d68>,
 'and': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57dd8>,
 'rich': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57e48>,
 'with': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab579b0>,
 'a': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab574e0>,
 'comfortable': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab574a8>,
 'home': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57240>,
 'happy': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab576d8>,
 'disposition': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57ba8>,
 'seemed': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57668>,
 'to': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab577f0>,
 'unite': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab575c0>,
 'some': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57f98>,
 'of': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57978>,
 'the': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57f28>,
 'best': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab572b0>,
 'blessings': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57780>,
 'existence': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57b00>,
 ';': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57748>,
 'had': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57c50>,
 'lived': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57438>,
 'nearly': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab572e8>,
 'twenty': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57588>,
 '-': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab57f60>,
 'one': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832cf8>,
 'years': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8329e8>,
 'in': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8321d0>,
 'world': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832550>,
 'very': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8326d8>,
 'little': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832518>,
 'distress': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832128>,
 'or': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8327f0>,
 'vex': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832da0>,
 'her': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832278>,
 '.': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832e10>,
 'She': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832588>,
 'was': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832f98>,
 'youngest': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832a20>,
 'two': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832f60>,
 'daughters': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8322e8>,
 'most': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8329b0>,
 'affectionate': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832048>,
 'indulgent': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832a90>,
 'father': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832240>,
 'consequence': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832780>,
 'sister': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832ba8>,
 "'": <gensim.models.keyedvectors.Vocab at 0x7f4c1b832860>,
 's': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832be0>,
 'marriage': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832c18>,
 'been': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832208>,
 'mistress': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832ef0>,
 'his': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832358>,
 'house': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832438>,
 'from': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8327b8>,
 'early': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8324a8>,
 'period': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832b70>,
 'Her': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832d68>,
 'mother': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832320>,
 'died': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832198>,
 'too': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832e80>,
 'long': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832d30>,
 'ago': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832b38>,
 'for': <gensim.models.keyedvectors.Vocab at 0x7f4c1b832400>,
 'have': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b828>,
 'more': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6ba90>,
 'than': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6bd30>,
 'an': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6bf60>,
 'remembrance': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6bc50>,
 'caresses': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b9b0>,
 'place': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b6a0>,
 'supplied': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6bdd8>,
 'excellent': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b160>,
 'woman': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b208>,
 'as': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6bac8>,
 'governess': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6b3c8>,
 'who': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88198>,
 'fallen': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88978>,
 'short': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88860>,
 'affection': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac880f0>,
 'Sixteen': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88a20>,
 'Miss': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88e10>,
 'Taylor': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88f98>,
 'Mr': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac886d8>,
 'family': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88ef0>,
 'less': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88780>,
 'friend': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88f60>,
 'fond': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88e80>,
 'both': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac887b8>,
 'but': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88208>,
 'particularly': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88cf8>,
 'Between': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88320>,
 'it': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88240>,
 'intimacy': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac88da0>,
 'sisters': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac885f8>,
 'Even': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34d68>,
 'before': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34eb8>,
 'ceased': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34e48>,
 'hold': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34ba8>,
 'office': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34160>,
 'mildness': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34198>,
 'temper': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34c88>,
 'hardly': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa346a0>,
 'allowed': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa34080>,
 'impose': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c2e8>,
 'any': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c7b8>,
 'restraint': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c898>,
 'shadow': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c470>,
 'authority': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c1d0>,
 'being': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c5c0>,
 'now': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cb38>,
 'passed': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c8d0>,
 'away': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c128>,
 'they': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cd68>,
 'living': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c400>,
 'together': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cba8>,
 'mutually': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c358>,
 'attached': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c6a0>,
 'doing': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c080>,
 'just': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c048>,
 'what': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cda0>,
 'she': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c780>,
 'liked': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3ce10>,
 'highly': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cfd0>,
 'judgment': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c630>,
 'directed': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c908>,
 'chiefly': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c518>,
 'own': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c0f0>,
 'The': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cb00>,
 'real': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c198>,
 'evils': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c2b0>,
 'indeed': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3ca90>,
 'situation': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c5f8>,
 'were': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3cdd8>,
 'power': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3ccc0>,
 'having': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c588>,
 'rather': <gensim.models.keyedvectors.Vocab at 0x7f4c1aa3c9e8>,
 'much': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6fcf8>,
 'way': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f940>,
 'think': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f9e8>,
 'well': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f630>,
 'herself': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6fac8>,
 'these': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f8d0>,
 'which': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f208>,
 'threatened': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f9b0>,
 'alloy': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f128>,
 'many': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f518>,
 'enjoyments': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6fa90>,
 'danger': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f780>,
 'however': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6fdd8>,
 'at': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f278>,
 'present': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f978>,
 'so': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6ff60>,
 'unperceived': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f2e8>,
 'that': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6f908>,
 'did': <gensim.models.keyedvectors.Vocab at 0x7f4c1bd6fe80>,
 'not': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b828>,
 'means': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b320>,
 'rank': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b198>,
 'misfortunes': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2bac8>,
 'Sorrow': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b278>,
 'came': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2bd68>,
 '--': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b7b8>,
 'gentle': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2ba20>,
 'sorrow': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b5c0>,
 'all': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2be80>,
 'shape': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b5f8>,
 'disagreeable': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b0b8>,
 'consciousness': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2bbe0>,
 '.--': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b160>,
 'married': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b668>,
 'It': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b438>,
 'loss': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2bc88>,
 'first': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b240>,
 'brought': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b400>,
 'grief': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab2b048>,
 'on': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1be80>,
 'wedding': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bf98>,
 'day': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bcf8>,
 'this': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b9e8>,
 'beloved': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b2b0>,
 'sat': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bbe0>,
 'mournful': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b668>,
 'thought': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bf28>,
 'continuance': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bda0>,
 'over': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b240>,
 'bride': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b898>,
 'people': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b978>,
 'gone': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b390>,
 'left': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b5c0>,
 'dine': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b1d0>,
 'no': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bf60>,
 'prospect': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b908>,
 'third': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bb00>,
 'cheer': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1be48>,
 'evening': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bd68>,
 'composed': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bb70>,
 'himself': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b0f0>,
 'sleep': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bcc0>,
 'after': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1beb8>,
 'dinner': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b6d8>,
 'usual': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b160>,
 'then': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1bc88>,
 'only': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b588>,
 'sit': <gensim.models.keyedvectors.Vocab at 0x7f4c1be1b4e0>,
 'lost': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabd68>,
 'event': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab7b8>,
 'every': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab5f8>,
 'promise': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab940>,
 'happiness': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabf98>,
 'Weston': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabe10>,
 'man': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabfd0>,
 'unexceptionable': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabb70>,
 'character': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab8d0>,
 'easy': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab898>,
 'fortune': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab3c8>,
 'suitable': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab240>,
 'age': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab978>,
 'pleasant': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab668>,
 'manners': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab320>,
 'there': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab0b8>,
 'satisfaction': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdaba58>,
 'considering': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabc18>,
 'self': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdabdd8>,
 'denying': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab588>,
 'generous': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab630>,
 'friendship': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab9b0>,
 'always': <gensim.models.keyedvectors.Vocab at 0x7f4c1bdab048>,
 'wished': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adc50>,
 'promoted': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad470>,
 'match': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adb38>,
 'black': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad9e8>,
 'morning': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad6d8>,
 'work': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adef0>,
 'want': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad0b8>,
 'would': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad7b8>,
 'be': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad8d0>,
 'felt': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad5f8>,
 'hour': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad9b0>,
 'recalled': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adeb8>,
 'past': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9add30>,
 'kindness': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adbe0>,
 'sixteen': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad198>,
 'how': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad4a8>,
 'taught': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adcc0>,
 'played': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9addd8>,
 'five': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad0f0>,
 'old': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adda0>,
 'devoted': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad940>,
 'powers': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad208>,
 'attach': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad048>,
 'amuse': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad550>,
 'health': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adf28>,
 'nursed': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad320>,
 'through': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad4e0>,
 'various': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ada90>,
 'childhood': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ade10>,
 'A': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adac8>,
 'large': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad390>,
 'debt': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad7f0>,
 'gratitude': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adc18>,
 'owing': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9adb70>,
 'here': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9add68>,
 'intercourse': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad668>,
 'last': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad358>,
 'seven': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad630>,
 'equal': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9ad240>,
 'footing': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95ff28>,
 'perfect': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fb00>,
 'unreserve': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f4a8>,
 'soon': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fda0>,
 'followed': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f748>,
 'Isabella': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f390>,
 'their': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95ffd0>,
 'each': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f278>,
 'other': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f668>,
 'yet': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f080>,
 'dearer': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f3c8>,
 'recollection': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f780>,
 'companion': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fe10>,
 'such': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f550>,
 'few': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fb38>,
 'possessed': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fc88>,
 ':': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f2e8>,
 'intelligent': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f240>,
 'informed': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f860>,
 'useful': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fcf8>,
 'knowing': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f5c0>,
 'ways': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f400>,
 'interested': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f588>,
 'its': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f208>,
 'concerns': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f9b0>,
 'peculiarly': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f5f8>,
 'pleasure': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fef0>,
 'scheme': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f048>,
 'hers': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f518>,
 'whom': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f6a0>,
 'could': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f198>,
 'speak': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f710>,
 'arose': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f128>,
 'never': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fbe0>,
 'find': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95fd30>,
 'fault': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f2b0>,
 'How': <gensim.models.keyedvectors.Vocab at 0x7f4c1a95f8d0>,
 'bear': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b208>,
 'change': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b358>,
 '?--': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b278>,
 'true': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bba8>,
 'going': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b5f8>,
 'half': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3be10>,
 'mile': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bf28>,
 'them': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b7b8>,
 'aware': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3ba20>,
 'great': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b940>,
 'must': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b908>,
 'difference': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b6a0>,
 'between': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bf98>,
 'Mrs': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b6d8>,
 'advantages': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b438>,
 'natural': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b080>,
 'domestic': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b828>,
 'suffering': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bb70>,
 'intellectual': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bda0>,
 'solitude': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bcf8>,
 'dearly': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b518>,
 'loved': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b128>,
 'he': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bd68>,
 'He': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b978>,
 'meet': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b898>,
 'conversation': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3ba58>,
 'rational': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b5c0>,
 'playful': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bc50>,
 'evil': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bd30>,
 'actual': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b9e8>,
 'disparity': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bbe0>,
 'ages': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b4e0>,
 '(': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b7f0>,
 ')': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bdd8>,
 'increased': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b0f0>,
 'constitution': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b668>,
 'habits': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3bfd0>,
 'life': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b9b0>,
 'without': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac3b8d0>,
 'activity': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32860>,
 'mind': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32128>,
 'body': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac325c0>,
 'older': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32c88>,
 'though': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32208>,
 'everywhere': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32438>,
 'friendliness': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac320f0>,
 'heart': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32eb8>,
 'amiable': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32ac8>,
 'talents': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32978>,
 'recommended': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32c18>,
 'him': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac329b0>,
 'time': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac327f0>,
 'comparatively': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32e10>,
 'removed': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32f98>,
 'matrimony': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32588>,
 'settled': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32ef0>,
 'London': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac322b0>,
 'miles': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32240>,
 'off': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32630>,
 'beyond': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32518>,
 'daily': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32780>,
 'reach': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32e48>,
 'October': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32080>,
 'November': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32ba8>,
 'struggled': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32898>,
 'Hartfield': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac326a0>,
 'Christmas': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac324e0>,
 'next': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32f28>,
 'visit': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac322e8>,
 'husband': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32f60>,
 'children': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32470>,
 'fill': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32d30>,
 'give': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32908>,
 'society': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32390>,
 'again': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac327b8>,
 'Highbury': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac329e8>,
 'populous': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32358>,
 'village': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32400>,
 'almost': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32198>,
 'town': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac32a90>,
 'spite': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7b70>,
 'separate': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7da0>,
 'lawn': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7e10>,
 'shrubberies': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7390>,
 'name': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac76d8>,
 'really': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7470>,
 'belong': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7668>,
 'afforded': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7828>,
 'equals': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7048>,
 'All': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac78d0>,
 'looked': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7978>,
 'up': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7c18>,
 'acquaintance': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7128>,
 'universally': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7f60>,
 'civil': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7fd0>,
 'among': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac7518>,
 'accepted': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac70b8>,
 'even': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac71d0>,
 'melancholy': <gensim.models.keyedvectors.Vocab at 0x7f4c1aac72e8>,
 'sigh': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab491d0>,
 'wish': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49208>,
 'impossible': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49358>,
 'things': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49630>,
 'till': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab495f8>,
 'awoke': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab499e8>,
 'made': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49128>,
 'necessary': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab499b0>,
 'cheerful': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49588>,
 'His': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49b70>,
 'spirits': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49160>,
 'required': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49ba8>,
 'support': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49a20>,
 'nervous': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49b38>,
 'easily': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49710>,
 'depressed': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49c50>,
 'used': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49320>,
 'hating': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab490b8>,
 'part': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab494a8>,
 'kind': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab494e0>,
 'origin': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab497b8>,
 'reconciled': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab498d0>,
 'daughter': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49ac8>,
 'marrying': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab495c0>,
 'nor': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49048>,
 'ever': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49f60>,
 'compassion': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49ef0>,
 'entirely': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49978>,
 'when': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49518>,
 'obliged': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49cf8>,
 'selfishness': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab496d8>,
 'able': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49dd8>,
 'suppose': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49d30>,
 'feel': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49860>,
 'differently': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49908>,
 'disposed': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49828>,
 'done': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab493c8>,
 'sad': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab49cc0>,
 'thing': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8607f0>,
 'deal': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860e80>,
 'happier': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860ef0>,
 'if': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860828>,
 'spent': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860be0>,
 'rest': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860ac8>,
 'smiled': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860e10>,
 'cheerfully': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860550>,
 'keep': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860978>,
 'thoughts': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860198>,
 'tea': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860588>,
 'say': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860470>,
 'exactly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860518>,
 'said': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860240>,
 '"': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860ba8>,
 'Poor': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860780>,
 '!--': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8608d0>,
 'What': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860fd0>,
 'pity': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8605c0>,
 'is': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860f28>,
 '!"': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860b38>,
 'cannot': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860b00>,
 'agree': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8609e8>,
 'you': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8604e0>,
 'papa': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860860>,
 'know': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860d30>,
 'good': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860a20>,
 'humoured': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8604a8>,
 'thoroughly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860c18>,
 'deserves': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860da0>,
 'wife': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860a58>,
 ';--': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860cf8>,
 'live': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860080>,
 'us': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8606d8>,
 'my': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860cc0>,
 'odd': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860630>,
 'humours': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860898>,
 'might': <gensim.models.keyedvectors.Vocab at 0x7f4c1b860eb8>,
 '?"': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a710>,
 'But': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a828>,
 'where': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a358>,
 'advantage': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a898>,
 '?': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93af60>,
 'This': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a2e8>,
 'three': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a5c0>,
 'times': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a3c8>,
 'And': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a8d0>,
 'dear': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a668>,
 '."': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93af98>,
 'often': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a6d8>,
 'we': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93aac8>,
 'shall': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a6a0>,
 'see': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93ae10>,
 'coming': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a9e8>,
 'We': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a400>,
 'meeting': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a7f0>,
 '!': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a7b8>,
 'begin': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a748>,
 'go': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93ab38>,
 'pay': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93ad30>,
 'My': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93acf8>,
 'am': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a1d0>,
 'get': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a240>,
 'far': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93aa20>,
 'Randalls': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a278>,
 'distance': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93aba8>,
 'walk': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93ae80>,
 'No': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a208>,
 'nobody': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93ae48>,
 'your': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a518>,
 'walking': <gensim.models.keyedvectors.Vocab at 0x7f4c1b93a048>,
 'carriage': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e390>,
 'sure': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e7f0>,
 'James': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e320>,
 'will': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6eda0>,
 'like': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6ee80>,
 'put': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e898>,
 'horses': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e358>,
 'are': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab6e1d0>,
 'poor': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa390>,
 'while': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa5f8>,
 'paying': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa8d0>,
 'our': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa668>,
 'They': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa278>,
 'into': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa7b8>,
 'stable': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa940>,
 'You': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa1d0>,
 'already': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aab38>,
 'talked': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aab00>,
 'night': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aae80>,
 'may': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aaf98>,
 'because': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa240>,
 'doubt': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa710>,
 'whether': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aae10>,
 'take': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa160>,
 'anywhere': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa4e0>,
 'else': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa6d8>,
 'That': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aaa58>,
 'got': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aaba8>,
 'Hannah': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa978>,
 'Nobody': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa7f0>,
 'mentioned': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aaac8>,
 'glad': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa9b0>,
 'lucky': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aafd0>,
 'slighted': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa128>,
 'upon': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa860>,
 'account': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa780>,
 'make': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aadd8>,
 'servant': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa080>,
 'pretty': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa2b0>,
 'spoken': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aad30>,
 'girl': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa748>,
 'opinion': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa908>,
 'Whenever': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aa320>,
 'asks': <gensim.models.keyedvectors.Vocab at 0x7f4c1a9aaeb8>,
 'me': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfbe0>,
 'do': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfdd8>,
 'manner': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfc88>,
 'needlework': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfd68>,
 'observe': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfba8>,
 'turns': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfe48>,
 'lock': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfef0>,
 'door': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcffd0>,
 'right': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcff98>,
 'comfort': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfcf8>,
 'somebody': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcfe10>,
 'about': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf0b8>,
 'goes': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf160>,
 'hearing': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf358>,
 'tell': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf128>,
 'spared': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf1d0>,
 'exertions': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf4a8>,
 'maintain': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf2b0>,
 'flow': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf438>,
 'ideas': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf470>,
 'hoped': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf588>,
 'help': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf390>,
 'tolerably': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf3c8>,
 'attacked': <gensim.models.keyedvectors.Vocab at 0x7f4c1afcf4e0>,
 'regrets': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09630>,
 'table': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09940>,
 'placed': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09438>,
 'visitor': <gensim.models.keyedvectors.Vocab at 0x7f4c1be091d0>,
 'immediately': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09278>,
 'afterwards': <gensim.models.keyedvectors.Vocab at 0x7f4c1be092b0>,
 'walked': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09710>,
 'unnecessary': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09d30>,
 'Knightley': <gensim.models.keyedvectors.Vocab at 0x7f4c1be098d0>,
 'sensible': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09fd0>,
 'eight': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09518>,
 'thirty': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09a20>,
 'intimate': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09358>,
 'connected': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09080>,
 'elder': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09198>,
 'brother': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09160>,
 'frequent': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09b00>,
 'welcome': <gensim.models.keyedvectors.Vocab at 0x7f4c1be096d8>,
 'directly': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09cc0>,
 'mutual': <gensim.models.keyedvectors.Vocab at 0x7f4c1be094a8>,
 'connexions': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09c18>,
 'returned': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09e80>,
 'late': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09cf8>,
 'days': <gensim.models.keyedvectors.Vocab at 0x7f4c1be093c8>,
 'absence': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09898>,
 'Brunswick': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09a58>,
 'Square': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09c50>,
 'circumstance': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09eb8>,
 'animated': <gensim.models.keyedvectors.Vocab at 0x7f4c1be097b8>,
 'inquiries': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09390>,
 'answered': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09c88>,
 'When': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09400>,
 'gratefully': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09b38>,
 'observed': <gensim.models.keyedvectors.Vocab at 0x7f4c1be092e8>,
 'come': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09588>,
 'out': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09f60>,
 'call': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09f98>,
 'afraid': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09be0>,
 'shocking': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09048>,
 'Not': <gensim.models.keyedvectors.Vocab at 0x7f4c1be097f0>,
 'sir': <gensim.models.keyedvectors.Vocab at 0x7f4c1be099e8>,
 'beautiful': <gensim.models.keyedvectors.Vocab at 0x7f4c1be09908>,
 'moonlight': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2da90>,
 'mild': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d8d0>,
 'draw': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d0f0>,
 'back': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2ddd8>,
 'fire': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d438>,
 'found': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d198>,
 'damp': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d0b8>,
 'dirty': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d668>,
 'catch': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d390>,
 'cold': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d358>,
 'Look': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d320>,
 'shoes': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d6d8>,
 'Well': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d518>,
 'quite': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d860>,
 'surprising': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d828>,
 'vast': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d9e8>,
 'rain': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d908>,
 'rained': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d898>,
 'dreadfully': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d940>,
 'hard': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d588>,
 'breakfast': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d9b0>,
 'wanted': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2db00>,
 'By': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dcf8>,
 'bye': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dc88>,
 'joy': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dc50>,
 'Being': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dcc0>,
 'sort': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2db70>,
 'feeling': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dc18>,
 'hurry': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dba8>,
 'congratulations': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2df60>,
 'hope': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2de48>,
 'went': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2df98>,
 'behave': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d4a8>,
 'Who': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d710>,
 'cried': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2de10>,
 'Ah': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d780>,
 'Tis': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2d5f8>,
 'business': <gensim.models.keyedvectors.Vocab at 0x7f4c1af2dfd0>,
 'please': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839eb8>,
 'possibly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8390b8>,
 '`': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839470>,
 ".'": <gensim.models.keyedvectors.Vocab at 0x7f4c1b839780>,
 'regard': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8396a0>,
 'comes': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839da0>,
 'question': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839518>,
 'dependence': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839f28>,
 'independence': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839898>,
 'At': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839d30>,
 'rate': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839550>,
 'better': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839940>,
 '_one_': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839710>,
 'those': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8399e8>,
 'fanciful': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839ef0>,
 'troublesome': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8398d0>,
 'creature': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839c18>,
 'playfully': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839a20>,
 'head': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839438>,
 'certainly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8394e0>,
 'believe': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8395c0>,
 ',"': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8391d0>,
 'sometimes': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839dd8>,
 'dearest': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839c50>,
 'mean': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839400>,
 '_you_': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839c88>,
 'horrible': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8390f0>,
 'idea': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839be0>,
 'Oh': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839d68>,
 'meant': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839908>,
 'myself': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839320>,
 'loves': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8396d8>,
 'joke': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8397f0>,
 'another': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8392b0>,
 'fact': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839240>,
 'faults': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839278>,
 'told': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839ac8>,
 'agreeable': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8393c8>,
 'knew': <gensim.models.keyedvectors.Vocab at 0x7f4c1b839ba8>,
 'suspect': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e710>,
 'knows': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4eda0>,
 'flatter': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e9b0>,
 'reflection': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e4e0>,
 'has': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e6d8>,
 'persons': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e390>,
 'chances': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e828>,
 'willing': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4eb70>,
 'let': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4ecc0>,
 'pass': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4ed68>,
 '--"': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e438>,
 'hear': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e470>,
 'behaved': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e550>,
 'charmingly': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e400>,
 'Every': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e908>,
 'punctual': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4eeb8>,
 'looks': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4ee10>,
 'tear': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e9e8>,
 'face': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4e198>,
 'seen': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab4ee80>,
 'apart': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e518>,
 'Dear': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e080>,
 'bears': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e898>,
 'sorry': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e7b8>,
 'lose': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e198>,
 'miss': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e400>,
 'thinks': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e780>,
 'turned': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e860>,
 'divided': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e630>,
 'tears': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e2b0>,
 'smiles': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ec50>,
 'should': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eb70>,
 'acceptable': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e160>,
 'important': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e208>,
 'secure': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e710>,
 'provision': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ebe0>,
 'therefore': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e588>,
 'allow': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e748>,
 'pain': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e390>,
 'happily': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eef0>,
 'forgotten': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eda0>,
 'matter': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eeb8>,
 'considerable': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ecc0>,
 'four': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85edd8>,
 'proved': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ee10>,
 'marry': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e470>,
 'shook': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e6d8>,
 'fondly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eb38>,
 'replied': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e240>,
 'matches': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e940>,
 'foretell': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ef28>,
 'whatever': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85eba8>,
 'Pray': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ec88>,
 'none': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e358>,
 'greatest': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ee48>,
 'amusement': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e9b0>,
 'success': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85e0f0>,
 'widower': <gensim.models.keyedvectors.Vocab at 0x7f4c1b85ef60>,
 'perfectly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853278>,
 'constantly': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853320>,
 'occupied': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853f60>,
 'either': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853c18>,
 'friends': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853cc0>,
 'wherever': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853cf8>,
 'need': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8536a0>,
 'spend': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853048>,
 'single': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853940>,
 'year': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853a20>,
 'alone': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853d30>,
 'Some': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853438>,
 'others': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853b00>,
 'son': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853b38>,
 'uncle': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853160>,
 'letting': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853400>,
 'solemn': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8537b8>,
 'nonsense': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853e10>,
 'subject': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8536d8>,
 'believed': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853a58>,
 'Ever': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853470>,
 'since': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853860>,
 'met': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853518>,
 'Broadway': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853f98>,
 'Lane': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853ba8>,
 'began': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8535c0>,
 'darted': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853ef0>,
 'gallantry': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8533c8>,
 'borrowed': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8537f0>,
 'Farmer': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8532e8>,
 'planned': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8530f0>,
 'blessed': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853748>,
 'instance': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853a90>,
 'leave': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853908>,
 'making': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853198>,
 'understand': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853668>,
 ',\'"': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853710>,
 'supposes': <gensim.models.keyedvectors.Vocab at 0x7f4c1b8534a8>,
 'endeavour': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853128>,
 'Your': <gensim.models.keyedvectors.Vocab at 0x7f4c1b853898>,
 'properly': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14860>,
 'delicately': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14c18>,
 'endeavouring': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14550>,
 'bring': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14b00>,
 'worthy': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14cf8>,
 'employment': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14f98>,
 'young': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14a58>,
 'lady': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14390>,
 'imagine': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14be0>,
 'planning': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14780>,
 'saying': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14ac8>,
 'yourself': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab147b8>,
 'idle': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14630>,
 ",'": <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14588>,
 'why': <gensim.models.keyedvectors.Vocab at 0x7f4c1ab14198>,
 'talk': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1080>,
 'Where': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1d30>,
 'merit': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1518>,
 'proud': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1550>,
 'guess': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1e48>,
 '_that_': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1278>,
 'can': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1f98>,
 'known': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1908>,
 'triumph': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1b38>,
 'cleverer': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1358>,
 'depend': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef12e8>,
 'merely': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1e80>,
 'luck': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1ba8>,
 'There': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1a20>,
 'talent': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1588>,
 'word': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1710>,
 'quarrel': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef12b0>,
 'claim': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef10f0>,
 'drawn': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1780>,
 'pictures': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef17f0>,
 'something': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1160>,
 'nothing': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1fd0>,
 'If': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef14a8>,
 'visits': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1da0>,
 'given': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef16a0>,
 'smoothed': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1ac8>,
 'matters': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1470>,
 'enough': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1668>,
 'comprehend': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1e10>,
 'open': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1f28>,
 'hearted': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef14e0>,
 'unaffected': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1c50>,
 'safely': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef19e8>,
 'manage': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef19b0>,
 'likely': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1a90>,
 'harm': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1b00>,
 'interference': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1748>,
 'rejoined': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef10b8>,
 'understanding': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef18d0>,
 'pray': <gensim.models.keyedvectors.Vocab at 0x7f4c1bef1438>,
 'silly': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c550>,
 'break': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c470>,
 'circle': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c080>,
 'grievously': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c828>,
 'Only': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c4e0>,
 'Elton': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cd30>,
 ',--': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c2e8>,
 'look': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cb70>,
 'whole': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cda0>,
 'fitted': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cac8>,
 'comfortably': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c710>,
 'shame': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c1d0>,
 'longer': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c780>,
 'joining': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c4a8>,
 'hands': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94ccc0>,
 'same': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cd68>,
 'service': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c668>,
 'shew': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cf98>,
 'attention': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94ca20>,
 'ask': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c320>,
 'dare': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c400>,
 'With': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94cdd8>,
 'laughing': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c0b8>,
 'fish': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c358>,
 'chicken': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94ceb8>,
 'chuse': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c3c8>,
 'Depend': <gensim.models.keyedvectors.Vocab at 0x7f4c1a94c048>,
 'six': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90ceb8>,
 'care': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c780>,
 'II': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c630>,
 'native': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c208>,
 'born': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c978>,
 'respectable': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c7b8>,
 'generations': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c438>,
 'rising': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c828>,
 'gentility': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90cb38>,
 'property': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c518>,
 'received': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c748>,
 'education': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c128>,
 'succeeding': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90cb00>,
 'small': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90ce10>,
 'become': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c9e8>,
 'indisposed': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c668>,
 'homely': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90c160>,
 'pursuits': <gensim.models.keyedvectors.Vocab at 0x7f4c1b90cdd8>,
 'brothers': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13208>,
 'engaged': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13e10>,
 'satisfied': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13e80>,
 'active': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13a20>,
 'social': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13978>,
 'entering': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13a90>,
 'militia': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13a58>,
 'county': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13d30>,
 'embodied': <gensim.models.keyedvectors.Vocab at 0x7f4c1be136a0>,
 'Captain': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13048>,
 'general': <gensim.models.keyedvectors.Vocab at 0x7f4c1be136d8>,
 'favourite': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13b70>,
 'military': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13828>,
 'introduced': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13e48>,
 'Churchill': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13780>,
 'Yorkshire': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13160>,
 'fell': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13c50>,
 'love': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13dd8>,
 'surprized': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13320>,
 'except': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13eb8>,
 'full': <gensim.models.keyedvectors.Vocab at 0x7f4c1be130f0>,
 'pride': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13630>,
 'importance': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13cf8>,
 'connexion': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13710>,
 'offend': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13b38>,
 'command': <gensim.models.keyedvectors.Vocab at 0x7f4c1be134e0>,
 'bore': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13358>,
 'proportion': <gensim.models.keyedvectors.Vocab at 0x7f4c1be139e8>,
 'estate': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13390>,
 'took': <gensim.models.keyedvectors.Vocab at 0x7f4c1be135c0>,
 'infinite': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13ac8>,
 'mortification': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13c88>,
 'threw': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13748>,
 'due': <gensim.models.keyedvectors.Vocab at 0x7f4c1be137f0>,
 'decorum': <gensim.models.keyedvectors.Vocab at 0x7f4c1be13da0>,
 'unsuitable': <gensim.models.keyedvectors.Vocab at 0x7f4c1be134a8>,
 'produce': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a860>,
 'ought': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ab38>,
 'whose': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ac88>,
 'warm': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8aef0>,
 'sweet': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ab00>,
 'return': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ac50>,
 'goodness': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a080>,
 'spirit': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a9e8>,
 'resolution': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a7b8>,
 'pursue': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ad68>,
 'refrain': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a1d0>,
 'unreasonable': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a5f8>,
 'anger': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a6a0>,
 'missing': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a2b0>,
 'former': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ac18>,
 'income': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8afd0>,
 'still': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8aa58>,
 'comparison': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a550>,
 'Enscombe': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8aa20>,
 'cease': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8ada0>,
 'once': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8aeb8>,
 'considered': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a710>,
 'especially': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a8d0>,
 'Churchills': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8acc0>,
 'amazing': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a7f0>,
 'worst': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a278>,
 'bargain': <gensim.models.keyedvectors.Vocab at 0x7f4c1be8a9b0>,
 'poorer': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac58828>,
 'child': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac58518>,
 'From': <gensim.models.keyedvectors.Vocab at 0x7f4c1ac58ef0>,
 'expense': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeae48>,
 'relieved': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeadd8>,
 'boy': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeae80>,
 'additional': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea4e0>,
 'softening': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea198>,
 'lingering': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea358>,
 'illness': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea438>,
 'reconciliation': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea0b8>,
 'kindred': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea2e8>,
 'offered': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea2b0>,
 'charge': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea1d0>,
 'Frank': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea940>,
 'decease': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea320>,
 'scruples': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeacf8>,
 'reluctance': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea908>,
 'supposed': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea470>,
 'overcome': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeac18>,
 'considerations': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeaf60>,
 'wealth': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeac88>,
 'seek': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea3c8>,
 'improve': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea400>,
 'complete': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeabe0>,
 'became': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeaba8>,
 'desirable': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea518>,
 'quitted': <gensim.models.keyedvectors.Vocab at 0x7f4c1beeab38>,
 'trade': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea4a8>,
 'established': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea898>,
 'favourable': <gensim.models.keyedvectors.Vocab at 0x7f4c1beea0f0>,
 ...}

In [31]:
# Number of entries in the model's vocabulary mapping (one per distinct token).
len(model.wv.vocab)


Out[31]:
17011

In [ ]:
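# NOTE: the commented-out cells below record how the t-SNE coordinates were
# generated; the saved CSV is loaded in the next section instead (presumably
# because t-SNE is slow to re-run).
# X = model[model.wv.vocab]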

In [ ]:
# tsne = TSNE(n_components=2, n_iter=1000) # 200 is minimum iter; default is 1000

In [ ]:
# X_2d = tsne.fit_transform(X)

In [ ]:
# coords_df = pd.DataFrame(X_2d, columns=['x','y'])
# coords_df['token'] = model.wv.vocab.keys()

In [ ]:
# Path matches the pd.read_csv call in the visualization section below.
# coords_df.to_csv('./raw_gutenberg_tsne.csv', index=False)

Visualize 2D representation of word vectors


In [32]:
# Load the precomputed 2D coordinates (columns: x, y, token) rather than re-running t-SNE.
coords_df = pd.read_csv('./raw_gutenberg_tsne.csv')

In [34]:
# Preview the first rows to confirm the x / y / token columns loaded.
coords_df.head()


Out[34]:
x y token
0 4.736166 0.330797 [
1 2.382989 -4.162857 Emma
2 -5.468009 -2.095312 by
3 2.030853 -4.465032 Jane
4 4.746364 0.328226 ]

In [33]:
# Static overview of every token's 2D position; small, translucent markers
# keep the densely packed regions distinguishable. Assigning to `_` suppresses
# the Axes repr in the cell output.
_ = coords_df.plot.scatter(
    x='x',
    y='y',
    figsize=(12, 12),
    marker='.',
    s=10,
    alpha=0.2,
)



In [35]:
output_notebook() # configure Bokeh to render its plots inline in this notebook


Loading BokehJS ...

In [36]:
# Draw a random 5000-row subset of the token coordinates for the labelled plot
# (presumably to keep the text glyphs readable and the plot responsive).
# A fixed random_state makes the same rows come back on every Restart & Run All.
subset_df = coords_df.sample(n=5000, random_state=42)

In [37]:
# Build an 800x800 Bokeh figure and draw each sampled token as a text label at
# its 2D coordinates. `width`/`height` are used instead of `plot_width`/
# `plot_height`, which Bokeh 3.0+ no longer accepts.
p = figure(width=800, height=800)
_ = p.text(x=subset_df.x, y=subset_df.y, text=subset_df.token)

In [38]:
# Display the Bokeh figure `p` in the notebook output.
show(p)



In [ ]: