In [1]:
from everything import * # https://github.com/fnielsen/everything
In [2]:
from dasem.dannet import Dannet
In [3]:
dannet = Dannet()
In [4]:
# Query for sentiment words in DanNet
query = """
select label, value
from (select sa.synset_id, sa.value
from synset_attributes sa
where sa.type = 'connotation'), synsets as s
where s.id = synset_id
"""
df = dannet.db.query(query)
df.head()
Indexing schema. This will take a second...finished!
Out[4]:
label
value
0
{børnehave_1_3}
negative
1
{mafia_1_2}
negative
2
{sammenrend_1; sammensurium_1}
negative
3
{tingeltangel_1}
negative
4
{kongerække_1_1}
positive
In [5]:
# Extract words from the label
dannet_words = {}
for idx, row in df.iterrows():
synset_words = row['label'].split(';')
for word in synset_words:
dannet_words[word[1:].split('_')[0]] = row['value']
In [6]:
# Compare with development version of AFINN
try:
missing_words, swapped_words = [], []
filename = expanduser('~/fnielsen/data/Nielsen2011Sentiment_afinndk.txt')
afinn = read_csv(filename, sep='\t', encoding='utf-8', header=None)
for dannet_word, dannet_valence in dannet_words.iteritems():
if dannet_word not in afinn[0].values:
missing_words.append((dannet_word, dannet_valence))
else:
afinn_valence = afinn.ix[afinn[0]==dannet_word, 1].values[0]
if ((dannet_valence == 'positive' and afinn_valence < 0) or
(dannet_valence == 'negative' and afinn_valence > 0)):
swapped_words.append((dannet_word, dannet_valence))
pprint(sorted(swapped_words))
pprint(sorted(missing_words))
except:
pass
[(u'dr\xf8mme', u'negative')]
[(u'agterlanterne', u'negative'),
(u'amazone', u'positive'),
(u'andenklassesborger', u'negative'),
(u'andenrangsborger', u'negative'),
(u'angloman', u'negative'),
(u'antikvitet', u'negative'),
(u'arbejdsnarkoman', u'negative'),
(u'artist', u'positive'),
(u'auteur', u'positive'),
(u'avisskriveri', u'negative'),
(u'baby', u'positive'),
(u'badenymfe', u'positive'),
(u'bamse', u'yes'),
(u'bamsefar', u'yes'),
(u'bandit', u'negative'),
(u'barnerumpe', u'negative'),
(u'barner\xf8v', u'negative'),
(u'baryler', u'negative'),
(u'bedsteborger', u'negative'),
(u'behagelighed', u'positive'),
(u'bengel', u'negative'),
(u'ber\xf8mthed', u'positive'),
(u'besk', u'negative'),
(u'betonbyggeri', u'negative'),
(u'betonkasse', u'negative'),
(u'betonklods', u'negative'),
(u'betonsilo', u'negative'),
(u'biks,1', u'negative'),
(u'billig', u'negative'),
(u'bisse,1', u'negative'),
(u'blegn\xe6b', u'negative'),
(u'blodsuger', u'negative'),
(u'blomsterflor', u'positive'),
(u'bl\xe5str\xf8mpe', u'negative'),
(u'bl\xe6ksprutte', u'positive'),
(u'bl\xe6rer\xf8v', u'negative'),
(u'bl\xf8ddyr', u'negative'),
(u'boldspiller', u'positive'),
(u'bolighaj', u'negative'),
(u'boligspekulant', u'negative'),
(u'bolsje', u'negative'),
(u'bolv\xe6rksmatros', u'negative'),
(u'bondefanger', u'negative'),
(u'bondetamp', u'negative'),
(u'bongop\xe6dagog', u'negative'),
(u'bonsai', u'yes'),
(u'bonsaitr\xe6', u'yes'),
(u'borgerdyr', u'negative'),
(u'bras,1', u'negative'),
(u'brokkasse', u'negative'),
(u'br\xe6nde,2', u'positive'),
(u'buk,1', u'negative'),
(u'bulderbasse', u'negative'),
(u'bulldozer', u'negative'),
(u'bums,3', u'negative'),
(u'bundskraber', u'negative'),
(u'bussemand', u'negative'),
(u'byld', u'negative'),
(u'bytte,1', u'negative'),
(u'b\xe6nkevarmer', u'negative'),
(u'b\xe6rme', u'negative'),
(u'b\xf8ddel', u'yes'),
(u'b\xf8hland', u'negative'),
(u'b\xf8lle,1', u'negative'),
(u'b\xf8r,1', u'negative'),
(u'b\xf8rnehave', u'negative'),
(u'b\xf8rnelokker', u'negative'),
(u'b\xf8rnemishandler', u'negative'),
(u'b\xf8rsbaron', u'negative'),
(u'b\xf8rshaj', u'negative'),
(u'b\xf8rsspekulant', u'negative'),
(u'b\xf8rste,3', u'negative'),
(u'celebritet', u'positive'),
(u'chancerytter', u'negative'),
(u'charlatan', u'negative'),
(u'chauvinist', u'negative'),
(u'damptromle', u'negative'),
(u'dandy', u'negative'),
(u'defaitist', u'negative'),
(u'degn', u'negative'),
(u'desperado', u'negative'),
(u'diktator', u'negative'),
(u'dilettant', u'negative'),
(u'dinosaurus', u'negative'),
(u'diplomat', u'positive'),
(u'distancebl\xe6nder', u'negative'),
(u'dj\xe6vel', u'negative'),
(u'dj\xe6velskab', u'negative'),
(u'dogmatiker', u'negative'),
(u'dompap', u'negative'),
(u'dosmer', u'negative'),
(u'dovenkrop', u'negative'),
(u'drenger\xf8v', u'negative'),
(u'drivhusplante', u'negative'),
(u'drivkraft', u'positive'),
(u'drog,1', u'negative'),
(u'drukm\xe5s', u'negative'),
(u'drys', u'negative'),
(u'dr\xe6bermaskine', u'negative'),
(u'dr\xf8m', u'positive'),
(u'dr\xf8mmeslot', u'positive'),
(u'dr\xf8nnert', u'negative'),
(u'due', u'positive'),
(u'dukke,1', u'negative'),
(u'duksedreng', u'negative'),
(u'dulle', u'negative'),
(u'dumpekandidat', u'negative'),
(u'dv\xe6rg', u'negative'),
(u'dydsdragon', u'negative'),
(u'dydsm\xf8nster', u'negative'),
(u'dyr,1', u'negative'),
(u'd\xe5re,1', u'negative'),
(u'd\xe5se', u'negative'),
(u'd\xf8dbider', u'negative'),
(u'd\xf8genigt', u'negative'),
(u'd\xf8gnflue', u'negative'),
(u'efterplaprer', u'negative'),
(u'eftersnakker', u'negative'),
(u'eftersp\xf8rge', u'positive'),
(u'eftertragte', u'positive'),
(u'egocentriker', u'negative'),
(u'egotripper', u'negative'),
(u'elitebilist', u'positive'),
(u'eunuk', u'negative'),
(u'evne,1', u'positive'),
(u'fagforeningspamper', u'negative'),
(u'falskneri', u'negative'),
(u'fantast', u'negative'),
(u'faris\xe6er', u'negative'),
(u'fedtspiller', u'negative'),
(u'feinschmecker', u'positive'),
(u'fejlfinder', u'negative'),
(u'feltmadras', u'negative'),
(u'ferieparadis', u'positive'),
(u'fidusmager', u'negative'),
(u'fiffikus', u'positive'),
(u'filister', u'negative'),
(u'finke', u'negative'),
(u'fisk,1', u'negative'),
(u'fisse', u'negative'),
(u'fisselette', u'negative'),
(u'fjollehoved', u'negative'),
(u'fjumrehoved', u'negative'),
(u'flab', u'negative'),
(u'fladpande', u'negative'),
(u'flakke,1', u'negative'),
(u'flane,1', u'negative'),
(u'flipproletar', u'negative'),
(u'flokdyr', u'negative'),
(u'flommeeurop\xe6er', u'negative'),
(u'flovmand', u'negative'),
(u'fluepapir', u'negative'),
(u'fl\xe6b', u'negative'),
(u'fl\xf8debolle', u'negative'),
(u'fl\xf8desk\xe6g', u'negative'),
(u'fl\xf8s', u'negative'),
(u'forbryderspire', u'negative'),
(u'forf\xf8rer', u'yes'),
(u'forgrundsfigur', u'positive'),
(u'formalist', u'negative'),
(u'formynder', u'negative'),
(u'forn\xe6rmelse', u'negative'),
(u'forr\xe6der', u'negative'),
(u'fortr\xe6ffelighed', u'positive'),
(u'fremmedlegeme', u'negative'),
(u'frille', u'positive'),
(u'fryns', u'negative'),
(u'fr\xe6kkert', u'negative'),
(u'fr\xf8\xe6der', u'negative'),
(u'fulderik', u'negative'),
(u'fumleg\xe6nger', u'negative'),
(u'fumler', u'negative'),
(u'fund', u'positive'),
(u'fundamentalist', u'negative'),
(u'furie', u'negative'),
(u'fusel', u'negative'),
(u'fuser', u'negative'),
(u'fyld', u'negative'),
(u'fyldeb\xf8tte', u'negative'),
(u'fyrt\xe5rn', u'positive'),
(u'fysiolog', u'yes'),
(u'f\xe5ret', u'negative'),
(u'f\xe6hoved', u'negative'),
(u'gadedreng', u'negative'),
(u'galanteri', u'negative'),
(u'galfrans', u'negative'),
(u'galgenfugl', u'negative'),
(u'gamin', u'negative'),
(u'gavflab', u'negative'),
(u'gentleman', u'positive'),
(u'gesj\xe6ft', u'negative'),
(u'gespenst', u'negative'),
(u'gigolo', u'negative'),
(u'gimpe,1', u'negative'),
(u'glut', u'positive'),
(u'gnavpotte', u'negative'),
(u'gnier', u'negative'),
(u'godtfolk', u'positive'),
(u'goliat', u'positive'),
(u'gorilla', u'negative'),
(u'grand old lady', u'positive'),
(u'grand old man', u'positive'),
(u'gratie', u'positive'),
(u'grib', u'negative'),
(u'grimrian', u'negative'),
(u'gris,1', u'negative'),
(u'grov\xe6der', u'negative'),
(u'grundejer', u'yes'),
(u'gr\xe6dekone', u'negative'),
(u'gr\xe6depil', u'negative'),
(u'gr\xe6sselig', u'negative'),
(u'gr\xf8ftegraver', u'negative'),
(u'gr\xf8nskolling', u'yes'),
(u'gud', u'positive'),
(u'gudedrik', u'positive'),
(u'gudinde', u'positive'),
(u'gudsbespotter', u'negative'),
(u'guf', u'positive'),
(u'guld', u'positive'),
(u'gulddreng', u'positive'),
(u'guldklump', u'positive'),
(u'gullaschbaron', u'negative'),
(u'guttermand', u'positive'),
(u'g\xe5s', u'negative'),
(u'g\xe6st', u'negative'),
(u'g\xf8geunge', u'negative'),
(u'haj', u'positive'),
(u'hakkebr\xe6t', u'negative'),
(u'haleneger', u'negative'),
(u'haltefanden', u'negative'),
(u'halvhjerne', u'negative'),
(u'handyr', u'positive'),
(u'hanekylling', u'negative'),
(u'hanrej', u'negative'),
(u'hare', u'negative'),
(u'harpe', u'negative'),
(u'havgasse', u'negative'),
(u'hejre,1', u'negative'),
(u'heks', u'negative'),
(u'helgen', u'positive'),
(u'helt,1', u'positive'),
(u'helteskikkelse', u'positive'),
(u'heltinde', u'positive'),
(u'helvedesmaskine', u'negative'),
(u'heros', u'positive'),
(u'hertug', u'negative'),
(u'himmerigsmundfuld', u'positive'),
(u'hjemmef\xf8dning', u'negative'),
(u'hjerne', u'positive'),
(u'hjernevrider', u'negative'),
(u'hjerte', u'yes'),
(u'hjerteknuser', u'yes'),
(u'hjertensk\xe6r', u'yes'),
(u'hofnar', u'yes'),
(u'hoforgan', u'negative'),
(u'hofsnog', u'negative'),
(u'horeunge', u'negative'),
(u'horkarl', u'negative'),
(u'hormonb\xf8f', u'negative'),
(u'hovednavn', u'positive'),
(u'hugaf', u'negative'),
(u'humanist', u'positive'),
(u'humorist', u'positive'),
(u'hum\xf8rbombe', u'positive'),
(u'hum\xf8rspiller', u'negative'),
(u'hum\xf8rspreder', u'positive'),
(u'hund,1', u'negative'),
(u'hundehandler', u'negative'),
(u'hundeklipper', u'negative'),
(u'hundj\xe6vel', u'negative'),
(u'husar', u'negative'),
(u'hvalp', u'negative'),
(u'hyggeonkel', u'positive'),
(u'hystade', u'negative'),
(u'h\xe5ndlanger', u'negative'),
(u'h\xe5ndv\xe6rker', u'positive'),
(u'h\xe5rkl\xf8ver', u'negative'),
(u'h\xe6dersmand', u'positive'),
(u'h\xe6ngehoved', u'negative'),
(u'h\xe6nger\xf8v', u'negative'),
(u'h\xe6ngetr\xe6', u'negative'),
(u'h\xf8nisse', u'negative'),
(u'ideal,1', u'positive'),
(u'idealist', u'positive'),
(u'idealkvinde', u'positive'),
(u'idol', u'positive'),
(u'ignorant,1', u'negative'),
(u'isjomfru', u'negative'),
(u'jasiger', u'negative'),
(u'jern', u'positive'),
(u'jernlady', u'positive'),
(u'judas', u'negative'),
(u'j\xf8dehader', u'negative'),
(u'kagekone', u'negative'),
(u'kakkelovnsr\xf8r', u'negative'),
(u'kandest\xf8ber', u'negative'),
(u'kanon,1', u'positive'),
(u'kapacitet', u'positive'),
(u'kapitalist', u'negative'),
(u'karklud', u'negative'),
(u'kastebold', u'negative'),
(u'katalysator', u'positive'),
(u'keeper', u'yes'),
(u'kendis', u'positive'),
(u'klamphugger', u'negative'),
(u'klamphuggerl\xe6ge', u'negative'),
(u'klaphat', u'negative'),
(u'klaptorsk', u'negative'),
(u'klassiker', u'positive'),
(u'klidmoster', u'negative'),
(u'klodrian', u'negative'),
(u'klods', u'negative'),
(u'klodsmajor', u'negative'),
(u'klud', u'negative'),
(u'kludder', u'negative'),
(u'klummer,1', u'negative'),
(u'klumpedumpe', u'negative'),
(u'kluns', u'negative'),
(u'knag,1', u'positive'),
(u'knoldesparker', u'negative'),
(u'knop', u'positive'),
(u'ko', u'negative'),
(u'kokette', u'negative'),
(u'kokotte,2', u'negative'),
(u'koleriker', u'negative'),
(u'kolos', u'negative'),
(u'komet', u'positive'),
(u'konge', u'positive'),
(u'konger\xe6kke', u'positive'),
(u'kontormus', u'negative'),
(u'kordreng', u'positive'),
(u'korthus', u'negative'),
(u'koryf\xe6', u'positive'),
(u'kostbarhed', u'positive'),
(u'krabat', u'negative'),
(u'kraftidiot', u'negative'),
(u'krakiler', u'negative'),
(u'kram,2', u'positive'),
(u'kran', u'negative'),
(u'kratlusker', u'negative'),
(u'kravl', u'negative'),
(u'krudtkarl', u'positive'),
(u'krudtt\xf8nde', u'positive'),
(u'krukke,1', u'negative'),
(u'kryb', u'negative'),
(u'krykhusar', u'negative'),
(u'kr\xe6', u'negative'),
(u'kr\xe6mmer', u'negative'),
(u'kr\xe6s', u'positive'),
(u'kr\xe6ve', u'negative'),
(u'kunnen', u'positive'),
(u'kunstv\xe6rk', u'positive'),
(u'kuv\xf8seguf', u'positive'),
(u'kvabso', u'negative'),
(u'kvabtorsk', u'negative'),
(u'kvaj', u'negative'),
(u'kvajpande', u'negative'),
(u'kvaksalver', u'negative'),
(u'kvalitet', u'positive'),
(u'kvartalsdranker', u'negative'),
(u'kv\xe6rulant', u'negative'),
(u'k\xe6lling', u'negative'),
(u'k\xe6ltring', u'negative'),
(u'k\xe6mpekvinde', u'negative'),
(u'k\xe6reste,1', u'yes'),
(u'k\xf8benhavnersnude', u'negative'),
(u'k\xf8dbjerg', u'negative'),
(u'k\xf8kkenskriver', u'negative'),
(u'laban', u'negative'),
(u'ladeport', u'negative'),
(u'lady', u'positive'),
(u'lakaj', u'negative'),
(u'lammesteg', u'positive'),
(u'lamseben', u'positive'),
(u'landsfader', u'positive'),
(u'lappeskr\xe6dder', u'negative'),
(u'laps', u'negative'),
(u'larve', u'positive'),
(u'las', u'negative'),
(u'lazaron', u'negative'),
(u'lebbe', u'negative'),
(u'lemmedasker', u'negative'),
(u'lig,1', u'negative'),
(u'lokker', u'negative'),
(u'lort,2', u'negative'),
(u'luskebuks', u'negative'),
(u'l\xe6kkerbid', u'positive'),
(u'l\xe6kkerbisken', u'positive'),
(u'l\xe6kkeri', u'positive'),
(u'l\xf8mmel', u'negative'),
(u'l\xf8vinde', u'positive'),
(u'madamme', u'negative'),
(u'madonna', u'positive'),
(u'mafia', u'negative'),
(u'mage,1', u'yes'),
(u'magtstr\xe6ber', u'negative'),
(u'mam', u'positive'),
(u'mammon', u'negative'),
(u'mappedyr', u'negative'),
(u'mark,1', u'negative'),
(u'mastodont', u'negative'),
(u'matrone', u'negative'),
(u'medusa', u'negative'),
(u'mestermand', u'yes'),
(u'metervare', u'negative'),
(u'mikrofonholder', u'negative'),
(u'mikroskop', u'yes'),
(u'misd\xe6der', u'negative'),
(u'moderdyr', u'negative'),
(u'monstrum', u'negative'),
(u'mundgodt', u'positive'),
(u'murmeldyr', u'negative'),
(u'museumsgenstand', u'negative'),
(u'museumsstykke', u'negative'),
(u'm\xe5lkonge', u'positive'),
(u'm\xe5lmager', u'positive'),
(u'm\xe5lmand', u'yes'),
(u'm\xe5lvogter', u'yes'),
(u'm\xe6r', u'negative'),
(u'm\xf8ghund', u'negative'),
(u'narkobaron', u'negative'),
(u'narrefisse', u'negative'),
(u'nathue', u'negative'),
(u'naziborg', u'negative'),
(u'nektar', u'positive'),
(u'nemme,1', u'positive'),
(u'nidding', u'negative'),
(u'nymfe', u'positive'),
(u'n\xf8glespiller', u'positive'),
(u'ogginok', u'negative'),
(u'oldsag', u'negative'),
(u'oldtidslevn', u'negative'),
(u'oldtidslevning', u'negative'),
(u'opkomling', u'negative'),
(u'original,1', u'negative'),
(u'overd\xe5dighed', u'positive'),
(u'pakke,1', u'positive'),
(u'pamper', u'negative'),
(u'papirnusser', u'negative'),
(u'papirnusseri', u'negative'),
(u'pariserr\xf8v', u'positive'),
(u'parvenu', u'negative'),
(u'pengepuger', u'negative'),
(u'perlek\xe6de', u'positive'),
(u'perlerad', u'positive'),
(u'perler\xe6kke', u'positive'),
(u'pestbyld', u'negative'),
(u'petitstof', u'negative'),
(u'pjalt', u'negative'),
(u'pjask', u'negative'),
(u'pjat', u'negative'),
(u'plagiat', u'negative'),
(u'plankev\xe6rkslytter', u'negative'),
(u'platugle', u'negative'),
(u'plimsoller', u'negative'),
(u'pragt', u'positive'),
(u'pragtstykke', u'positive'),
(u'pragtv\xe6rk', u'positive'),
(u'pram', u'negative'),
(u'prins', u'positive'),
(u'problembarn', u'negative'),
(u'profos', u'yes'),
(u'proselyt', u'negative'),
(u'pr\xe6station', u'positive'),
(u'pukkelryg', u'negative'),
(u'pullimut', u'negative'),
(u'pulverheks', u'negative'),
(u'p\xe5h\xe6ng', u'yes'),
(u'quisling', u'negative'),
(u'ragelse', u'negative'),
(u'rapand', u'positive'),
(u'rappenskralde', u'negative'),
(u'rejek\xe6lling', u'negative'),
(u'rendemaske', u'negative'),
(u'ridder', u'positive'),
(u'ringeagte', u'negative'),
(u'rivejern', u'negative'),
(u'rod,1', u'negative'),
(u'rottehul', u'negative'),
(u'rotterede', u'negative'),
(u'r\xe6dsel', u'negative'),
(u'r\xe6v', u'negative'),
(u'r\xf8verkule', u'negative'),
(u'r\xf8vpuler', u'negative'),
(u'sag', u'positive'),
(u'sammenkog', u'negative'),
(u'sammenrend', u'negative'),
(u'sammensurium', u'negative'),
(u'sans,1', u'positive'),
(u'satyr', u'negative'),
(u'sexbombe', u'positive'),
(u'sexkilling', u'positive'),
(u'sild', u'positive'),
(u'silo', u'negative'),
(u'siv', u'positive'),
(u'sjask,2', u'negative'),
(u'sjuske,1', u'negative'),
(u'skarpskytte', u'positive'),
(u'skat', u'positive'),
(u'skrammel', u'negative'),
(u'skribleri', u'negative'),
(u'skrubbe,1', u'negative'),
(u'skrud', u'positive'),
(u'skrummel', u'negative'),
(u'skude', u'negative'),
(u'skur', u'negative'),
(u'sk\xe5r', u'positive'),
(u'sk\xe6gabe', u'yes'),
(u'sk\xf8nheds\xe5benbaring', u'positive'),
(u'sk\xf8njomfru', u'positive'),
(u'sk\xf8rlevner', u'negative'),
(u'sk\xf8rtej\xe6ger', u'yes'),
(u'sladderblad', u'negative'),
(u'sladretaske', u'negative'),
(u'slaveanstalt', u'negative'),
(u'slavearbejde', u'negative'),
(u'slipsedreng', u'negative'),
(u'smudsblad', u'negative'),
(u'sm\xe5kravl', u'negative'),
(u'sm\xe6deskrift', u'negative'),
(u'snydepels', u'negative'),
(u'snydetamp', u'negative'),
(u'spejderdreng', u'negative'),
(u'spidsborger', u'negative'),
(u'spilde,2', u'negative'),
(u'spilford\xe6rver', u'negative'),
(u'spinatfugl', u'negative'),
(u'sportsfanatiker', u'negative'),
(u'sportsidiot', u'negative'),
(u'spradebasse', u'negative'),
(u'spritter', u'negative'),
(u'spr\xf8jt', u'negative'),
(u'spr\xf8jte,1', u'negative'),
(u'stabejs', u'negative'),
(u'starfucker', u'negative'),
(u'stav\xe6r', u'negative'),
(u'stemmekv\xe6g', u'negative'),
(u'stemmesamler', u'positive'),
(u'stemmesluger', u'positive'),
(u'stil\xf8velse', u'negative'),
(u'storebror', u'yes'),
(u'storspiller', u'positive'),
(u'stratenr\xf8ver', u'negative'),
(u'streng,1', u'positive'),
(u'strigle,1', u'negative'),
(u'st\xf8der', u'negative'),
(u'sultekost', u'negative'),
(u'superleder', u'positive'),
(u'supermand', u'positive'),
(u'sut,2', u'negative'),
(u'svigermor', u'positive'),
(u'sviner', u'negative'),
(u'svinger', u'positive'),
(u'sv\xe6kling', u'negative'),
(u'sv\xe6rv\xe6gter', u'positive'),
(u'syrehoved', u'negative'),
(u'syvsover', u'negative'),
(u's\xe6k', u'negative'),
(u's\xe6llert', u'positive'),
(u's\xe6rling', u'negative'),
(u's\xf8helt', u'positive'),
(u's\xf8ndagsbarn', u'positive'),
(u's\xf8ndagsbilist', u'negative'),
(u'talent,1', u'positive'),
(u'tallerkenneger', u'negative'),
(u'taskenspiller', u'negative'),
(u'tingeltangel', u'negative'),
(u'tornado', u'positive'),
(u'tosse,1', u'negative'),
(u'trivi', u'negative'),
(u'trivialroman', u'negative'),
(u'tro,2', u'positive'),
(u'trold', u'negative'),
(u'trussereder', u'negative'),
(u'trussetyv', u'yes'),
(u'tr\xe6dem\xf8lle', u'negative'),
(u'tr\xe6mand', u'negative'),
(u'tugthuskandidat', u'negative'),
(u'tumpe', u'negative'),
(u'turistparadis', u'positive'),
(u'tusindkunstner', u'positive'),
(u'tv-narkoman', u'negative'),
(u'tyran', u'negative'),
(u'tyskerh\xe5ndlanger', u'negative'),
(u't\xf8jte', u'negative'),
(u't\xf8lper', u'negative'),
(u't\xf8rvetriller', u'negative'),
(u't\xf8s', u'negative'),
(u't\xf8sedreng', u'negative'),
(u'udbytter', u'negative'),
(u'udhaler', u'negative'),
(u'umulius', u'negative'),
(u'underdog', u'negative'),
(u'underhund', u'negative'),
(u'underm\xe5ler', u'yes'),
(u'uniform,1', u'negative'),
(u'urh\xf8ne', u'yes'),
(u'usselryg', u'negative'),
(u'vagthund', u'negative'),
(u'valgmand', u'yes'),
(u'vanskabning', u'negative'),
(u'varietet', u'yes'),
(u'varyler', u'negative'),
(u'vatpik', u'negative'),
(u'ven', u'yes'),
(u'violinkasse', u'negative'),
(u'virtuos,1', u'positive'),
(u'vissenpind', u'negative'),
(u'vraggods', u'negative'),
(u'v\xe6rdi', u'positive'),
(u'v\xe6rdigenstand', u'positive'),
(u'v\xe6rk,1', u'positive'),
(u'yndlingsoffer', u'negative'),
(u'yngling', u'yes'),
(u'ynk', u'negative'),
(u'\xe5rgangsvin', u'positive'),
(u'\xe5rsunge', u'yes'),
(u'\xe6dedolk', u'negative'),
(u'\xe6sel', u'negative'),
(u'\xf8jentjener', u'negative'),
(u'\xf8lhund', u'negative'),
(u'\xf8nske,2', u'positive')]
In [ ]:
Content source: fnielsen/dasem
Similar notebooks: