In [1]:
import urllib.request
from collections import defaultdict, Counter
wp_url = "https://en.wikipedia.org/wiki/Budapest"
text = urllib.request.urlopen(wp_url).read().decode('utf8')
words = text.split()
In [2]:
%%timeit
word_freq = {}
for word in words:
if word not in word_freq:
word_freq[word] = 1
else:
word_freq[word] += 1
In [3]:
%%timeit
word_freq = {}
for word in words:
try:
word_freq[word] += 1
except KeyError:
word_freq[word] = 1
In [4]:
%%timeit
word_freq = {}
for word in words:
word_freq.setdefault(word, 0)
word_freq[word] += 1
In [5]:
%%timeit
word_freq = defaultdict(int)
for word in words:
word_freq[word] += 1
In [6]:
%%timeit
word_freq = Counter(words)