In [1]:
#-*- coding:utf-8
In [2]:
# Print the sample word with its characters in reverse order.
strings = "stressed"
print("".join(reversed(strings)))
In [3]:
# Print every other character of the string, starting with the first one
# (i.e. the 1st, 3rd, 5th and 7th characters).
strings1 = u"パタトクカシーー"
every_other = slice(0, None, 2)
print(strings1[every_other])
In [4]:
# Interleave the two words character by character: first character of
# strings_p, first character of strings_t, second character of each, etc.
strings_p = u"パトカー"
strings_t = u"タクシー"
# zip() pairs the characters positionally (stopping at the shorter word) and
# join() builds the result in one pass instead of growing a string in a loop.
strings_sum = ''.join(p + t for p, t in zip(strings_p, strings_t))
print(strings_sum)
In [5]:
# Number of letters in each word of the sentence, in order of appearance.
strings3 = "Now I need a drink, alcoholic of course, after the heavy lectures involving quantum mechanics."
# Strip the comma/period attached to a word before measuring it; otherwise
# "drink," would count as 6 and "mechanics." as 10 instead of 5 and 9.
count_list = [len(word.strip(',.')) for word in strings3.split(' ')]
count_list
Out[5]:
In [6]:
# Map a short prefix of every word in the sentence to the word itself.
strings4 = "Hi He Lied Because Boron Could Not Oxidize Fluorine. New Nations Might Also Sign Peace Security Clause. Arthur King Can."
# Drop the periods, then split into the list of words.
strings4 = strings4.replace('.', '').split(' ')
# 1-based positions of the words that contribute only their first character;
# every other word contributes its first two characters.
single_char_positions = {1, 5, 6, 7, 8, 9, 15, 16, 19}
dictionary = {}
for position, word in enumerate(strings4, start=1):
    prefix_length = 1 if position in single_char_positions else 2
    dictionary[word[:prefix_length]] = word
print(dictionary)
In [7]:
def ngram(sequence, n, mode='c'):
    """Return all n-grams of ``sequence`` as a list, in order of appearance.

    Parameters:
        sequence: the text to cut into n-grams.
        n: size of each n-gram; must be at least 1.
        mode: 'c' (default) for character n-grams, each returned as a
            substring of ``sequence``; 'w' for word n-grams, each returned
            as a tuple of words. Words are obtained by splitting on single
            spaces and stripping leading/trailing ',' and '.' from each token.

    Returns:
        A list with one entry per window of exactly ``n`` consecutive items;
        empty when ``sequence`` holds fewer than ``n`` items.

    Raises:
        ValueError: if ``n`` is smaller than 1 or ``mode`` is not 'c' or 'w'.
    """
    if n < 1:
        raise ValueError("n must be at least 1, got %r" % (n,))
    if mode == 'c':
        # A sequence of length L has L - n + 1 full windows of size n.
        return [sequence[i:i+n] for i in range(len(sequence) - n + 1)]
    elif mode == 'w':
        # Build the word list with spaces and punctuation removed.
        words = [s.strip(',.') for s in sequence.split(' ')]
        return [tuple(words[i:i+n]) for i in range(len(words) - n + 1)]
    raise ValueError("mode must be 'c' or 'w', got %r" % (mode,))
# Show the bi-grams of the sample sentence in both modes:
# character bi-grams first, then word bi-grams.
sequence = "I am an NLPer"
for gram_mode in ('c', 'w'):
    print(ngram(sequence, 2, gram_mode))
In [8]:
# Character bi-gram sets of the two words.
X = set(ngram('paraparaparadise', 2))
# Y has to be a set as well: wrapping the call in bare parentheses leaves it
# a plain list (with duplicates), which is inconsistent with X.
Y = set(ngram('paragraph', 2))
print(X.intersection(Y))  # bi-grams present in both words
print(X.union(Y))         # bi-grams present in either word
print(X.difference(Y))    # bi-grams present only in X
# Membership checks for the bi-gram 'se' in each set.
print('se' in X)
print('se' in Y)
In [9]:
#-*- coding:utf-8 -*-
def print_template(x, y, z):
    """Return the template text with x, y and z filled in, in that order.

    Despite the name, nothing is printed here: the three values are
    substituted into the three ``%s`` slots of the template and the
    resulting string is handed back to the caller.
    """
    pattern = u'%s時の%sは%s'
    values = (x, y, z)
    return pattern % values
# Fill the template with sample values and show the resulting sentence.
template = print_template(x=12, y=u'気温', z=22.4)
print(template)
In [10]:
def cipher(sequence):
    """Return ``sequence`` with every ASCII lowercase letter mirrored.

    Each character in 'a'..'z' is replaced by ``chr(219 - ord(ch))``; since
    219 == ord('a') + ord('z'), this maps 'a' <-> 'z', 'b' <-> 'y', and so
    on. Every other character is copied unchanged, so applying the function
    twice gives back the original text.

    Only 'a'..'z' is substituted. Testing with ``str.islower()`` would also
    match non-ASCII lowercase letters, for which 219 - ord(ch) is either
    negative (``chr`` raises ValueError) or an unrelated character.
    """
    return "".join(
        chr(219 - ord(ch)) if 'a' <= ch <= 'z' else ch
        for ch in sequence
    )
# Encrypt the sample sentence, run the result through cipher() a second
# time, and print both texts (encrypted first, then decrypted).
strings = "I am an NLPer"
encryption = cipher(strings)
decryption = cipher(encryption)
for text in (encryption, decryption):
    print(text)
In [11]:
import random
def typoglycemia(text):
    """Shuffle the interior characters of every long token in ``text``.

    ``text`` is split on single spaces. A token of five or more characters
    keeps its first and last character while the characters in between are
    put in random order; shorter tokens are returned unchanged. Punctuation
    attached to a token counts as part of that token.

    Returns the list of resulting tokens in their original order. The
    shuffle uses the module-level ``random`` generator, so call
    ``random.seed(...)`` beforehand when a reproducible result is needed.
    """
    shuffled = []
    for token in text.split(' '):
        if len(token) >= 5:
            # Sampling all interior characters yields a random permutation.
            middle = random.sample(token[1:-1], len(token) - 2)
            token = token[0] + "".join(middle) + token[-1]
        shuffled.append(token)
    return shuffled


sequence = "I couldn't believe that I could actually understand what I was reading : the phenomenal power of the human mind."
typoglycemia(sequence)
Out[11]:
In [ ]: