In [1]:
# Sample text: five hiragana characters, all outside the ASCII range.
s = 'あいうえお'
In [2]:
# Encode with the 'unicode-escape' codec: every non-ASCII character is
# written as an ASCII \uXXXX escape sequence, and the result is bytes.
b = s.encode('unicode-escape')
In [3]:
# print() shows the bytes repr, in which each backslash appears doubled:
# b'\\u3042\\u3044\\u3046\\u3048\\u304a'
print(b)
In [4]:
# Prints <class 'bytes'>: str.encode() returns a bytes object.
print(type(b))
In [5]:
# Decoding the escaped bytes with the same 'unicode-escape' codec interprets
# the \uXXXX sequences and restores the original text.
s_from_b = b.decode('unicode-escape')
In [6]:
# Prints the restored text: あいうえお
print(s_from_b)
In [7]:
# Prints <class 'str'>: bytes.decode() returns a str.
print(type(s_from_b))
In [8]:
# Decoding the escaped bytes as UTF-8 does NOT raise (despite the variable
# name): the bytes are pure ASCII, so they decode cleanly, but the \uXXXX
# sequences are kept as literal text instead of being interpreted.
s_from_b_error = b.decode('utf-8')
In [9]:
# Prints the escapes as literal characters: \u3042\u3044\u3046\u3048\u304a
print(s_from_b_error)
In [10]:
# Prints <class 'str'>.
print(type(s_from_b_error))
In [11]:
# Turn a str holding literal \uXXXX text back into real characters:
# encode() (UTF-8 by default) produces bytes, then 'unicode-escape' decoding
# interprets the escapes.
# NOTE: the unicode-escape decoder treats non-escaped bytes as Latin-1, so
# this round trip is only safe when the str is pure ASCII, as it is here.
s_from_s = s_from_b_error.encode().decode('unicode-escape')
In [12]:
# Prints あいうえお
print(s_from_s)
In [13]:
# Prints <class 'str'>.
print(type(s_from_s))
In [14]:
import codecs
# codecs.decode() is handed the str directly here, so the escapes are
# interpreted without the explicit encode() step used in the previous approach.
s_from_s_codecs = codecs.decode(s_from_b_error, 'unicode-escape')
In [15]:
# Prints あいうえお
print(s_from_s_codecs)
In [16]:
# Prints <class 'str'>.
print(type(s_from_s_codecs))
In [17]:
# ascii() returns the repr() of its argument with non-ASCII characters
# escaped, so the resulting str includes the surrounding quote characters.
s_ascii = ascii('あ')
In [18]:
# Prints '\u3042' -- the single quotes are part of the string itself.
print(s_ascii)
In [19]:
# Prints <class 'str'>.
print(type(s_ascii))
In [20]:
# The first character is the opening single quote added by ascii().
print(s_ascii[0])
In [21]:
# The last character is the closing single quote added by ascii().
print(s_ascii[-1])
In [22]:
# Prints 8: two quote characters plus the six characters of \u3042.
print(len(s_ascii))
In [23]:
# Prints True. The right-hand literal spells out the same 8 characters:
# the doubled backslash is one literal backslash, wrapped in single quotes.
print(ascii('あ') == "'\\u3042'")
In [24]:
# Slice off the first and last characters (the quotes added by ascii()) to
# keep only the escape sequence text.
s_unicode_escape = ascii('あ')[1:-1]
In [25]:
# Prints \u3042 (no quotes).
print(s_unicode_escape)
In [26]:
# Prints <class 'str'>.
print(type(s_unicode_escape))
In [27]:
# Prints True: the sliced result is the six literal characters \u3042.
print(s_unicode_escape == '\\u3042')
In [28]:
# In an ordinary string literal, \u3042 is an escape for the single
# character あ, which is what gets printed.
print('\u3042')
In [29]:
# Prints 1: the escape denotes exactly one character.
print(len('\u3042'))
In [30]:
# Prints True: the escaped and the directly typed forms are the same string.
print('\u3042' == 'あ')
In [31]:
# A doubled backslash is one literal backslash, so no escape is interpreted
# and the six characters \u3042 are printed as-is.
print('\\u3042')
In [32]:
# A raw string literal disables escape processing, giving the same six
# literal characters: \u3042
print(r'\u3042')
In [33]:
# Prints 6: backslash, 'u', and four hex digits.
print(len(r'\u3042'))
In [34]:
# Read the file as ordinary text. Any \uXXXX sequences stored in it are NOT
# interpreted; they come back as literal characters.
# (Presumably the file holds ASCII \uXXXX escapes -- its contents are not
# visible here.)
# The encoding is given explicitly so the result does not depend on the
# platform's locale default.
with open('data/src/unicode_escape.txt', encoding='utf-8') as f:
    s = f.read()

# The file is already closed here; inspect what was read.
print(s)
print(type(s))
print(len(s))
In [35]:
# Read the same file again, this time with encoding='unicode-escape', so the
# text layer interprets \uXXXX sequences while decoding and `s` holds the
# real characters instead of the escape text.
with open('data/src/unicode_escape.txt', encoding='unicode-escape') as f:
    s = f.read()

# The file is already closed here; inspect what was read.
print(s)
print(type(s))
print(len(s))
In [36]:
# JSON payload as bytes, containing a JSON-level \u3042 escape.
# \u is not an escape sequence in bytes literals, so the backslash must be
# written as \\ to get a literal backslash without triggering Python's
# invalid-escape-sequence warning. The resulting bytes are the 15 ASCII
# characters {"a": "\u3042"}.
b_json = b'{"a": "\\u3042"}'
In [37]:
# Shows the bytes repr, where the backslash appears doubled:
# b'{"a": "\\u3042"}'
print(b_json)
In [38]:
# decode() defaults to UTF-8, which leaves the escape as literal text:
# {"a": "\u3042"}
print(b_json.decode())
In [39]:
# Decoding with 'unicode-escape' interprets the escape: {"a": "あ"}
print(b_json.decode('unicode-escape'))
In [40]:
import json
In [41]:
# json.loads() interprets JSON \uXXXX escapes itself, so plain UTF-8
# decoding is enough beforehand. Prints {'a': 'あ'}
print(json.loads(b_json.decode()))
In [42]:
# Prints <class 'dict'>: the JSON object is parsed into a dict.
print(type(json.loads(b_json.decode())))
In [43]:
# json.loads() also accepts bytes directly (Python 3.6+), so the explicit
# decode() can be skipped. Prints {'a': 'あ'}
print(json.loads(b_json))