2014-07-16 11:45:10 +01:00
|
|
|
# test reading a given number of characters
|
|
|
|
|
|
|
|
def do(mode):
    """Read fixed-size chunks from the UTF-8 test data file and print each one.

    The file 'unicode/data/utf-8_2.txt' is opened relative to the current
    working directory. Four reads of sizes 1, 1, 2 and 4 are printed, the
    rest of the first line is discarded, and then two more reads are printed
    that are meant to cover one 3-byte and one 4-byte UTF-8 character
    (presumably the first two characters of the second line -- this depends
    on the data file, which is not visible here).

    Args:
        mode: File mode passed to ``open``. ``'rb'`` opens the file without
            an encoding, so read sizes are byte counts; any other value opens
            it with UTF-8 decoding. Only ``'rt'`` switches the last two reads
            to a size of one character.
    """
    # Binary mode must not be given an encoding; every other mode decodes UTF-8.
    enc = None if mode == 'rb' else 'utf-8'

    # The context manager closes the file even if a read or print raises.
    with open('unicode/data/utf-8_2.txt', mode=mode, encoding=enc) as f:
        print(f.read(1))
        print(f.read(1))
        print(f.read(2))
        print(f.read(4))

        # skip to end of line
        f.readline()

        # check 3-byte utf-8 char: one character in text mode, three bytes otherwise
        print(f.read(1 if mode == 'rt' else 3))

        # check 4-byte utf-8 char: one character in text mode, four bytes otherwise
        print(f.read(1 if mode == 'rt' else 4))
|
|
|
|
|
|
|
|
# Run the read test in binary mode first, then in text mode.
for _mode in ('rb', 'rt'):
    do(_mode)
|