| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641 |
- # Test cases for strings (compile and run)
- [case testStrBasics]
- from typing import Tuple
- def f() -> str:
- return 'some string'
- def g() -> str:
- return 'some\a \v \t \x7f " \n \0string 🐍'
- def tostr(x: int) -> str:
- return str(x)
- def booltostr(x: bool) -> str:
- return str(x)
- def concat(x: str, y: str) -> str:
- return x + y
- def eq(x: str) -> int:
- if x == 'foo':
- return 0
- elif x != 'bar':
- return 1
- return 2
- def match(x: str, y: str) -> Tuple[bool, bool]:
- return (x.startswith(y), x.endswith(y))
- [file driver.py]
- from native import f, g, tostr, booltostr, concat, eq, match
- import sys
- assert f() == 'some string'
- assert f() is sys.intern('some string')
- assert g() == 'some\a \v \t \x7f " \n \0string 🐍'
- assert tostr(57) == '57'
- assert concat('foo', 'bar') == 'foobar'
- assert booltostr(True) == 'True'
- assert booltostr(False) == 'False'
- assert eq('foo') == 0
- assert eq('zar') == 1
- assert eq('bar') == 2
- assert int(tostr(0)) == 0
- assert int(tostr(20)) == 20
- assert match('', '') == (True, True)
- assert match('abc', '') == (True, True)
- assert match('abc', 'a') == (True, False)
- assert match('abc', 'c') == (False, True)
- assert match('', 'abc') == (False, False)
- [case testStringOps]
- from typing import List, Optional
- def do_split(s: str, sep: Optional[str] = None, max_split: Optional[int] = None) -> List[str]:
- if sep is not None:
- if max_split is not None:
- return s.split(sep, max_split)
- else:
- return s.split(sep)
- return s.split()
- ss = "abc abcd abcde abcdef"
- def test_split() -> None:
- assert do_split(ss) == ["abc", "abcd", "abcde", "abcdef"]
- assert do_split(ss, " ") == ["abc", "abcd", "abcde", "abcdef"]
- assert do_split(ss, "-") == ["abc abcd abcde abcdef"]
- assert do_split(ss, " ", -1) == ["abc", "abcd", "abcde", "abcdef"]
- assert do_split(ss, " ", 0) == ["abc abcd abcde abcdef"]
- assert do_split(ss, " ", 1) == ["abc", "abcd abcde abcdef"]
- assert do_split(ss, " ", 2) == ["abc", "abcd", "abcde abcdef"]
- def getitem(s: str, index: int) -> str:
- return s[index]
- from testutil import assertRaises
- s = "abc"
- def test_getitem() -> None:
- assert getitem(s, 0) == "a"
- assert getitem(s, 1) == "b"
- assert getitem(s, 2) == "c"
- assert getitem(s, -3) == "a"
- assert getitem(s, -2) == "b"
- assert getitem(s, -1) == "c"
- with assertRaises(IndexError, "string index out of range"):
- getitem(s, 4)
- with assertRaises(IndexError, "string index out of range"):
- getitem(s, -4)
- def str_to_int(s: str, base: Optional[int] = None) -> int:
- if base:
- return int(s, base)
- else:
- return int(s)
- def test_str_to_int() -> None:
- assert str_to_int("1") == 1
- assert str_to_int("10") == 10
- assert str_to_int("a", 16) == 10
- assert str_to_int("1a", 16) == 26
- with assertRaises(ValueError, "invalid literal for int() with base 10: 'xyz'"):
- str_to_int("xyz")
- def test_slicing() -> None:
- # Use dummy adds to avoid constant folding
- zero = int()
- two = zero + 2
- s = "foobar" + str()
- assert s[two:] == "obar"
- assert s[:two] == "fo"
- assert s[two:-two] == "ob"
- assert s[two:two] == ""
- assert s[two:two + 1] == "o"
- assert s[-two:] == "ar"
- assert s[:-two] == "foob"
- assert s[:] == "foobar"
- assert s[two:333] == "obar"
- assert s[333:two] == ""
- assert s[two:-333] == ""
- assert s[-333:two] == "fo"
- big_int: int = 1000 * 1000 * 1000 * 1000 * 1000 * 1000 * 1000
- assert s[1:big_int] == "oobar"
- assert s[big_int:] == ""
- assert s[-big_int:-1] == "fooba"
- def test_str_replace() -> None:
- a = "foofoofoo"
- assert a.replace("foo", "bar") == "barbarbar"
- assert a.replace("foo", "bar", -1) == "barbarbar"
- assert a.replace("foo", "bar", 1) == "barfoofoo"
- assert a.replace("foo", "bar", 4) == "barbarbar"
- assert a.replace("aaa", "bar") == "foofoofoo"
- assert a.replace("ofo", "xyzw") == "foxyzwxyzwo"
- def is_true(x: str) -> bool:
- if x:
- return True
- else:
- return False
- def is_true2(x: str) -> bool:
- return bool(x)
- def is_false(x: str) -> bool:
- if not x:
- return True
- else:
- return False
- def test_str_to_bool() -> None:
- assert is_false('')
- assert not is_true('')
- assert not is_true2('')
- for x in 'a', 'foo', 'bar', 'some string':
- assert is_true(x)
- assert is_true2(x)
- assert not is_false(x)
- def test_str_min_max() -> None:
- x: str = 'aaa'
- y: str = 'bbb'
- z: str = 'aa'
- assert min(x, y) == 'aaa'
- assert min(x, z) == 'aa'
- assert max(x, y) == 'bbb'
- assert max(x, z) == 'aaa'
- [case testStringFormattingCStyle]
- [typing fixtures/typing-full.pyi]
- from typing import Tuple
- var = 'mypyc'
- num = 20
- def test_basics() -> None:
- assert 'Hello %s, this is a test' % var == "Hello mypyc, this is a test"
- assert 'Hello %s %d, this is a test' % (var, num) == "Hello mypyc 20, this is a test"
- t: Tuple[str, int] = (var, num)
- assert 'Hello %s %d, this is a test' % t == "Hello mypyc 20, this is a test"
- large_num = 2**65
- assert 'number: %d' % large_num == 'number: 36893488147419103232'
- neg_num = -3
- assert 'negative integer: %d' % neg_num == 'negative integer: -3'
- assert 'negative integer: %d' % (-large_num) == 'negative integer: -36893488147419103232'
- bool_var1 = True
- bool_var2 = False
- assert 'bool: %s, %s' % (bool_var1, bool_var2) == 'bool: True, False'
- float_num = 123.4
- assert '%f' % float_num == '123.400000'
- assert '%.2f' % float_num == '123.40'
- assert '%.5f' % float_num == '123.40000'
- assert '%10.2f' % float_num == ' 123.40'
- assert '%10.5f' % float_num == ' 123.40000'
- assert '%010.5f' % float_num == '0123.40000'
- assert '%015.5f' % float_num == '000000123.40000'
- assert '%e' % float_num == '1.234000e+02'
- large_float = 1.23e30
- large_float2 = 1234123412341234123400000000000000000
- small_float = 1.23e-20
- assert '%f, %f, %f' % (small_float, large_float, large_float2) == \
- '0.000000, 1229999999999999959718843908096.000000, 1234123412341234169005079998930878464.000000'
- assert '%s, %s, %s' % (small_float, large_float, large_float2) == \
- '1.23e-20, 1.23e+30, 1234123412341234123400000000000000000'
- assert '%d, %d, %d' % (small_float, large_float, large_float2) == \
- '0, 1229999999999999959718843908096, 1234123412341234123400000000000000000'
- nan_num = float('nan')
- inf_num = float('inf')
- assert '%s, %s' % (nan_num, inf_num) == 'nan, inf'
- assert '%f, %f' % (nan_num, inf_num) == 'nan, inf'
- [case testFStrings]
- import decimal
- from datetime import datetime
- var = 'mypyc'
- num = 20
- def test_fstring_basics() -> None:
- assert f'Hello {var}, this is a test' == "Hello mypyc, this is a test"
- large_num = 2**65
- assert f'number: {large_num}' == 'number: 36893488147419103232'
- neg_num = -3
- assert f'negative integer: {neg_num}' == 'negative integer: -3'
- assert f'negative integer: {-large_num}' == 'negative integer: -36893488147419103232'
- bool_var1 = True
- bool_var2 = False
- assert f'bool: {bool_var1}, {bool_var2}' == 'bool: True, False'
- x = bytes([1, 2, 3, 4])
- # assert f'bytes: {x}' == "bytes: b'\\x01\\x02\\x03\\x04'"
- # error: If x = b'abc' then f"{x}" or "{}".format(x) produces "b'abc'", not "abc". If this is desired behavior, use f"{x!r}" or "{!r}".format(x). Otherwise, decode the bytes
- float_num = 123.4
- assert f'{float_num}' == '123.4'
- assert f'{float_num:.2f}' == '123.40'
- assert f'{float_num:.5f}' == '123.40000'
- assert f'{float_num:>10.2f}' == ' 123.40'
- assert f'{float_num:>10.5f}' == ' 123.40000'
- assert f'{float_num:>010.5f}' == '0123.40000'
- assert f'{float_num:>015.5f}' == '000000123.40000'
- assert f'{float_num:e}' == '1.234000e+02'
- large_float = 1.23e30
- large_float2 = 1234123412341234123400000000000000000
- small_float = 1.23e-20
- assert f'{small_float}, {large_float}, {large_float2}' == '1.23e-20, 1.23e+30, 1234123412341234123400000000000000000'
- nan_num = float('nan')
- inf_num = float('inf')
- assert f'{nan_num}, {inf_num}' == 'nan, inf'
- # F-strings would be translated into ''.join[string literals, format method call, ...] in mypy AST.
- # Currently we are using a str.join specializer for f-string speed up. We might not cover all cases
- # and the rest ones should fall back to a normal str.join method call.
- # TODO: Once we have a new pipeline for f-strings, this test case can be moved to testStringOps.
- def test_str_join() -> None:
- var = 'mypyc'
- num = 10
- assert ''.join(['a', 'b', '{}'.format(var), 'c']) == 'abmypycc'
- assert ''.join(['a', 'b', '{:{}}'.format(var, ''), 'c']) == 'abmypycc'
- assert ''.join(['a', 'b', '{:{}}'.format(var, '>10'), 'c']) == 'ab mypycc'
- assert ''.join(['a', 'b', '{:{}}'.format(var, '>{}'.format(num)), 'c']) == 'ab mypycc'
- assert var.join(['a', '{:{}}'.format(var, ''), 'b']) == 'amypycmypycmypycb'
- assert ','.join(['a', '{:{}}'.format(var, ''), 'b']) == 'a,mypyc,b'
- assert ''.join(['x', var]) == 'xmypyc'
- class A:
- def __init__(self, name, age):
- self.name = name
- self.age = age
- def __repr__(self):
- return f'{self.name} is {self.age} years old.'
- def test_fstring_datatype() -> None:
- u = A('John Doe', 14)
- assert f'{u}' == 'John Doe is 14 years old.'
- d = {'name': 'John Doe', 'age': 14}
- assert f'{d}' == "{'name': 'John Doe', 'age': 14}"
- def test_fstring_escape() -> None:
- assert f"{'inside'}" == 'inside'
- assert f'{"inside"}' == 'inside'
- assert f"""inside""" == 'inside'
- assert f'''inside''' == 'inside'
- assert f"\"{'inside'}\"" == '"inside"'
- assert f'\'{"inside"}\'' == "'inside'"
- assert f'{{10}}' == '{10}'
- assert f'{{10 + 10}}' == '{10 + 10}'
- assert f'{{{10 + 10}}}' == '{20}'
- assert f'{{{{10 + 10}}}}' == '{{10 + 10}}'
- def test_fstring_conversion() -> None:
- assert f'Hello {var!r}' == "Hello 'mypyc'"
- # repr() is equivalent to !r
- assert f'Hello {repr(var)}' == "Hello 'mypyc'"
- assert f'Hello {var!a}' == "Hello 'mypyc'"
- # ascii() is equivalent to !a
- assert f'Hello {ascii(var)}' == "Hello 'mypyc'"
- tmp_str = """this
- is a new line."""
- assert f'Test: {tmp_str!a}' == "Test: 'this\\n is a new line.'"
- s = 'test: āĀēĒčČ..šŠūŪžŽ'
- assert f'{s}' == 'test: āĀēĒčČ..šŠūŪžŽ'
- assert f'{s!a}' == "'test: \\u0101\\u0100\\u0113\\u0112\\u010d\\u010c..\\u0161\\u0160\\u016b\\u016a\\u017e\\u017d'"
- assert f'Hello {var!s}' == 'Hello mypyc'
- assert f'Hello {num!s}' == 'Hello 20'
- def test_fstring_align() -> None:
- assert f'Hello {var:>20}' == "Hello mypyc"
- assert f'Hello {var!r:>20}' == "Hello 'mypyc'"
- assert f'Hello {var:>{num}}' == "Hello mypyc"
- assert f'Hello {var!r:>{num}}' == "Hello 'mypyc'"
- def test_fstring_multi() -> None:
- assert f'Hello {var}, hello again {var}' == "Hello mypyc, hello again mypyc"
- a = 'py'
- s = f'my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}my{a}'
- assert s == 'mypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypymypy'
- def test_fstring_python_doc() -> None:
- name = 'Fred'
- assert f"He said his name is {name!r}." == "He said his name is 'Fred'."
- assert f"He said his name is {repr(name)}." == "He said his name is 'Fred'."
- width = 10
- precision = 4
- value = decimal.Decimal('12.34567')
- assert f'result: {value:{width}.{precision}}' == 'result: 12.35' # nested field
- today = datetime(year=2017, month=1, day=27)
- assert f'{today:%B %d, %Y}' == 'January 27, 2017' # using date format specifier
- number = 1024
- assert f'{number:#0x}' == '0x400' # using integer format specifier
- [case testStringFormatMethod]
- from typing import Tuple
- def test_format_method_basics() -> None:
- x = str()
- assert 'x{}'.format(x) == 'x'
- assert 'ā{}'.format(x) == 'ā'
- assert '😀{}'.format(x) == '😀'
- assert ''.format() == ''
- assert 'abc'.format() == 'abc'
- assert '{}{}'.format(1, 2) == '12'
- name = 'Eric'
- age = 14
- assert "My name is {name}, I'm {age}.".format(name=name, age=age) == "My name is Eric, I'm 14."
- assert "My name is {A}, I'm {B}.".format(A=name, B=age) == "My name is Eric, I'm 14."
- assert "My name is {}, I'm {B}.".format(name, B=age) == "My name is Eric, I'm 14."
- bool_var1 = True
- bool_var2 = False
- assert 'bool: {}, {}'.format(bool_var1, bool_var2) == 'bool: True, False'
- def test_format_method_empty_braces() -> None:
- name = 'Eric'
- age = 14
- assert 'Hello, {}!'.format(name) == 'Hello, Eric!'
- assert '{}'.format(name) == 'Eric'
- assert '{}! Hi!'.format(name) == 'Eric! Hi!'
- assert '{}, Hi, {}'.format(name, name) == 'Eric, Hi, Eric'
- assert 'Hi! {}'.format(name) == 'Hi! Eric'
- assert "Hi, I'm {}. I'm {}.".format(name, age) == "Hi, I'm Eric. I'm 14."
- assert '{{}}'.format() == '{}'
- assert '{{{{}}}}'.format() == '{{}}'
- assert '{{}}{}'.format(name) == '{}Eric'
- assert 'Hi! {{{}}}'.format(name) == 'Hi! {Eric}'
- assert 'Hi! {{ {}'.format(name) == 'Hi! { Eric'
- assert 'Hi! {{ {} }}}}'.format(name) == 'Hi! { Eric }}'
- def test_format_method_numbers() -> None:
- s = 'int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}'.format(-233)
- assert s == 'int: -233; hex: -e9; oct: -351; bin: -11101001'
- num = 2**65
- s = 'int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}'.format(num)
- assert s == 'int: 36893488147419103232; hex: 20000000000000000; oct: 4000000000000000000000; bin: 100000000000000000000000000000000000000000000000000000000000000000'
- s = 'int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}'.format(-num)
- assert s == 'int: -36893488147419103232; hex: -20000000000000000; oct: -4000000000000000000000; bin: -100000000000000000000000000000000000000000000000000000000000000000'
- large_num = 2**65
- assert 'number: {}'.format(large_num) == 'number: 36893488147419103232'
- neg_num = -3
- assert 'negative integer: {}'.format(neg_num) == 'negative integer: -3'
- assert 'negative integer: {}'.format(-large_num) == 'negative integer: -36893488147419103232'
- large_float = 1.23e30
- large_float2 = 1234123412341234123400000000000000000
- small_float = 1.23e-20
- assert '{}, {}, {}'.format(small_float, large_float, large_float2) == '1.23e-20, 1.23e+30, 1234123412341234123400000000000000000'
- nan_num = float('nan')
- inf_num = float('inf')
- assert '{}, {}'.format(nan_num, inf_num) == 'nan, inf'
- def format_args(*args: int) -> str:
- return 'x{}y{}'.format(*args)
- def format_kwargs(**kwargs: int) -> str:
- return 'c{x}d{y}'.format(**kwargs)
- def format_args_self(*args: int) -> str:
- return '{}'.format(args)
- def format_kwargs_self(**kwargs: int) -> str:
- return '{}'.format(kwargs)
- def test_format_method_args() -> None:
- assert format_args(10, 2) == 'x10y2'
- assert format_args_self(10, 2) == '(10, 2)'
- assert format_kwargs(x=10, y=2) == 'c10d2'
- assert format_kwargs(x=10, y=2, z=1) == 'c10d2'
- assert format_kwargs_self(x=10, y=2, z=1) == "{'x': 10, 'y': 2, 'z': 1}"
- def test_format_method_different_kind() -> None:
- s1 = "Literal['😀']"
- assert 'Revealed type is {}'.format(s1) == "Revealed type is Literal['😀']"
- s2 = "Revealed type is"
- assert "{} Literal['😀']".format(s2) == "Revealed type is Literal['😀']"
- s3 = "测试:"
- assert "{}{} {}".format(s3, s2, s1) == "测试:Revealed type is Literal['😀']"
- assert "Test: {}{}".format(s3, s1) == "Test: 测试:Literal['😀']"
- assert "Test: {}{}".format(s3, s2) == "Test: 测试:Revealed type is"
- def test_format_method_nested() -> None:
- var = 'mypyc'
- num = 10
- assert '{:{}}'.format(var, '') == 'mypyc'
- assert '{:{}}'.format(var, '>10') == ' mypyc'
- assert '{:{}}'.format(var, '>{}'.format(num)) == ' mypyc'
- class Point:
- def __init__(self, x, y):
- self.x, self.y = x, y
- def __str__(self):
- return 'Point({self.x}, {self.y})'.format(self=self)
- # Format examples from Python doc
- # https://docs.python.org/3/library/string.html#formatexamples
- def test_format_method_python_doc() -> None:
- # Accessing arguments by position:
- assert '{0}, {1}, {2}'.format('a', 'b', 'c') == 'a, b, c'
- assert '{}, {}, {}'.format('a', 'b', 'c') == 'a, b, c'
- assert '{2}, {1}, {0}'.format('a', 'b', 'c') == 'c, b, a'
- assert '{2}, {1}, {0}'.format(*'abc') == 'c, b, a' # unpacking argument sequence
- # assert '{0}{1}{0}'.format('abra', 'cad') = 'abracadabra' # arguments' indices can be repeated
- # Accessing arguments by name:
- s = 'Coordinates: {latitude}, {longitude}'.format(latitude='37.24N', longitude='-115.81W')
- assert s == 'Coordinates: 37.24N, -115.81W'
- coord = {'latitude': '37.24N', 'longitude': '-115.81W'}
- assert 'Coordinates: {latitude}, {longitude}'.format(**coord) == 'Coordinates: 37.24N, -115.81W'
- # Accessing arguments’ attributes:
- assert str(Point(4, 2)) == 'Point(4, 2)'
- # Accessing arguments’ items:
- coord2 = (3, 5)
- assert 'X: {0[0]}; Y: {0[1]}'.format(coord2) == 'X: 3; Y: 5'
- # Replacing %s and %r:
- s = "repr() shows quotes: {!r}; str() doesn't: {!s}".format('test1', 'test2')
- assert s == "repr() shows quotes: 'test1'; str() doesn't: test2"
- # Aligning the text and specifying a width:
- assert '{:<30}'.format('left aligned') == 'left aligned '
- assert '{:>30}'.format('right aligned') == ' right aligned'
- assert '{:^30}'.format('centered') == ' centered '
- assert '{:*^30}'.format('centered') == '***********centered***********' # use '*' as a fill char
- # Replacing %+f, %-f, and % f and specifying a sign:
- assert '{:+f}; {:+f}'.format(3.14, -3.14) == '+3.140000; -3.140000' # show it always
- assert '{: f}; {: f}'.format(3.14, -3.14) == ' 3.140000; -3.140000' # show a space for positive numbers
- assert '{:-f}; {:-f}'.format(3.14, -3.14) == '3.140000; -3.140000' # show only the minus -- same as '{:f}; {:f}'
- # Replacing %x and %o and converting the value to different bases:
- s = 'int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}'.format(42) # format also supports binary numbers
- assert s == 'int: 42; hex: 2a; oct: 52; bin: 101010'
- s = 'int: {0:d}; hex: {0:#x}; oct: {0:#o}; bin: {0:#b}'.format(42) # with 0x, 0o, or 0b as prefix:
- assert s == 'int: 42; hex: 0x2a; oct: 0o52; bin: 0b101010'
- # Using the comma as a thousands separator:
- assert '{:,}'.format(1234567890) == '1,234,567,890'
- # Expressing a percentage:
- points = 19.0
- total = 22.0
- assert 'Correct answers: {:.2%}'.format(points/total) == 'Correct answers: 86.36%'
- # Using type-specific formatting:
- import datetime
- d = datetime.datetime(2010, 7, 4, 12, 15, 58)
- assert '{:%Y-%m-%d %H:%M:%S}'.format(d) == '2010-07-04 12:15:58'
- # Nesting arguments and more complex examples:
- tmp_strs = []
- for align, text in zip('<^>', ['left', 'center', 'right']):
- tmp_strs.append('{0:{fill}{align}16}'.format(text, fill=align, align=align))
- assert tmp_strs == ['left<<<<<<<<<<<<', '^^^^^center^^^^^', '>>>>>>>>>>>right']
- octets = [192, 168, 0, 1]
- assert '{:02X}{:02X}{:02X}{:02X}'.format(*octets) == 'C0A80001'
- width = 5
- tmp_strs = []
- for num in range(5,12):
- tmp_str = ''
- for base in 'dXob':
- tmp_str += ('{0:{width}{base}}'.format(num, base=base, width=width))
- tmp_strs.append(tmp_str)
- assert tmp_strs == [' 5 5 5 101',\
- ' 6 6 6 110',\
- ' 7 7 7 111',\
- ' 8 8 10 1000',\
- ' 9 9 11 1001',\
- ' 10 A 12 1010',\
- ' 11 B 13 1011']
- [case testChr]
- # Some test cases are from https://docs.python.org/3/howto/unicode.html
- def try_invalid(x: int) -> bool:
- try:
- chr(x + int())
- return False
- except ValueError:
- return True
- def test_chr() -> None:
- assert chr(57344) == '\ue000'
- assert chr(0) == '\x00'
- assert chr(65) == 'A'
- assert chr(150) == '\x96'
- try:
- chr(-1)
- assert False
- except ValueError:
- pass
- try:
- chr(1114112)
- assert False
- except ValueError:
- pass
- assert chr(1114111) == '\U0010ffff'
- x = 0
- assert chr(x + int()) == '\x00'
- x = 100
- assert chr(x + int()) == 'd'
- x = 150
- assert chr(x + int()) == '\x96'
- x = 257
- assert chr(x + int()) == 'ā'
- x = 65537
- assert chr(x + int()) == '𐀁'
- assert try_invalid(-1)
- assert try_invalid(1114112)
- [case testOrd]
- def test_ord() -> None:
- assert ord('\ue000') == 57344
- s = "a\xac\u1234\u20ac\U00008000"
- # ^^^^ two-digit hex escape
- # ^^^^^^ four-digit Unicode escape
- # ^^^^^^^^^^ eight-digit Unicode escape
- l1 = [ord(c) for c in s]
- assert l1 == [97, 172, 4660, 8364, 32768]
- u = 'abcdé'
- assert ord(u[-1]) == 233
- assert ord(b'a') == 97
- assert ord(b'a' + bytes()) == 97
- u2 = '\U0010ffff'
- assert ord(u2) == 1114111
- try:
- ord('aa')
- assert False
- except TypeError:
- pass
- [case testDecode]
- def test_decode() -> None:
- assert "\N{GREEK CAPITAL LETTER DELTA}" == '\u0394'
- assert "\u0394" == "\u0394"
- assert "\U00000394" == '\u0394'
- assert b'\x80abc'.decode('utf-8', 'replace') == '\ufffdabc'
- assert b'\x80abc'.decode('utf-8', 'backslashreplace') == '\\x80abc'
- assert b'abc'.decode() == 'abc'
- assert b'abc'.decode('utf-8') == 'abc'
- assert b'\x80abc'.decode('utf-8', 'ignore') == 'abc'
- assert b'\x80abc'.decode('UTF-8', 'ignore') == 'abc'
- assert b'\x80abc'.decode('Utf-8', 'ignore') == 'abc'
- assert b'\x80abc'.decode('utf_8', 'ignore') == 'abc'
- assert b'\x80abc'.decode('latin1', 'ignore') == '\x80abc'
- assert b'\xd2\xbb\xb6\xfe\xc8\xfd'.decode('gbk', 'ignore') == '一二三'
- assert b'\xd2\xbb\xb6\xfe\xc8\xfd'.decode('latin1', 'ignore') == 'Ò»¶þÈý'
- assert b'Z\xc3\xbcrich'.decode("utf-8") == 'Zürich'
- try:
- b'Z\xc3\xbcrich'.decode('ascii')
- assert False
- except UnicodeDecodeError:
- pass
- assert bytearray(range(5)).decode() == '\x00\x01\x02\x03\x04'
- b = bytearray(b'\xe4\xbd\xa0\xe5\xa5\xbd')
- assert b.decode() == '你好'
- assert b.decode('gbk') == '浣犲ソ'
- assert b.decode('latin1') == 'ä½\xa0好'
- [case testEncode]
- from testutil import assertRaises
- def test_encode() -> None:
- u = chr(40960) + 'abcd' + chr(1972)
- assert u.encode() == b'\xea\x80\x80abcd\xde\xb4'
- assert u.encode('utf-8') == b'\xea\x80\x80abcd\xde\xb4'
- with assertRaises(UnicodeEncodeError):
- u.encode('ascii')
- with assertRaises(LookupError):
- u.encode('aaa')
- assert u.encode('utf-8', 'aaaaaa') == b'\xea\x80\x80abcd\xde\xb4'
- assert u.encode('ascii', 'ignore') == b'abcd'
- assert u.encode('ASCII', 'ignore') == b'abcd'
- assert u.encode('ascii', 'replace') == b'?abcd?'
- assert u.encode('ascii', 'xmlcharrefreplace') == b'ꀀabcd޴'
- assert u.encode('ascii', 'backslashreplace') == b'\\ua000abcd\\u07b4'
- assert u.encode('ascii', 'namereplace') == b'\\N{YI SYLLABLE IT}abcd\\u07b4'
- assert 'pythön!'.encode() == b'pyth\xc3\xb6n!'
- assert '一二三'.encode('gbk') == b'\xd2\xbb\xb6\xfe\xc8\xfd'
- assert u.encode('UTF-8', 'ignore') == b'\xea\x80\x80abcd\xde\xb4'
- assert u.encode('Utf_8') == b'\xea\x80\x80abcd\xde\xb4'
- assert u.encode('UTF_8') == b'\xea\x80\x80abcd\xde\xb4'
- assert u'\u00E1'.encode('latin1') == b'\xe1'
- with assertRaises(UnicodeEncodeError):
- u.encode('latin1')
|