summaryrefslogtreecommitdiff
path: root/Examples/test-suite/python/unicode_strings_runme.py
blob: 57bd7abcaa8ee76acef4536a521c792a8dc0301a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import sys

import unicode_strings

if sys.version_info[0:2] >= (3, 1):
    test_string = "h\udce9llo w\u00f6rld"
    if unicode_strings.non_utf8_c_str() != test_string:
        raise ValueError("Test comparison mismatch")
    if unicode_strings.non_utf8_std_string() != test_string:
        raise ValueError("Test comparison mismatch")

def check(s1, s2):
    if s1 != s2:
        raise RuntimeError("{} != {}".format(s1, s2))

# Testing SWIG_PYTHON_2_UNICODE flag which allows unicode strings to be passed to C
if sys.version_info[0:2] < (3, 0):
    # Python 3.0-3.2 results in a SyntaxError when using u"" string literals, so we use a
    # convoluted unicode string construction using unicode() and unichr().
    # Conventional Python 2 syntax shown in comments.
    check(unicode_strings.charstring("hello1"), "hello1")
    check(unicode_strings.charstring(str(unicode("hello2"))), "hello2") # u"hello2"
    check(unicode_strings.charstring(unicode("hello3")), "hello3") # u"hello3"
    check(unicode_strings.charstring(str("hello4")), "hello4")
    unicode_strings.charstring(unicode("hell" + unichr(0xb0) + "5")) # u"hell\xb05"
    unicode_strings.charstring(unicode("hell" + unichr(0x00f6) +"6")) # u"hell\u00f66"
    low_surrogate_string = unichr(0xdcff) # u"\udcff"
    unicode_strings.instring(low_surrogate_string)
else:
    low_surrogate_string = "\udcff"
    try:
        unicode_strings.instring(low_surrogate_string)
        raise RuntimeError("Exception should have been thrown")
    except TypeError as e:
        # Python 3 will fail the PyUnicode_AsUTF8String conversion resulting in a TypeError.
        # The real error is actually:
        # UnicodeEncodeError: 'utf-8' codec can't encode character '\udcff' in position 0: surrogates not allowed
        pass