File: unicode_strings_runme.py

package info (click to toggle)
swig 4.4.0-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 45,980 kB
  • sloc: cpp: 54,284; ansic: 29,022; java: 17,595; python: 12,734; cs: 10,421; ruby: 7,263; yacc: 6,501; makefile: 5,860; javascript: 5,538; sh: 5,422; perl: 4,246; php: 3,733; ml: 2,198; tcl: 2,015; lisp: 1,448; xml: 115
file content (38 lines) | stat: -rw-r--r-- 1,782 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import sys

import unicode_strings

# On Python 3.1 and later, both wrapped functions must return exactly test_string.
# NOTE(review): "\udce9" is a lone low surrogate, presumably the surrogateescape
# form of a non-UTF-8 byte coming back from C -- confirm against the SWIG
# interface for unicode_strings.
if sys.version_info[:2] >= (3, 1):
    test_string = "h\udce9llo w\u00f6rld"
    # Look each wrapper up only when it is about to be called, so the second
    # one is not touched unless the first comparison succeeded.
    for wrapper_name in ("non_utf8_c_str", "non_utf8_std_string"):
        wrapped_result = getattr(unicode_strings, wrapper_name)()
        if wrapped_result != test_string:
            raise ValueError("Test comparison mismatch")

def check(s1, s2):
    """Raise RuntimeError reporting both values when s1 differs from s2.

    Returns None when the two values compare as not different.
    """
    differs = s1 != s2
    if not differs:
        return
    message = "{} != {}".format(s1, s2)
    raise RuntimeError(message)

# Exercise the SWIG_PYTHON_2_UNICODE flag, which allows unicode strings to be passed to C.
if sys.version_info[0] < 3:
    # u"" string literals are a SyntaxError on Python 3.0-3.2, so the unicode values
    # below are assembled with unicode() and unichr() instead.
    # The conventional Python 2 spelling is shown in the trailing comments.
    round_trip_cases = (
        ("hello1", "hello1"),
        (str(unicode("hello2")), "hello2"), # u"hello2"
        (unicode("hello3"), "hello3"), # u"hello3"
        (str("hello4"), "hello4"),
    )
    for argument, expected in round_trip_cases:
        check(unicode_strings.charstring(argument), expected)

    # Non-ASCII input: the calls are made but their results are not compared.
    non_ascii_cases = (
        (0xb0, "5"), # u"hell\xb05"
        (0x00f6, "6"), # u"hell\u00f66"
    )
    for code_point, suffix in non_ascii_cases:
        unicode_strings.charstring(unicode("hell" + unichr(code_point) + suffix))

    # A lone low surrogate is passed through without expecting an exception here.
    low_surrogate_string = unichr(0xdcff) # u"\udcff"
    unicode_strings.instring(low_surrogate_string)
else:
    low_surrogate_string = "\udcff"
    try:
        unicode_strings.instring(low_surrogate_string)
    except TypeError:
        # Python 3 fails the PyUnicode_AsUTF8String conversion, which surfaces as a TypeError.
        # The underlying error is actually:
        # UnicodeEncodeError: 'utf-8' codec can't encode character '\udcff' in position 0: surrogates not allowed
        pass
    else:
        # Reached only when instring() accepted the lone surrogate without raising.
        raise RuntimeError("Exception should have been thrown")