Examples/test-suite/python/unicode_strings_runme.py - third_party/swig - Git at Google

 import sys

 import unicode_strings

 if sys.version_info[0:2] >= (3, 1):
     test_string = "h\udce9llo w\u00f6rld"
     if unicode_strings.non_utf8_c_str() != test_string:
         raise ValueError("Test comparison mismatch")
     if unicode_strings.non_utf8_std_string() != test_string:
         raise ValueError("Test comparison mismatch")

 def check(s1, s2):
     if s1 != s2:
         raise RuntimeError("{} != {}".format(s1, s2))

 # Testing SWIG_PYTHON_2_UNICODE flag which allows unicode strings to be passed to C
 if sys.version_info[0:2] < (3, 0):
     # Python 3.0-3.2 results in a SyntaxError when using u"" string literals, so we use a
     # convoluted unicode string construction using unicode() and unichr().
     # Conventional Python 2 syntax shown in comments.
     check(unicode_strings.charstring("hello1"), "hello1")
     check(unicode_strings.charstring(str(unicode("hello2"))), "hello2") # u"hello2"
     check(unicode_strings.charstring(unicode("hello3")), "hello3") # u"hello3"
     check(unicode_strings.charstring(str("hello4")), "hello4")
     unicode_strings.charstring(unicode("hell" + unichr(0xb0) + "5")) # u"hell\xb05"
     unicode_strings.charstring(unicode("hell" + unichr(0x00f6) +"6")) # u"hell\u00f66"
     low_surrogate_string = unichr(0xdcff) # u"\udcff"
     unicode_strings.instring(low_surrogate_string)
 else:
     low_surrogate_string = "\udcff"
     try:
         unicode_strings.instring(low_surrogate_string)
         raise RuntimeError("Exception should have been thrown")
     except TypeError as e:
         # Python 3 will fail the PyUnicode_AsUTF8String conversion resulting in a TypeError.
         # The real error is actually:
         # UnicodeEncodeError: 'utf-8' codec can't encode character '\udcff' in position 0: surrogates not allowed
         pass
	import sys

	import unicode_strings

	if sys.version_info[0:2] >= (3, 1):
	test_string = "h\udce9llo w\u00f6rld"
	if unicode_strings.non_utf8_c_str() != test_string:
	raise ValueError("Test comparison mismatch")
	if unicode_strings.non_utf8_std_string() != test_string:
	raise ValueError("Test comparison mismatch")

	def check(s1, s2):
	if s1 != s2:
	raise RuntimeError("{} != {}".format(s1, s2))

	# Testing SWIG_PYTHON_2_UNICODE flag which allows unicode strings to be passed to C
	if sys.version_info[0:2] < (3, 0):
	# Python 3.0-3.2 results in a SyntaxError when using u"" string literals, so we use a
	# convoluted unicode string construction using unicode() and unichr().
	# Conventional Python 2 syntax shown in comments.
	check(unicode_strings.charstring("hello1"), "hello1")
	check(unicode_strings.charstring(str(unicode("hello2"))), "hello2") # u"hello2"
	check(unicode_strings.charstring(unicode("hello3")), "hello3") # u"hello3"
	check(unicode_strings.charstring(str("hello4")), "hello4")
	unicode_strings.charstring(unicode("hell" + unichr(0xb0) + "5")) # u"hell\xb05"
	unicode_strings.charstring(unicode("hell" + unichr(0x00f6) +"6")) # u"hell\u00f66"
	low_surrogate_string = unichr(0xdcff) # u"\udcff"
	unicode_strings.instring(low_surrogate_string)
	else:
	low_surrogate_string = "\udcff"
	try:
	unicode_strings.instring(low_surrogate_string)
	raise RuntimeError("Exception should have been thrown")
	except TypeError as e:
	# Python 3 will fail the PyUnicode_AsUTF8String conversion resulting in a TypeError.
	# The real error is actually:
	# UnicodeEncodeError: 'utf-8' codec can't encode character '\udcff' in position 0: surrogates not allowed
	pass