|
|
|
|
|
|
|
|
import sys |
|
|
import unittest |
|
|
|
|
|
import Cython.Compiler.StringEncoding as StringEncoding |
|
|
|
|
|
|
|
|
class StringEncodingTest(unittest.TestCase): |
|
|
""" |
|
|
Test the StringEncoding module. |
|
|
""" |
|
|
def test_string_contains_lone_surrogates(self): |
|
|
self.assertFalse(StringEncoding.string_contains_lone_surrogates(u"abc")) |
|
|
self.assertFalse(StringEncoding.string_contains_lone_surrogates(u"\uABCD")) |
|
|
self.assertFalse(StringEncoding.string_contains_lone_surrogates(u"\N{SNOWMAN}")) |
|
|
|
|
|
|
|
|
|
|
|
if sys.version_info[0] != 2: |
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(u"\uD800\uDFFF")) |
|
|
|
|
|
|
|
|
obfuscated_surrogate_pair = (u"\uDFFF" + "\uD800")[::-1] |
|
|
if sys.version_info[0] == 2 and sys.maxunicode == 65565: |
|
|
self.assertFalse(StringEncoding.string_contains_lone_surrogates(obfuscated_surrogate_pair)) |
|
|
else: |
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(obfuscated_surrogate_pair)) |
|
|
|
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(u"\uD800")) |
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(u"\uDFFF")) |
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(u"\uDFFF\uD800")) |
|
|
self.assertTrue(StringEncoding.string_contains_lone_surrogates(u"\uD800x\uDFFF")) |
|
|
|
|
|
def test_string_contains_surrogates(self): |
|
|
self.assertFalse(StringEncoding.string_contains_surrogates(u"abc")) |
|
|
self.assertFalse(StringEncoding.string_contains_surrogates(u"\uABCD")) |
|
|
self.assertFalse(StringEncoding.string_contains_surrogates(u"\N{SNOWMAN}")) |
|
|
|
|
|
self.assertTrue(StringEncoding.string_contains_surrogates(u"\uD800")) |
|
|
self.assertTrue(StringEncoding.string_contains_surrogates(u"\uDFFF")) |
|
|
self.assertTrue(StringEncoding.string_contains_surrogates(u"\uD800\uDFFF")) |
|
|
self.assertTrue(StringEncoding.string_contains_surrogates(u"\uDFFF\uD800")) |
|
|
self.assertTrue(StringEncoding.string_contains_surrogates(u"\uD800x\uDFFF")) |
|
|
|