summaryrefslogtreecommitdiff
path: root/Lib/test/test_ucn.py
diff options
context:
space:
mode:
authorMarc-André Lemburg <mal@egenix.com>2000-06-30 09:45:20 +0000
committerMarc-André Lemburg <mal@egenix.com>2000-06-30 09:45:20 +0000
commit6cdec2efbb0139600aa582ffc4530172194364be (patch)
treef82c38de54b39abb169081f3944f76ea2947c875 /Lib/test/test_ucn.py
parent5f2e75e87ce7ca3fd2b2de7a4af4c3fede289b77 (diff)
downloadcpython-git-6cdec2efbb0139600aa582ffc4530172194364be.tar.gz
New test for the ucnhash module.
Diffstat (limited to 'Lib/test/test_ucn.py')
-rw-r--r--Lib/test/test_ucn.py82
1 files changed, 82 insertions, 0 deletions
diff --git a/Lib/test/test_ucn.py b/Lib/test/test_ucn.py
new file mode 100644
index 0000000000..d631406a00
--- /dev/null
+++ b/Lib/test/test_ucn.py
@@ -0,0 +1,82 @@
+""" Test script for the Unicode implementation.
+
+Written by Bill Tutt.
+
+(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
+
+"""#"
+print 'Testing General Unicode Character Name, and case insensitivity...',
+
+# General and case insensitivity test:
+s = u"\N{LATIN CAPITAL LETTER T}" \
+ u"\N{LATIN SMALL LETTER H}" \
+ u"\N{LATIN SMALL LETTER E}" \
+ u"\N{SPACE}" \
+ u"\N{LATIN SMALL LETTER R}" \
+ u"\N{LATIN CAPITAL LETTER E}" \
+ u"\N{LATIN SMALL LETTER D}" \
+ u"\N{SPACE}" \
+ u"\N{LATIN SMALL LETTER f}" \
+ u"\N{LATIN CAPITAL LeTtEr o}" \
+ u"\N{LATIN SMaLl LETTER x}" \
+ u"\N{SPACE}" \
+ u"\N{LATIN SMALL LETTER A}" \
+ u"\N{LATIN SMALL LETTER T}" \
+ u"\N{LATIN SMALL LETTER E}" \
+ u"\N{SPACE}" \
+ u"\N{LATIN SMALL LETTER T}" \
+ u"\N{LATIN SMALL LETTER H}" \
+ u"\N{LATIN SMALL LETTER E}" \
+ u"\N{SpAcE}" \
+ u"\N{LATIN SMALL LETTER S}" \
+ u"\N{LATIN SMALL LETTER H}" \
+ u"\N{LATIN SMALL LETTER E}" \
+ u"\N{LATIN SMALL LETTER E}" \
+ u"\N{LATIN SMALL LETTER P}" \
+ u"\N{FULL STOP}"
+assert s == u"The rEd fOx ate the sheep.", s
+print "done."
+
+# misc. symbol testing
+print "Testing misc. symbols for unicode character name expansion....",
+assert u"\N{PILCROW SIGN}" == u"\u00b6"
+assert u"\N{REPLACEMENT CHARACTER}" == u"\uFFFD"
+assert u"\N{HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK}" == u"\uFF9F"
+assert u"\N{FULLWIDTH LATIN SMALL LETTER A}" == u"\uFF41"
+print "done."
+
+
+# strict error testing:
+print "Testing unicode character name expansion strict error handling....",
+k_cchMaxUnicodeName = 83
+
+s = "\N{" + "1" * (k_cchMaxUnicodeName + 2) + "}"
+try:
+ unicode(s, 'unicode-escape', 'strict')
+except UnicodeError:
+ pass
+else:
+ raise AssertionError, "failed to raise an exception when presented " \
+ "with a UCN > k_cchMaxUnicodeName"
+try:
+ unicode("\N{blah}", 'unicode-escape', 'strict')
+except UnicodeError:
+ pass
+else:
+ raise AssertionError, "failed to raise an exception when given a bogus character name"
+
+try:
+ unicode("\N{SPACE", 'unicode-escape', 'strict')
+except UnicodeError:
+ pass
+else:
+ raise AssertionError, "failed to raise an exception for a missing closing brace."
+
+try:
+ unicode("\NSPACE", 'unicode-escape', 'strict')
+except UnicodeError:
+ pass
+else:
+ raise AssertionError, "failed to raise an exception for a missing opening brace."
+print "done."
+