1 """ Test script for the unicodedata module.
3 Written by Marc-Andre Lemburg (mal@lemburg.com).
5 (c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
8 import unittest
, test
.test_support
16 class UnicodeMethodsTest(unittest
.TestCase
):
18 # update this, if the database changes
19 expectedchecksum
= 'a37276dc2c158bef6dfd908ad34525c97180fad9'
21 def test_method_checksum(self
):
23 for i
in range(65536):
26 # Predicates (single char)
27 u
"01"[char
.isalnum()],
28 u
"01"[char
.isalpha()],
29 u
"01"[char
.isdecimal()],
30 u
"01"[char
.isdigit()],
31 u
"01"[char
.islower()],
32 u
"01"[char
.isnumeric()],
33 u
"01"[char
.isspace()],
34 u
"01"[char
.istitle()],
35 u
"01"[char
.isupper()],
37 # Predicates (multiple chars)
38 u
"01"[(char
+ u
'abc').isalnum()],
39 u
"01"[(char
+ u
'abc').isalpha()],
40 u
"01"[(char
+ u
'123').isdecimal()],
41 u
"01"[(char
+ u
'123').isdigit()],
42 u
"01"[(char
+ u
'abc').islower()],
43 u
"01"[(char
+ u
'123').isnumeric()],
44 u
"01"[(char
+ u
' \t').isspace()],
45 u
"01"[(char
+ u
'abc').istitle()],
46 u
"01"[(char
+ u
'ABC').isupper()],
48 # Mappings (single char)
53 # Mappings (multiple chars)
54 (char
+ u
'abc').lower(),
55 (char
+ u
'ABC').upper(),
56 (char
+ u
'abc').title(),
57 (char
+ u
'ABC').title(),
60 h
.update(u
''.join(data
).encode(encoding
))
61 result
= h
.hexdigest()
62 self
.assertEqual(result
, self
.expectedchecksum
)
64 class UnicodeDatabaseTest(unittest
.TestCase
):
67 # In case unicodedata is not available, this will raise an ImportError,
68 # but the other test cases will still be run
75 class UnicodeFunctionsTest(UnicodeDatabaseTest
):
77 # update this, if the database changes
78 expectedchecksum
= 'cfe20a967a450ebc82ca68c3e4eed344164e11af'
80 def test_function_checksum(self
):
84 for i
in range(0x10000):
88 str(self
.db
.digit(char
, -1)),
89 str(self
.db
.numeric(char
, -1)),
90 str(self
.db
.decimal(char
, -1)),
91 self
.db
.category(char
),
92 self
.db
.bidirectional(char
),
93 self
.db
.decomposition(char
),
94 str(self
.db
.mirrored(char
)),
95 str(self
.db
.combining(char
)),
97 h
.update(''.join(data
))
98 result
= h
.hexdigest()
99 self
.assertEqual(result
, self
.expectedchecksum
)
101 def test_digit(self
):
102 self
.assertEqual(self
.db
.digit(u
'A', None), None)
103 self
.assertEqual(self
.db
.digit(u
'9'), 9)
104 self
.assertEqual(self
.db
.digit(u
'\u215b', None), None)
105 self
.assertEqual(self
.db
.digit(u
'\u2468'), 9)
107 self
.assertRaises(TypeError, self
.db
.digit
)
108 self
.assertRaises(TypeError, self
.db
.digit
, u
'xx')
109 self
.assertRaises(ValueError, self
.db
.digit
, u
'x')
111 def test_numeric(self
):
112 self
.assertEqual(self
.db
.numeric(u
'A',None), None)
113 self
.assertEqual(self
.db
.numeric(u
'9'), 9)
114 self
.assertEqual(self
.db
.numeric(u
'\u215b'), 0.125)
115 self
.assertEqual(self
.db
.numeric(u
'\u2468'), 9.0)
117 self
.assertRaises(TypeError, self
.db
.numeric
)
118 self
.assertRaises(TypeError, self
.db
.numeric
, u
'xx')
119 self
.assertRaises(ValueError, self
.db
.numeric
, u
'x')
121 def test_decimal(self
):
122 self
.assertEqual(self
.db
.decimal(u
'A',None), None)
123 self
.assertEqual(self
.db
.decimal(u
'9'), 9)
124 self
.assertEqual(self
.db
.decimal(u
'\u215b', None), None)
125 self
.assertEqual(self
.db
.decimal(u
'\u2468', None), None)
127 self
.assertRaises(TypeError, self
.db
.decimal
)
128 self
.assertRaises(TypeError, self
.db
.decimal
, u
'xx')
129 self
.assertRaises(ValueError, self
.db
.decimal
, u
'x')
131 def test_category(self
):
132 self
.assertEqual(self
.db
.category(u
'\uFFFE'), 'Cn')
133 self
.assertEqual(self
.db
.category(u
'a'), 'Ll')
134 self
.assertEqual(self
.db
.category(u
'A'), 'Lu')
136 self
.assertRaises(TypeError, self
.db
.category
)
137 self
.assertRaises(TypeError, self
.db
.category
, u
'xx')
139 def test_bidirectional(self
):
140 self
.assertEqual(self
.db
.bidirectional(u
'\uFFFE'), '')
141 self
.assertEqual(self
.db
.bidirectional(u
' '), 'WS')
142 self
.assertEqual(self
.db
.bidirectional(u
'A'), 'L')
144 self
.assertRaises(TypeError, self
.db
.bidirectional
)
145 self
.assertRaises(TypeError, self
.db
.bidirectional
, u
'xx')
147 def test_decomposition(self
):
148 self
.assertEqual(self
.db
.decomposition(u
'\uFFFE'),'')
149 self
.assertEqual(self
.db
.decomposition(u
'\u00bc'), '<fraction> 0031 2044 0034')
151 self
.assertRaises(TypeError, self
.db
.decomposition
)
152 self
.assertRaises(TypeError, self
.db
.decomposition
, u
'xx')
154 def test_mirrored(self
):
155 self
.assertEqual(self
.db
.mirrored(u
'\uFFFE'), 0)
156 self
.assertEqual(self
.db
.mirrored(u
'a'), 0)
157 self
.assertEqual(self
.db
.mirrored(u
'\u2201'), 1)
159 self
.assertRaises(TypeError, self
.db
.mirrored
)
160 self
.assertRaises(TypeError, self
.db
.mirrored
, u
'xx')
162 def test_combining(self
):
163 self
.assertEqual(self
.db
.combining(u
'\uFFFE'), 0)
164 self
.assertEqual(self
.db
.combining(u
'a'), 0)
165 self
.assertEqual(self
.db
.combining(u
'\u20e1'), 230)
167 self
.assertRaises(TypeError, self
.db
.combining
)
168 self
.assertRaises(TypeError, self
.db
.combining
, u
'xx')
170 def test_normalize(self
):
171 self
.assertRaises(TypeError, self
.db
.normalize
)
172 self
.assertRaises(ValueError, self
.db
.normalize
, 'unknown', u
'xx')
173 # The rest can be found in test_normalization.py
174 # which requires an external file.
177 class UnicodeMiscTest(UnicodeDatabaseTest
):
179 def test_decimal_numeric_consistent(self
):
180 # Test that decimal and numeric are consistent,
181 # i.e. if a character has a decimal value,
182 # it's numeric value should be the same.
184 for i
in xrange(0x10000):
186 dec
= self
.db
.decimal(c
, -1)
188 self
.assertEqual(dec
, self
.db
.numeric(c
))
190 self
.assert_(count
>= 10) # should have tested at least the ASCII digits
192 def test_digit_numeric_consistent(self
):
193 # Test that digit and numeric are consistent,
194 # i.e. if a character has a digit value,
195 # it's numeric value should be the same.
197 for i
in xrange(0x10000):
199 dec
= self
.db
.digit(c
, -1)
201 self
.assertEqual(dec
, self
.db
.numeric(c
))
203 self
.assert_(count
>= 10) # should have tested at least the ASCII digits
206 test
.test_support
.run_unittest(
212 if __name__
== "__main__":