| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | #!/usr/bin/env python | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # test_multibytecodec_support.py | 
					
						
							|  |  |  | #   Common Unittest Routines for CJK codecs | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import sys, codecs, os.path | 
					
						
							|  |  |  | import unittest | 
					
						
							|  |  |  | from test import test_support | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  | from io import BytesIO | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | class TestBase: | 
					
						
							|  |  |  |     encoding        = ''   # codec name | 
					
						
							|  |  |  |     codec           = None # codec tuple (with 4 elements) | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |     tstring         = None # must set. 2 strings to test StreamReader | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     codectests      = None # must set. codec test tuple | 
					
						
							|  |  |  |     roundtriptest   = 1    # set if roundtrip is possible with unicode | 
					
						
							|  |  |  |     has_iso10646    = 0    # set if this encoding contains whole iso10646 map | 
					
						
							|  |  |  |     xmlcharnametest = None # string to test xmlcharrefreplace | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |     unmappedunicode = '\udeee' # a unicode codepoint that is not mapped. | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def setUp(self): | 
					
						
							|  |  |  |         if self.codec is None: | 
					
						
							|  |  |  |             self.codec = codecs.lookup(self.encoding) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         self.encode = self.codec.encode | 
					
						
							|  |  |  |         self.decode = self.codec.decode | 
					
						
							|  |  |  |         self.reader = self.codec.streamreader | 
					
						
							|  |  |  |         self.writer = self.codec.streamwriter | 
					
						
							|  |  |  |         self.incrementalencoder = self.codec.incrementalencoder | 
					
						
							|  |  |  |         self.incrementaldecoder = self.codec.incrementaldecoder | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def test_chunkcoding(self): | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |         for native, utf8 in zip(*[map(bytes, str8(f).splitlines(1)) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                                   for f in self.tstring]): | 
					
						
							|  |  |  |             u = self.decode(native)[0] | 
					
						
							|  |  |  |             self.assertEqual(u, utf8.decode('utf-8')) | 
					
						
							|  |  |  |             if self.roundtriptest: | 
					
						
							|  |  |  |                 self.assertEqual(native, self.encode(u)[0]) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_errorhandle(self): | 
					
						
							|  |  |  |         for source, scheme, expected in self.codectests: | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |             if isinstance(source, bytes): | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                 func = self.decode | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 func = self.encode | 
					
						
							|  |  |  |             if expected: | 
					
						
							|  |  |  |                 result = func(source, scheme)[0] | 
					
						
							|  |  |  |                 self.assertEqual(result, expected) | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 self.assertRaises(UnicodeError, func, source, scheme) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |     def test_xmlcharrefreplace(self): | 
					
						
							|  |  |  |         if self.has_iso10646: | 
					
						
							|  |  |  |             return | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |         s = "\u0b13\u0b23\u0b60 nd eggs" | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         self.assertEqual( | 
					
						
							|  |  |  |             self.encode(s, "xmlcharrefreplace")[0], | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |             b"ଓଣୠ nd eggs" | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_customreplace_encode(self): | 
					
						
							|  |  |  |         if self.has_iso10646: | 
					
						
							|  |  |  |             return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         from htmlentitydefs import codepoint2name | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         def xmlcharnamereplace(exc): | 
					
						
							|  |  |  |             if not isinstance(exc, UnicodeEncodeError): | 
					
						
							|  |  |  |                 raise TypeError("don't know how to handle %r" % exc) | 
					
						
							|  |  |  |             l = [] | 
					
						
							|  |  |  |             for c in exc.object[exc.start:exc.end]: | 
					
						
							|  |  |  |                 if ord(c) in codepoint2name: | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |                     l.append("&%s;" % codepoint2name[ord(c)]) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                 else: | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |                     l.append("&#%d;" % ord(c)) | 
					
						
							|  |  |  |             return ("".join(l), exc.end) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         codecs.register_error("test.xmlcharnamereplace", xmlcharnamereplace) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         if self.xmlcharnametest: | 
					
						
							|  |  |  |             sin, sout = self.xmlcharnametest | 
					
						
							|  |  |  |         else: | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             sin = "\xab\u211c\xbb = \u2329\u1234\u232a" | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |             sout = b"«ℜ» = ⟨ሴ⟩" | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         self.assertEqual(self.encode(sin, | 
					
						
							|  |  |  |                                     "test.xmlcharnamereplace")[0], sout) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_wrong_objects(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							|  |  |  |             return (ret, exc.end) | 
					
						
							|  |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |         for ret in ([1, 2, 3], [], None, object(), b'string', b''): | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |             self.assertRaises(TypeError, self.encode, self.unmappedunicode, | 
					
						
							|  |  |  |                               'test.cjktest') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_long_index(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('x', int(exc.end)) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |         self.assertEqual(self.encode('abcd' + self.unmappedunicode + 'efgh', | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |                                      'test.cjktest'), (b'abcdxefgh', 9)) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('x', sys.maxint + 1) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							|  |  |  |         self.assertRaises(IndexError, self.encode, self.unmappedunicode, | 
					
						
							|  |  |  |                           'test.cjktest') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_None_index(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('x', None) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							|  |  |  |         self.assertRaises(TypeError, self.encode, self.unmappedunicode, | 
					
						
							|  |  |  |                           'test.cjktest') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_backward_index(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							|  |  |  |             if myreplace.limit > 0: | 
					
						
							|  |  |  |                 myreplace.limit -= 1 | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |                 return ('REPLACED', 0) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |             else: | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |                 return ('TERMINAL', exc.end) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         myreplace.limit = 3 | 
					
						
							|  |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |         self.assertEqual(self.encode('abcd' + self.unmappedunicode + 'efgh', | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                                      'test.cjktest'), | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |                 (b'abcdREPLACEDabcdREPLACEDabcdREPLACEDabcdTERMINALefgh', 9)) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_forward_index(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('REPLACED', exc.end + 2) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |         self.assertEqual(self.encode('abcd' + self.unmappedunicode + 'efgh', | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |                                      'test.cjktest'), (b'abcdREPLACEDgh', 9)) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def test_callback_index_outofbound(self): | 
					
						
							|  |  |  |         def myreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('TERM', 100) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error("test.cjktest", myreplace) | 
					
						
							|  |  |  |         self.assertRaises(IndexError, self.encode, self.unmappedunicode, | 
					
						
							|  |  |  |                           'test.cjktest') | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_incrementalencoder(self): | 
					
						
							|  |  |  |         UTF8Reader = codecs.getreader('utf-8') | 
					
						
							| 
									
										
										
										
											2007-05-07 22:24:25 +00:00
										 |  |  |         for sizehint in [None] + list(range(1, 33)) + \ | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                         [64, 128, 256, 512, 1024]: | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |             istream = UTF8Reader(BytesIO(self.tstring[1])) | 
					
						
							|  |  |  |             ostream = BytesIO() | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |             encoder = self.incrementalencoder() | 
					
						
							|  |  |  |             while 1: | 
					
						
							|  |  |  |                 if sizehint is not None: | 
					
						
							|  |  |  |                     data = istream.read(sizehint) | 
					
						
							|  |  |  |                 else: | 
					
						
							|  |  |  |                     data = istream.read() | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                 if not data: | 
					
						
							|  |  |  |                     break | 
					
						
							|  |  |  |                 e = encoder.encode(data) | 
					
						
							|  |  |  |                 ostream.write(e) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |             self.assertEqual(ostream.getvalue(), self.tstring[0]) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |     def test_incrementaldecoder(self): | 
					
						
							|  |  |  |         UTF8Writer = codecs.getwriter('utf-8') | 
					
						
							| 
									
										
										
										
											2007-05-07 22:24:25 +00:00
										 |  |  |         for sizehint in [None, -1] + list(range(1, 33)) + \ | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                         [64, 128, 256, 512, 1024]: | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |             istream = BytesIO(self.tstring[0]) | 
					
						
							|  |  |  |             ostream = UTF8Writer(BytesIO()) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |             decoder = self.incrementaldecoder() | 
					
						
							|  |  |  |             while 1: | 
					
						
							|  |  |  |                 data = istream.read(sizehint) | 
					
						
							|  |  |  |                 if not data: | 
					
						
							|  |  |  |                     break | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                 else: | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |                     u = decoder.decode(data) | 
					
						
							|  |  |  |                     ostream.write(u) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             self.assertEqual(ostream.getvalue(), self.tstring[1]) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_incrementalencoder_error_callback(self): | 
					
						
							|  |  |  |         inv = self.unmappedunicode | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         e = self.incrementalencoder() | 
					
						
							|  |  |  |         self.assertRaises(UnicodeEncodeError, e.encode, inv, True) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         e.errors = 'ignore' | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |         self.assertEqual(e.encode(inv, True), b'') | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         e.reset() | 
					
						
							|  |  |  |         def tempreplace(exc): | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             return ('called', exc.end) | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         codecs.register_error('test.incremental_error_callback', tempreplace) | 
					
						
							|  |  |  |         e.errors = 'test.incremental_error_callback' | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |         self.assertEqual(e.encode(inv, True), b'called') | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         # again | 
					
						
							|  |  |  |         e.errors = 'ignore' | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |         self.assertEqual(e.encode(inv, True), b'') | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def test_streamreader(self): | 
					
						
							|  |  |  |         UTF8Writer = codecs.getwriter('utf-8') | 
					
						
							|  |  |  |         for name in ["read", "readline", "readlines"]: | 
					
						
							| 
									
										
										
										
											2007-05-07 22:24:25 +00:00
										 |  |  |             for sizehint in [None, -1] + list(range(1, 33)) + \ | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                             [64, 128, 256, 512, 1024]: | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |                 istream = self.reader(BytesIO(self.tstring[0])) | 
					
						
							|  |  |  |                 ostream = UTF8Writer(BytesIO()) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                 func = getattr(istream, name) | 
					
						
							|  |  |  |                 while 1: | 
					
						
							|  |  |  |                     data = func(sizehint) | 
					
						
							|  |  |  |                     if not data: | 
					
						
							|  |  |  |                         break | 
					
						
							|  |  |  |                     if name == "readlines": | 
					
						
							|  |  |  |                         ostream.writelines(data) | 
					
						
							|  |  |  |                     else: | 
					
						
							|  |  |  |                         ostream.write(data) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                 self.assertEqual(ostream.getvalue(), self.tstring[1]) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_streamwriter(self): | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |         readfuncs = ('read', 'readline', 'readlines') | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |         UTF8Reader = codecs.getreader('utf-8') | 
					
						
							|  |  |  |         for name in readfuncs: | 
					
						
							| 
									
										
										
										
											2007-05-07 22:24:25 +00:00
										 |  |  |             for sizehint in [None] + list(range(1, 33)) + \ | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                             [64, 128, 256, 512, 1024]: | 
					
						
							| 
									
										
										
										
											2007-05-17 23:59:11 +00:00
										 |  |  |                 istream = UTF8Reader(BytesIO(self.tstring[1])) | 
					
						
							|  |  |  |                 ostream = self.writer(BytesIO()) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                 func = getattr(istream, name) | 
					
						
							|  |  |  |                 while 1: | 
					
						
							|  |  |  |                     if sizehint is not None: | 
					
						
							|  |  |  |                         data = func(sizehint) | 
					
						
							|  |  |  |                     else: | 
					
						
							|  |  |  |                         data = func() | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                     if not data: | 
					
						
							|  |  |  |                         break | 
					
						
							|  |  |  |                     if name == "readlines": | 
					
						
							|  |  |  |                         ostream.writelines(data) | 
					
						
							|  |  |  |                     else: | 
					
						
							|  |  |  |                         ostream.write(data) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |                 self.assertEqual(ostream.getvalue(), self.tstring[0]) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  | if len('\U00012345') == 2: # ucs2 build | 
					
						
							| 
									
										
										
										
											2007-05-03 17:18:26 +00:00
										 |  |  |     _unichr = chr | 
					
						
							|  |  |  |     def chr(v): | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |         if v >= 0x10000: | 
					
						
							|  |  |  |             return _unichr(0xd800 + ((v - 0x10000) >> 10)) + \ | 
					
						
							|  |  |  |                    _unichr(0xdc00 + ((v - 0x10000) & 0x3ff)) | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             return _unichr(v) | 
					
						
							|  |  |  |     _ord = ord | 
					
						
							|  |  |  |     def ord(c): | 
					
						
							|  |  |  |         if len(c) == 2: | 
					
						
							|  |  |  |             return 0x10000 + ((_ord(c[0]) - 0xd800) << 10) + \ | 
					
						
							|  |  |  |                           (ord(c[1]) - 0xdc00) | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             return _ord(c) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class TestBase_Mapping(unittest.TestCase): | 
					
						
							|  |  |  |     pass_enctest = [] | 
					
						
							|  |  |  |     pass_dectest = [] | 
					
						
							|  |  |  |     supmaps = [] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def __init__(self, *args, **kw): | 
					
						
							|  |  |  |         unittest.TestCase.__init__(self, *args, **kw) | 
					
						
							| 
									
										
										
										
											2005-12-10 17:44:27 +00:00
										 |  |  |         self.open_mapping_file() # test it to report the error early | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def open_mapping_file(self): | 
					
						
							|  |  |  |         return test_support.open_urlresource(self.mapfileurl) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def test_mapping_file(self): | 
					
						
							| 
									
										
										
										
											2007-05-03 17:18:26 +00:00
										 |  |  |         unichrs = lambda s: ''.join(map(chr, map(eval, s.split('+')))) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |         urt_wa = {} | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2005-12-10 17:44:27 +00:00
										 |  |  |         for line in self.open_mapping_file(): | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |             if not line: | 
					
						
							|  |  |  |                 break | 
					
						
							|  |  |  |             data = line.split('#')[0].strip().split() | 
					
						
							|  |  |  |             if len(data) != 2: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             csetval = eval(data[0]) | 
					
						
							|  |  |  |             if csetval <= 0x7F: | 
					
						
							| 
									
										
										
										
											2007-07-23 18:06:59 +00:00
										 |  |  |                 csetch = bytes([csetval & 0xff]) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |             elif csetval >= 0x1000000: | 
					
						
							| 
									
										
										
										
											2007-07-23 18:06:59 +00:00
										 |  |  |                 csetch = bytes([(csetval >> 24), ((csetval >> 16) & 0xff), | 
					
						
							|  |  |  |                                 ((csetval >> 8) & 0xff), (csetval & 0xff)]) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |             elif csetval >= 0x10000: | 
					
						
							| 
									
										
										
										
											2007-07-23 18:06:59 +00:00
										 |  |  |                 csetch = bytes([(csetval >> 16), ((csetval >> 8) & 0xff), | 
					
						
							|  |  |  |                                 (csetval & 0xff)]) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |             elif csetval >= 0x100: | 
					
						
							| 
									
										
										
										
											2007-07-23 18:06:59 +00:00
										 |  |  |                 csetch = bytes([(csetval >> 8), (csetval & 0xff)]) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |             else: | 
					
						
							|  |  |  |                 continue | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             unich = unichrs(data[1]) | 
					
						
							| 
									
										
										
										
											2006-08-18 22:13:04 +00:00
										 |  |  |             if ord(unich) == 0xfffd or unich in urt_wa: | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  |                 continue | 
					
						
							|  |  |  |             urt_wa[unich] = csetch | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             self._testpoint(csetch, unich) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def test_mapping_supplemental(self): | 
					
						
							|  |  |  |         for mapping in self.supmaps: | 
					
						
							|  |  |  |             self._testpoint(*mapping) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _testpoint(self, csetch, unich): | 
					
						
							|  |  |  |         if (csetch, unich) not in self.pass_enctest: | 
					
						
							|  |  |  |             self.assertEqual(unich.encode(self.encoding), csetch) | 
					
						
							|  |  |  |         if (csetch, unich) not in self.pass_dectest: | 
					
						
							| 
									
										
										
										
											2007-05-02 19:09:54 +00:00
										 |  |  |             self.assertEqual(str(csetch, self.encoding), unich) | 
					
						
							| 
									
										
										
										
											2004-01-17 14:29:29 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | def load_teststring(encoding): | 
					
						
							| 
									
										
										
										
											2006-04-21 10:40:58 +00:00
										 |  |  |     from test import cjkencodings_test | 
					
						
							|  |  |  |     return cjkencodings_test.teststring[encoding] |