mirror of
				https://github.com/python/cpython.git
				synced 2025-10-26 03:04:41 +00:00 
			
		
		
		
	 b4ff1113ca
			
		
	
	
		b4ff1113ca
		
	
	
	
	
		
			
			for this iconv() implementation in the init function. For encoding: use a byteswapped version of the input if neccessary. For decoding: byteswap every piece returned by iconv() if neccessary (but not those pieces returned from the callback) Comment out test_sane() in the test script, because whether this works depends on whether byte swapping is neccessary or not (an on Py_UNICODE_SIZE)
		
			
				
	
	
		
			99 lines
		
	
	
	
		
			3.8 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			99 lines
		
	
	
	
		
			3.8 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| from test import test_support
 | |
| import unittest, sys
 | |
| import codecs, _iconv_codec
 | |
| from encodings import iconv_codec
 | |
| from StringIO import StringIO
 | |
| 
 | |
| class IconvCodecTest(unittest.TestCase):
 | |
| 
 | |
|     if sys.byteorder == 'big':
 | |
|         spam = '\x00s\x00p\x00a\x00m' * 2
 | |
|     else:
 | |
|         spam = 's\x00p\x00a\x00m\x00' * 2
 | |
| 
 | |
|     def test_sane(self):
 | |
|         # FIXME: Commented out, because it's not clear whether
 | |
|         # the internal encoding choosen requires byte swapping
 | |
|         # for this iconv() implementation.
 | |
|         if False:
 | |
|             self.encoder, self.decoder, self.reader, self.writer = \
 | |
|                 codecs.lookup(_iconv_codec.internal_encoding)
 | |
|             self.assertEqual(self.decoder(self.spam), (u'spamspam', 16))
 | |
|             self.assertEqual(self.encoder(u'spamspam'), (self.spam, 8))
 | |
|             self.assertEqual(self.reader(StringIO(self.spam)).read(), u'spamspam')
 | |
|             f = StringIO()
 | |
|             self.writer(f).write(u'spamspam')
 | |
|             self.assertEqual(f.getvalue(), self.spam)
 | |
| 
 | |
|     def test_basic_errors(self):
 | |
|         self.encoder, self.decoder, self.reader, self.writer = \
 | |
|             iconv_codec.lookup("ascii")
 | |
|         def testencerror(errors):
 | |
|             return self.encoder(u'sp\ufffdam', errors)
 | |
|         def testdecerror(errors):
 | |
|             return self.decoder('sp\xffam', errors)
 | |
| 
 | |
|         self.assertRaises(UnicodeEncodeError, testencerror, 'strict')
 | |
|         self.assertRaises(UnicodeDecodeError, testdecerror, 'strict')
 | |
|         self.assertEqual(testencerror('replace'), ('sp?am', 5))
 | |
|         self.assertEqual(testdecerror('replace'), (u'sp\ufffdam', 5))
 | |
|         self.assertEqual(testencerror('ignore'), ('spam', 5))
 | |
|         self.assertEqual(testdecerror('ignore'), (u'spam', 5))
 | |
| 
 | |
|     def test_pep293_errors(self):
 | |
|         self.encoder, self.decoder, self.reader, self.writer = \
 | |
|             iconv_codec.lookup("ascii")
 | |
|         def testencerror(errors):
 | |
|             return self.encoder(u'sp\ufffdam', errors)
 | |
|         def testdecerror(errors):
 | |
|             return self.decoder('sp\xffam', errors)
 | |
| 
 | |
|         self.assertEqual(testencerror('xmlcharrefreplace'),
 | |
|                          ('sp�am', 5))
 | |
|         self.assertEqual(testencerror('backslashreplace'),
 | |
|                          ('sp\\ufffdam', 5))
 | |
| 
 | |
|         def error_bomb(exc):
 | |
|             return (u'*'*40, len(exc.object))
 | |
|         def error_mock(exc):
 | |
|             error_mock.lastexc = exc
 | |
|             return (unicode(exc.object[exc.start - 1]), exc.end)
 | |
| 
 | |
|         codecs.register_error('test_iconv_codec.bomb', error_bomb)
 | |
|         codecs.register_error('test_iconv_codec.mock', error_mock)
 | |
| 
 | |
|         self.assertEqual(testencerror('test_iconv_codec.bomb'),
 | |
|                          ('sp' + ('*'*40), 5))
 | |
|         self.assertEqual(testdecerror('test_iconv_codec.bomb'),
 | |
|                          (u'sp' + (u'*'*40), 5))
 | |
| 
 | |
|         self.assertEqual(testencerror('test_iconv_codec.mock'), ('sppam', 5))
 | |
|         exc = error_mock.lastexc
 | |
|         self.assertEqual(exc.object, u'sp\ufffdam')
 | |
|         self.assertEqual(exc.start, 2)
 | |
|         self.assertEqual(exc.end, 3)
 | |
|         self.assert_(isinstance(exc, UnicodeEncodeError))
 | |
| 
 | |
|         self.assertEqual(testdecerror('test_iconv_codec.mock'), (u'sppam', 5))
 | |
|         exc = error_mock.lastexc
 | |
|         self.assertEqual(exc.object, 'sp\xffam')
 | |
|         self.assertEqual(exc.start, 2)
 | |
|         self.assertEqual(exc.end, 3)
 | |
|         self.assert_(isinstance(exc, UnicodeDecodeError))
 | |
| 
 | |
|     def test_empty_escape_decode(self):
 | |
|         self.encoder, self.decoder, self.reader, self.writer = \
 | |
|             iconv_codec.lookup("ascii")
 | |
|         self.assertEquals(self.decoder(u""), ("", 0))
 | |
|         self.assertEquals(self.encoder(""), (u"", 0))
 | |
| 
 | |
| def test_main():
 | |
|     suite = unittest.TestSuite()
 | |
|     suite.addTest(unittest.makeSuite(IconvCodecTest))
 | |
|     test_support.run_suite(suite)
 | |
| 
 | |
| 
 | |
| if __name__ == "__main__":
 | |
|     test_main()
 | |
| 
 | |
| # ex: ts=8 sts=4 et
 |