| 
									
										
										
										
											2000-06-29 19:33:43 +00:00
										 |  |  | """Simple API for XML (SAX) implementation for Python.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | This module provides an implementation of the SAX 2 interface; | 
					
						
							|  |  |  | information about the Java version of the interface can be found at | 
					
						
							|  |  |  | http://www.megginson.com/SAX/.  The Python version of the interface is | 
					
						
							|  |  |  | documented at <...>. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | This package contains the following modules: | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  | handler -- Base classes and constants which define the SAX 2 API for | 
					
						
							|  |  |  |            the 'client-side' of SAX for Python. | 
					
						
							| 
									
										
										
										
											2000-06-29 19:33:43 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  | saxutils -- Implementation of the convenience classes commonly used to | 
					
						
							|  |  |  |             work with SAX. | 
					
						
							| 
									
										
										
										
											2000-06-29 19:33:43 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  | xmlreader -- Base classes and constants which define the SAX 2 API for | 
					
						
							|  |  |  |              the parsers used with SAX for Python. | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-24 20:38:18 +00:00
										 |  |  | expatreader -- Driver that allows use of the Expat parser with SAX. | 
					
						
							| 
									
										
										
										
											2000-06-29 19:33:43 +00:00
										 |  |  | """
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-24 18:54:49 +00:00
										 |  |  | from xmlreader import InputSource | 
					
						
							| 
									
										
										
										
											2000-07-01 13:44:04 +00:00
										 |  |  | from handler import ContentHandler, ErrorHandler | 
					
						
							|  |  |  | from _exceptions import SAXException, SAXNotRecognizedException, \ | 
					
						
							| 
									
										
										
										
											2000-10-06 17:41:52 +00:00
										 |  |  |                         SAXParseException, SAXNotSupportedException, \ | 
					
						
							|  |  |  |                         SAXReaderNotAvailable | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-07-01 04:58:47 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-24 18:54:49 +00:00
										 |  |  | def parse(source, handler, errorHandler=ErrorHandler()): | 
					
						
							| 
									
										
										
										
											2000-09-24 21:31:06 +00:00
										 |  |  |     parser = make_parser() | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  |     parser.setContentHandler(handler) | 
					
						
							|  |  |  |     parser.setErrorHandler(errorHandler) | 
					
						
							| 
									
										
										
										
											2000-09-24 18:54:49 +00:00
										 |  |  |     parser.parse(source) | 
					
						
							| 
									
										
										
										
											2000-07-01 04:58:47 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  | def parseString(string, handler, errorHandler=ErrorHandler()): | 
					
						
							| 
									
										
										
										
											2000-07-01 04:58:47 +00:00
										 |  |  |     try: | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  |         from cStringIO import StringIO | 
					
						
							| 
									
										
										
										
											2000-07-01 04:58:47 +00:00
										 |  |  |     except ImportError: | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  |         from StringIO import StringIO | 
					
						
							| 
									
										
										
										
											2000-10-23 18:09:50 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  |     if errorHandler is None: | 
					
						
							|  |  |  |         errorHandler = ErrorHandler() | 
					
						
							| 
									
										
										
										
											2000-09-24 21:31:06 +00:00
										 |  |  |     parser = make_parser() | 
					
						
							| 
									
										
										
										
											2000-09-18 16:31:08 +00:00
										 |  |  |     parser.setContentHandler(handler) | 
					
						
							|  |  |  |     parser.setErrorHandler(errorHandler) | 
					
						
							| 
									
										
										
										
											2000-09-24 18:54:49 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     inpsrc = InputSource() | 
					
						
							|  |  |  |     inpsrc.setByteStream(StringIO(string)) | 
					
						
							|  |  |  |     parser.parse(inpsrc) | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | # this is the parser list used by the make_parser function if no | 
					
						
							|  |  |  | # alternatives are given as parameters to the function | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | default_parser_list = ["xml.sax.expatreader"] | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2001-07-31 08:54:55 +00:00
										 |  |  | # tell modulefinder that importing sax potentially imports expatreader | 
					
						
							|  |  |  | _false = 0 | 
					
						
							|  |  |  | if _false: | 
					
						
							|  |  |  |     import xml.sax.expatreader | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | import os, string, sys | 
					
						
							|  |  |  | if os.environ.has_key("PY_SAX_PARSER"): | 
					
						
							|  |  |  |     default_parser_list = string.split(os.environ["PY_SAX_PARSER"], ",") | 
					
						
							|  |  |  | del os | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | _key = "python.xml.sax.parser" | 
					
						
							|  |  |  | if sys.platform[:4] == "java" and sys.registry.containsKey(_key): | 
					
						
							|  |  |  |     default_parser_list = string.split(sys.registry.getProperty(_key), ",") | 
					
						
							| 
									
										
										
										
											2000-10-23 18:09:50 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | def make_parser(parser_list = []): | 
					
						
							|  |  |  |     """Creates and returns a SAX parser.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Creates the first parser it is able to instantiate of the ones | 
					
						
							|  |  |  |     given in the list created by doing parser_list + | 
					
						
							|  |  |  |     default_parser_list.  The lists must contain the names of Python | 
					
						
							|  |  |  |     modules containing both a SAX parser and a create_parser function."""
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     for parser_name in parser_list + default_parser_list: | 
					
						
							|  |  |  |         try: | 
					
						
							| 
									
										
										
										
											2000-09-22 05:07:56 +00:00
										 |  |  |             return _create_parser(parser_name) | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  |         except ImportError,e: | 
					
						
							| 
									
										
										
										
											2000-10-06 17:41:52 +00:00
										 |  |  |             import sys | 
					
						
							|  |  |  |             if sys.modules.has_key(parser_name): | 
					
						
							|  |  |  |                 # The parser module was found, but importing it | 
					
						
							|  |  |  |                 # failed unexpectedly, pass this exception through | 
					
						
							|  |  |  |                 raise | 
					
						
							|  |  |  |         except SAXReaderNotAvailable: | 
					
						
							|  |  |  |             # The parser module detected that it won't work properly, | 
					
						
							|  |  |  |             # so try the next one | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  |             pass | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-10-23 18:09:50 +00:00
										 |  |  |     raise SAXReaderNotAvailable("No parsers found", None) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | # --- Internal utility methods used by make_parser | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | if sys.platform[ : 4] == "java": | 
					
						
							|  |  |  |     def _create_parser(parser_name): | 
					
						
							| 
									
										
										
										
											2000-09-22 09:30:29 +00:00
										 |  |  |         from org.python.core import imp | 
					
						
							|  |  |  |         drv_module = imp.importName(parser_name, 0, globals()) | 
					
						
							|  |  |  |         return drv_module.create_parser() | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | else: | 
					
						
							|  |  |  |     def _create_parser(parser_name): | 
					
						
							| 
									
										
										
										
											2000-09-24 21:31:06 +00:00
										 |  |  |         drv_module = __import__(parser_name,{},{},['create_parser']) | 
					
						
							| 
									
										
										
										
											2000-09-22 09:30:29 +00:00
										 |  |  |         return drv_module.create_parser() | 
					
						
							| 
									
										
										
										
											2000-09-21 08:34:04 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | del sys |