| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  | #! /usr/bin/env python | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | """Convert ESIS events to SGML or XML markup.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | This is limited, but seems sufficient for the ESIS generated by the | 
					
						
							|  |  |  | latex2esis.py script when run over the Python documentation. | 
					
						
							|  |  |  | """
 | 
					
						
							|  |  |  | __version__ = '$Revision$' | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import errno | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  | import esistools | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  | import re | 
					
						
							|  |  |  | import string | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1999-01-14 17:06:09 +00:00
										 |  |  | from xml.utils import escape | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | def format_attrs(attrs): | 
					
						
							|  |  |  |     attrs = attrs.items() | 
					
						
							|  |  |  |     attrs.sort() | 
					
						
							|  |  |  |     s = '' | 
					
						
							|  |  |  |     for name, value in attrs: | 
					
						
							| 
									
										
										
										
											1999-01-14 17:06:09 +00:00
										 |  |  |         s = '%s %s="%s"' % (s, name, escape(value)) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |     return s | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1998-12-10 18:31:37 +00:00
										 |  |  | def do_convert(ifp, ofp, xml=0): | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |     attrs = {} | 
					
						
							|  |  |  |     lastopened = None | 
					
						
							| 
									
										
										
										
											1998-12-10 18:31:37 +00:00
										 |  |  |     knownempties = [] | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |     knownempty = 0 | 
					
						
							|  |  |  |     lastempty = 0 | 
					
						
							|  |  |  |     while 1: | 
					
						
							|  |  |  |         line = ifp.readline() | 
					
						
							|  |  |  |         if not line: | 
					
						
							|  |  |  |             break | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         type = line[0] | 
					
						
							|  |  |  |         data = line[1:] | 
					
						
							|  |  |  |         if data and data[-1] == "\n": | 
					
						
							|  |  |  |             data = data[:-1] | 
					
						
							|  |  |  |         if type == "-": | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |             data = esistools.decode(data) | 
					
						
							| 
									
										
										
										
											1999-01-14 17:06:09 +00:00
										 |  |  |             ofp.write(escape(data)) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |             if "\n" in data: | 
					
						
							|  |  |  |                 lastopened = None | 
					
						
							|  |  |  |             knownempty = 0 | 
					
						
							|  |  |  |             lastempty = 0 | 
					
						
							|  |  |  |         elif type == "(": | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |             if data == "COMMENT": | 
					
						
							|  |  |  |                 ofp.write("<!--") | 
					
						
							|  |  |  |                 continue | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |             if knownempty and xml: | 
					
						
							|  |  |  |                 ofp.write("<%s%s/>" % (data, format_attrs(attrs))) | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 ofp.write("<%s%s>" % (data, format_attrs(attrs))) | 
					
						
							|  |  |  |             if knownempty and data not in knownempties: | 
					
						
							|  |  |  |                 # accumulate knowledge! | 
					
						
							|  |  |  |                 knownempties.append(data) | 
					
						
							|  |  |  |             attrs = {} | 
					
						
							|  |  |  |             lastopened = data | 
					
						
							|  |  |  |             lastempty = knownempty | 
					
						
							|  |  |  |             knownempty = 0 | 
					
						
							|  |  |  |         elif type == ")": | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |             if data == "COMMENT": | 
					
						
							|  |  |  |                 ofp.write("-->") | 
					
						
							|  |  |  |                 continue | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |             if xml: | 
					
						
							|  |  |  |                 if not lastempty: | 
					
						
							|  |  |  |                     ofp.write("</%s>" % data) | 
					
						
							|  |  |  |             elif data not in knownempties: | 
					
						
							|  |  |  |                 if lastopened == data: | 
					
						
							|  |  |  |                     ofp.write("</>") | 
					
						
							|  |  |  |                 else: | 
					
						
							|  |  |  |                     ofp.write("</%s>" % data) | 
					
						
							|  |  |  |             lastopened = None | 
					
						
							|  |  |  |             lastempty = 0 | 
					
						
							|  |  |  |         elif type == "A": | 
					
						
							|  |  |  |             name, type, value = string.split(data, " ", 2) | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |             attrs[name] = esistools.decode(value) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |         elif type == "e": | 
					
						
							|  |  |  |             knownempty = 1 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1998-12-10 18:31:37 +00:00
										 |  |  | def sgml_convert(ifp, ofp): | 
					
						
							|  |  |  |     return do_convert(ifp, ofp, xml=0) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											1998-12-10 18:31:37 +00:00
										 |  |  | def xml_convert(ifp, ofp): | 
					
						
							|  |  |  |     return do_convert(ifp, ofp, xml=1) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def main(): | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |     import getopt | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |     import sys | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     convert = sgml_convert | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |     xml = 0 | 
					
						
							|  |  |  |     xmldecl = 0 | 
					
						
							|  |  |  |     opts, args = getopt.getopt(sys.argv[1:], "dx", ["declare", "xml"]) | 
					
						
							|  |  |  |     for opt, arg in opts: | 
					
						
							|  |  |  |         if opt in ("-d", "--declare"): | 
					
						
							|  |  |  |             xmldecl = 1 | 
					
						
							|  |  |  |         elif opt in ("-x", "--xml"): | 
					
						
							|  |  |  |             xml = 1 | 
					
						
							|  |  |  |             convert = xml_convert | 
					
						
							|  |  |  |     if len(args) == 0: | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |         ifp = sys.stdin | 
					
						
							|  |  |  |         ofp = sys.stdout | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |     elif len(args) == 1: | 
					
						
							|  |  |  |         ifp = open(args[0]) | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |         ofp = sys.stdout | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |     elif len(args) == 2: | 
					
						
							|  |  |  |         ifp = open(args[0]) | 
					
						
							|  |  |  |         ofp = open(args[1], "w") | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |     else: | 
					
						
							|  |  |  |         usage() | 
					
						
							|  |  |  |         sys.exit(2) | 
					
						
							|  |  |  |     # knownempties is ignored in the XML version | 
					
						
							|  |  |  |     try: | 
					
						
							| 
									
										
										
										
											1998-12-01 19:01:53 +00:00
										 |  |  |         if xml and xmldecl: | 
					
						
							|  |  |  |             opf.write('<?xml version="1.0" encoding="iso8859-1"?>\n') | 
					
						
							| 
									
										
										
										
											1998-11-23 16:59:39 +00:00
										 |  |  |         convert(ifp, ofp) | 
					
						
							|  |  |  |     except IOError, (err, msg): | 
					
						
							|  |  |  |         if err != errno.EPIPE: | 
					
						
							|  |  |  |             raise | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | if __name__ == "__main__": | 
					
						
							|  |  |  |     main() |