| 
									
										
										
										
											2010-01-09 18:45:30 +00:00
										 |  |  | # Copyright (C) 2001-2010 Python Software Foundation | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | # Author: Barry Warsaw | 
					
						
							|  |  |  | # Contact: email-sig@python.org | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | """Classes to generate plain text from a message object tree.""" | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2012-03-16 22:43:05 -04:00
										 |  |  | __all__ = ['Generator', 'DecodedGenerator', 'BytesGenerator'] | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | import re | 
					
						
							|  |  |  | import sys | 
					
						
							|  |  |  | import time | 
					
						
							|  |  |  | import random | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  | from copy import deepcopy | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | from io import StringIO, BytesIO | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  | from email.utils import _has_surrogates | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
# Separator used by Generator._dispatch to join the MIME main type and subtype
# when building the name of a _handle_<maintype>_<subtype>() method.
UNDERSCORE = '_'
NL = '\n'  # XXX: no longer used by the code below.

# Matches any one line ending (CRLF, bare CR or bare LF).  Used by
# Generator._write_lines to split text so that the line endings can be
# rewritten to the separator chosen for the output.
NLCRE = re.compile(r'\r\n|\r|\n')
# Matches 'From ' at the start of any line (MULTILINE); used to escape such
# lines with a leading '>' when From_ mangling is enabled.
fcre = re.compile(r'^From ', re.MULTILINE)
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class Generator: | 
					
						
							|  |  |  |     """Generates output from a Message object tree.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     This basic generator writes the message to the given file object as plain | 
					
						
							|  |  |  |     text. | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # Public interface | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-17 14:24:33 -04:00
										 |  |  |     def __init__(self, outfp, mangle_from_=None, maxheaderlen=None, *, | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |                  policy=None): | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         """Create the generator for message flattening.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         outfp is the output file-like object for writing the message to.  It | 
					
						
							|  |  |  |         must have a write() method. | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2015-05-17 14:24:33 -04:00
										 |  |  |         Optional mangle_from_ is a flag that, when True (the default if policy | 
					
						
							|  |  |  |         is not set), escapes From_ lines in the body of the message by putting | 
					
						
							| 
									
										
										
										
											2024-05-22 12:35:18 -04:00
										 |  |  |         a '>' in front of them. | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         Optional maxheaderlen specifies the longest length for a non-continued | 
					
						
							|  |  |  |         header.  When a header line is longer (in characters, with tabs | 
					
						
							|  |  |  |         expanded to 8 spaces) than maxheaderlen, the header will split as | 
					
						
							|  |  |  |         defined in the Header class.  Set maxheaderlen to zero to disable | 
					
						
							|  |  |  |         header wrapping.  The default is 78, as recommended (but not required) | 
					
						
							|  |  |  |         by RFC 2822. | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  |         The policy keyword specifies a policy object that controls a number of | 
					
						
							| 
									
										
										
										
											2014-05-06 21:33:18 -04:00
										 |  |  |         aspects of the generator's operation.  If no policy is specified, | 
					
						
							|  |  |  |         the policy associated with the Message object passed to the | 
					
						
							|  |  |  |         flatten method is used. | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         """
 | 
					
						
							| 
									
										
										
										
											2015-05-17 14:24:33 -04:00
										 |  |  | 
 | 
					
						
							|  |  |  |         if mangle_from_ is None: | 
					
						
							|  |  |  |             mangle_from_ = True if policy is None else policy.mangle_from_ | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         self._fp = outfp | 
					
						
							|  |  |  |         self._mangle_from_ = mangle_from_ | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         self.maxheaderlen = maxheaderlen | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  |         self.policy = policy | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def write(self, s): | 
					
						
							|  |  |  |         # Just delegate to the file object | 
					
						
							|  |  |  |         self._fp.write(s) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  |     def flatten(self, msg, unixfrom=False, linesep=None): | 
					
						
							| 
									
										
										
										
											2011-03-14 18:35:56 -04:00
										 |  |  |         r"""Print the message object tree rooted at msg to the output file
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         specified when the Generator instance was created. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         unixfrom is a flag that forces the printing of a Unix From_ delimiter | 
					
						
							|  |  |  |         before the first object in the message tree.  If the original message | 
					
						
							| 
									
										
										
										
											2024-05-22 12:35:18 -04:00
										 |  |  |         has no From_ delimiter, a 'standard' one is crafted.  By default, this | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         is False to inhibit the printing of any From_ delimiter. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         Note that for subobjects, no From_ line is printed. | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         linesep specifies the characters used to indicate a new line in | 
					
						
							| 
									
										
										
										
											2014-05-06 21:33:18 -04:00
										 |  |  |         the output.  The default value is determined by the policy specified | 
					
						
							|  |  |  |         when the Generator instance was created or, if none was specified, | 
					
						
							|  |  |  |         from the policy associated with the msg. | 
					
						
							| 
									
										
										
										
											2011-03-14 18:35:56 -04:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         """
 | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         # We use the _XXX constants for operating on data that comes directly | 
					
						
							|  |  |  |         # from the msg, and _encoded_XXX constants for operating on data that | 
					
						
							|  |  |  |         # has already been converted (to bytes in the BytesGenerator) and | 
					
						
							|  |  |  |         # inserted into a temporary buffer. | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         policy = msg.policy if self.policy is None else self.policy | 
					
						
							|  |  |  |         if linesep is not None: | 
					
						
							|  |  |  |             policy = policy.clone(linesep=linesep) | 
					
						
							|  |  |  |         if self.maxheaderlen is not None: | 
					
						
							|  |  |  |             policy = policy.clone(max_line_length=self.maxheaderlen) | 
					
						
							|  |  |  |         self._NL = policy.linesep | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  |         self._encoded_NL = self._encode(self._NL) | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         self._EMPTY = '' | 
					
						
							| 
									
										
										
										
											2016-09-08 22:21:27 -04:00
										 |  |  |         self._encoded_EMPTY = self._encode(self._EMPTY) | 
					
						
							| 
									
										
										
										
											2012-05-25 18:42:14 -04:00
										 |  |  |         # Because we use clone (below) when we recursively process message | 
					
						
							|  |  |  |         # subparts, and because clone uses the computed policy (not None), | 
					
						
							|  |  |  |         # submessages will automatically get set to the computed policy when | 
					
						
							|  |  |  |         # they are processed by this code. | 
					
						
							|  |  |  |         old_gen_policy = self.policy | 
					
						
							|  |  |  |         old_msg_policy = msg.policy | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         try: | 
					
						
							|  |  |  |             self.policy = policy | 
					
						
							| 
									
										
										
										
											2012-05-25 18:42:14 -04:00
										 |  |  |             msg.policy = policy | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |             if unixfrom: | 
					
						
							|  |  |  |                 ufrom = msg.get_unixfrom() | 
					
						
							|  |  |  |                 if not ufrom: | 
					
						
							|  |  |  |                     ufrom = 'From nobody ' + time.ctime(time.time()) | 
					
						
							|  |  |  |                 self.write(ufrom + self._NL) | 
					
						
							|  |  |  |             self._write(msg) | 
					
						
							|  |  |  |         finally: | 
					
						
							| 
									
										
										
										
											2012-05-25 18:42:14 -04:00
										 |  |  |             self.policy = old_gen_policy | 
					
						
							|  |  |  |             msg.policy = old_msg_policy | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def clone(self, fp): | 
					
						
							|  |  |  |         """Clone this generator with the exact same options.""" | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         return self.__class__(fp, | 
					
						
							|  |  |  |                               self._mangle_from_, | 
					
						
							|  |  |  |                               None, # Use policy setting, which we've adjusted | 
					
						
							|  |  |  |                               policy=self.policy) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # Protected interface - undocumented ;/ | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |     # Note that we use 'self.write' when what we are writing is coming from | 
					
						
							|  |  |  |     # the source, and self._fp.write when what we are writing is coming from a | 
					
						
							|  |  |  |     # buffer (because the Bytes subclass has already had a chance to transform | 
					
						
							|  |  |  |     # the data in its write method in that case).  This is an entirely | 
					
						
							|  |  |  |     # pragmatic split determined by experiment; we could be more general by | 
					
						
							|  |  |  |     # always using write and having the Bytes subclass write method detect when | 
					
						
							|  |  |  |     # it has already transformed the input; but, since this whole thing is a | 
					
						
							|  |  |  |     # hack anyway this seems good enough. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _new_buffer(self): | 
					
						
							|  |  |  |         # BytesGenerator overrides this to return BytesIO. | 
					
						
							|  |  |  |         return StringIO() | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |     def _encode(self, s): | 
					
						
							|  |  |  |         # BytesGenerator overrides this to encode strings to bytes. | 
					
						
							|  |  |  |         return s | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |     def _write_lines(self, lines): | 
					
						
							|  |  |  |         # We have to transform the line endings. | 
					
						
							|  |  |  |         if not lines: | 
					
						
							|  |  |  |             return | 
					
						
							| 
									
										
										
										
											2016-09-11 17:23:33 -04:00
										 |  |  |         lines = NLCRE.split(lines) | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |         for line in lines[:-1]: | 
					
						
							| 
									
										
										
										
											2016-09-11 17:23:33 -04:00
										 |  |  |             self.write(line) | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |             self.write(self._NL) | 
					
						
							| 
									
										
										
										
											2016-09-11 17:23:33 -04:00
										 |  |  |         if lines[-1]: | 
					
						
							|  |  |  |             self.write(lines[-1]) | 
					
						
							|  |  |  |         # XXX logic tells me this else should be needed, but the tests fail | 
					
						
							|  |  |  |         # with it and pass without it.  (NLCRE.split ends with a blank element | 
					
						
							|  |  |  |         # if and only if there was a trailing newline.) | 
					
						
							|  |  |  |         #else: | 
					
						
							|  |  |  |         #    self.write(self._NL) | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |     def _write(self, msg): | 
					
						
							|  |  |  |         # We can't write the headers yet because of the following scenario: | 
					
						
							|  |  |  |         # say a multipart message includes the boundary string somewhere in | 
					
						
							|  |  |  |         # its body.  We'd have to calculate the new boundary /before/ we write | 
					
						
							|  |  |  |         # the headers so that we can write the correct Content-Type: | 
					
						
							|  |  |  |         # parameter. | 
					
						
							|  |  |  |         # | 
					
						
							|  |  |  |         # The way we do this, so as to make the _handle_*() methods simpler, | 
					
						
							| 
									
										
										
										
											2022-11-26 05:03:20 +11:00
										 |  |  |         # is to cache any subpart writes into a buffer.  Then we write the | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |         # headers and the buffer contents.  That way, subpart handlers can | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # Do The Right Thing, and can still modify the Content-Type: header if | 
					
						
							|  |  |  |         # necessary. | 
					
						
							|  |  |  |         oldfp = self._fp | 
					
						
							|  |  |  |         try: | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  |             self._munge_cte = None | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |             self._fp = sfp = self._new_buffer() | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             self._dispatch(msg) | 
					
						
							|  |  |  |         finally: | 
					
						
							|  |  |  |             self._fp = oldfp | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  |             munge_cte = self._munge_cte | 
					
						
							|  |  |  |             del self._munge_cte | 
					
						
							|  |  |  |         # If we munged the cte, copy the message again and re-fix the CTE. | 
					
						
							|  |  |  |         if munge_cte: | 
					
						
							|  |  |  |             msg = deepcopy(msg) | 
					
						
							| 
									
										
										
										
											2020-10-19 15:49:19 -07:00
										 |  |  |             # Preserve the header order if the CTE header already exists. | 
					
						
							|  |  |  |             if msg.get('content-transfer-encoding') is None: | 
					
						
							|  |  |  |                 msg['Content-Transfer-Encoding'] = munge_cte[0] | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 msg.replace_header('content-transfer-encoding', munge_cte[0]) | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  |             msg.replace_header('content-type', munge_cte[1]) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # Write the headers.  First we see if the message object wants to | 
					
						
							|  |  |  |         # handle that itself.  If not, we'll do it generically. | 
					
						
							|  |  |  |         meth = getattr(msg, '_write_headers', None) | 
					
						
							|  |  |  |         if meth is None: | 
					
						
							|  |  |  |             self._write_headers(msg) | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             meth(self) | 
					
						
							|  |  |  |         self._fp.write(sfp.getvalue()) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _dispatch(self, msg): | 
					
						
							|  |  |  |         # Get the Content-Type: for the message, then try to dispatch to | 
					
						
							|  |  |  |         # self._handle_<maintype>_<subtype>().  If there's no handler for the | 
					
						
							|  |  |  |         # full MIME type, then dispatch to self._handle_<maintype>().  If | 
					
						
							|  |  |  |         # that's missing too, then dispatch to self._writeBody(). | 
					
						
							|  |  |  |         main = msg.get_content_maintype() | 
					
						
							|  |  |  |         sub = msg.get_content_subtype() | 
					
						
							|  |  |  |         specific = UNDERSCORE.join((main, sub)).replace('-', '_') | 
					
						
							|  |  |  |         meth = getattr(self, '_handle_' + specific, None) | 
					
						
							|  |  |  |         if meth is None: | 
					
						
							|  |  |  |             generic = main.replace('-', '_') | 
					
						
							|  |  |  |             meth = getattr(self, '_handle_' + generic, None) | 
					
						
							|  |  |  |             if meth is None: | 
					
						
							|  |  |  |                 meth = self._writeBody | 
					
						
							|  |  |  |         meth(msg) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # Default handlers | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _write_headers(self, msg): | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         for h, v in msg.raw_items(): | 
					
						
							|  |  |  |             self.write(self.policy.fold(h, v)) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # A blank line always separates headers from body | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         self.write(self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  |     # Handlers for writing types and subtypes | 
					
						
							|  |  |  |     # | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _handle_text(self, msg): | 
					
						
							|  |  |  |         payload = msg.get_payload() | 
					
						
							|  |  |  |         if payload is None: | 
					
						
							|  |  |  |             return | 
					
						
							| 
									
										
										
										
											2007-10-16 18:12:55 +00:00
										 |  |  |         if not isinstance(payload, str): | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             raise TypeError('string payload expected: %s' % type(payload)) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |         if _has_surrogates(msg._payload): | 
					
						
							|  |  |  |             charset = msg.get_param('charset') | 
					
						
							|  |  |  |             if charset is not None: | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  |                 # XXX: This copy stuff is an ugly hack to avoid modifying the | 
					
						
							|  |  |  |                 # existing message. | 
					
						
							|  |  |  |                 msg = deepcopy(msg) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |                 del msg['content-transfer-encoding'] | 
					
						
							| 
									
										
										
										
											2024-03-05 17:49:01 +02:00
										 |  |  |                 msg.set_payload(msg._payload, charset) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |                 payload = msg.get_payload() | 
					
						
							| 
									
										
										
										
											2014-02-08 11:48:20 -05:00
										 |  |  |                 self._munge_cte = (msg['content-transfer-encoding'], | 
					
						
							|  |  |  |                                    msg['content-type']) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         if self._mangle_from_: | 
					
						
							|  |  |  |             payload = fcre.sub('>From ', payload) | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |         self._write_lines(payload) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # Default body handler | 
					
						
							|  |  |  |     _writeBody = _handle_text | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _handle_multipart(self, msg): | 
					
						
							|  |  |  |         # The trick here is to write out each part separately, merge them all | 
					
						
							|  |  |  |         # together, and then make sure that the boundary we've chosen isn't | 
					
						
							|  |  |  |         # present in the payload. | 
					
						
							|  |  |  |         msgtexts = [] | 
					
						
							|  |  |  |         subparts = msg.get_payload() | 
					
						
							|  |  |  |         if subparts is None: | 
					
						
							|  |  |  |             subparts = [] | 
					
						
							| 
									
										
										
										
											2007-10-16 18:12:55 +00:00
										 |  |  |         elif isinstance(subparts, str): | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             # e.g. a non-strict parse of a message with no starting boundary. | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |             self.write(subparts) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             return | 
					
						
							|  |  |  |         elif not isinstance(subparts, list): | 
					
						
							|  |  |  |             # Scalar payload | 
					
						
							|  |  |  |             subparts = [subparts] | 
					
						
							|  |  |  |         for part in subparts: | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |             s = self._new_buffer() | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             g = self.clone(s) | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |             g.flatten(part, unixfrom=False, linesep=self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             msgtexts.append(s.getvalue()) | 
					
						
							|  |  |  |         # BAW: What about boundaries that are wrapped in double-quotes? | 
					
						
							| 
									
										
										
										
											2010-12-12 20:06:19 +00:00
										 |  |  |         boundary = msg.get_boundary() | 
					
						
							|  |  |  |         if not boundary: | 
					
						
							|  |  |  |             # Create a boundary that doesn't appear in any of the | 
					
						
							|  |  |  |             # message texts. | 
					
						
							|  |  |  |             alltext = self._encoded_NL.join(msgtexts) | 
					
						
							| 
									
										
										
										
											2010-12-21 18:07:59 +00:00
										 |  |  |             boundary = self._make_boundary(alltext) | 
					
						
							|  |  |  |             msg.set_boundary(boundary) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # If there's a preamble, write it out, with a trailing CRLF | 
					
						
							|  |  |  |         if msg.preamble is not None: | 
					
						
							| 
									
										
										
										
											2012-07-22 21:47:53 -04:00
										 |  |  |             if self._mangle_from_: | 
					
						
							|  |  |  |                 preamble = fcre.sub('>From ', msg.preamble) | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 preamble = msg.preamble | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |             self._write_lines(preamble) | 
					
						
							|  |  |  |             self.write(self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # dash-boundary transport-padding CRLF | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         self.write('--' + boundary + self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         # body-part | 
					
						
							|  |  |  |         if msgtexts: | 
					
						
							|  |  |  |             self._fp.write(msgtexts.pop(0)) | 
					
						
							|  |  |  |         # *encapsulation | 
					
						
							|  |  |  |         # --> delimiter transport-padding | 
					
						
							|  |  |  |         # --> CRLF body-part | 
					
						
							|  |  |  |         for body_part in msgtexts: | 
					
						
							|  |  |  |             # delimiter transport-padding CRLF | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |             self.write(self._NL + '--' + boundary + self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             # body-part | 
					
						
							|  |  |  |             self._fp.write(body_part) | 
					
						
							|  |  |  |         # close-delimiter transport-padding | 
					
						
							| 
									
										
										
										
											2014-02-08 17:54:56 -05:00
										 |  |  |         self.write(self._NL + '--' + boundary + '--' + self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         if msg.epilogue is not None: | 
					
						
							| 
									
										
										
										
											2012-07-22 21:47:53 -04:00
										 |  |  |             if self._mangle_from_: | 
					
						
							|  |  |  |                 epilogue = fcre.sub('>From ', msg.epilogue) | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 epilogue = msg.epilogue | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |             self._write_lines(epilogue) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-01-16 18:30:03 +00:00
										 |  |  |     def _handle_multipart_signed(self, msg): | 
					
						
							|  |  |  |         # The contents of signed parts has to stay unmodified in order to keep | 
					
						
							|  |  |  |         # the signature intact per RFC1847 2.1, so we disable header wrapping. | 
					
						
							|  |  |  |         # RDM: This isn't enough to completely preserve the part, but it helps. | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         p = self.policy | 
					
						
							|  |  |  |         self.policy = p.clone(max_line_length=0) | 
					
						
							| 
									
										
										
										
											2010-01-16 18:30:03 +00:00
										 |  |  |         try: | 
					
						
							|  |  |  |             self._handle_multipart(msg) | 
					
						
							|  |  |  |         finally: | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |             self.policy = p | 
					
						
							| 
									
										
										
										
											2010-01-16 18:30:03 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |     def _handle_message_delivery_status(self, msg): | 
					
						
							|  |  |  |         # We can't just write the headers directly to self's file object | 
					
						
							|  |  |  |         # because this will leave an extra newline between the last header | 
					
						
							|  |  |  |         # block and the boundary.  Sigh. | 
					
						
							|  |  |  |         blocks = [] | 
					
						
							|  |  |  |         for part in msg.get_payload(): | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |             s = self._new_buffer() | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             g = self.clone(s) | 
					
						
							| 
									
										
										
										
											2010-11-21 16:53:48 +00:00
										 |  |  |             g.flatten(part, unixfrom=False, linesep=self._NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             text = s.getvalue() | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |             lines = text.split(self._encoded_NL) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             # Strip off the unnecessary trailing empty line | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |             if lines and lines[-1] == self._encoded_EMPTY: | 
					
						
							|  |  |  |                 blocks.append(self._encoded_NL.join(lines[:-1])) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             else: | 
					
						
							|  |  |  |                 blocks.append(text) | 
					
						
							|  |  |  |         # Now join all the blocks with an empty line.  This has the lovely | 
					
						
							|  |  |  |         # effect of separating each block with an empty line, but not adding | 
					
						
							|  |  |  |         # an extra one after the last one. | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         self._fp.write(self._encoded_NL.join(blocks)) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _handle_message(self, msg): | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |         s = self._new_buffer() | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         g = self.clone(s) | 
					
						
							|  |  |  |         # The payload of a message/rfc822 part should be a multipart sequence | 
					
						
							|  |  |  |         # of length 1.  The zeroth element of the list should be the Message | 
					
						
							|  |  |  |         # object for the subpart.  Extract that object, stringify it, and | 
					
						
							|  |  |  |         # write it out. | 
					
						
							| 
									
										
										
										
											2010-02-21 04:39:40 +00:00
										 |  |  |         # Except, it turns out, when it's a string instead, which happens when | 
					
						
							|  |  |  |         # and only when HeaderParser is used on a message of mime type | 
					
						
							|  |  |  |         # message/rfc822.  Such messages are generated by, for example, | 
					
						
							|  |  |  |         # Groupwise when forwarding unadorned messages.  (Issue 7970.)  So | 
					
						
							|  |  |  |         # in that case we just emit the string body. | 
					
						
							| 
									
										
										
										
											2011-04-13 16:46:05 -04:00
										 |  |  |         payload = msg._payload | 
					
						
							| 
									
										
										
										
											2010-02-21 04:39:40 +00:00
										 |  |  |         if isinstance(payload, list): | 
					
						
							| 
									
										
										
										
											2010-11-21 16:53:48 +00:00
										 |  |  |             g.flatten(msg.get_payload(0), unixfrom=False, linesep=self._NL) | 
					
						
							| 
									
										
										
										
											2010-02-21 04:39:40 +00:00
										 |  |  |             payload = s.getvalue() | 
					
						
							| 
									
										
										
										
											2011-04-13 16:46:05 -04:00
										 |  |  |         else: | 
					
						
							|  |  |  |             payload = self._encode(payload) | 
					
						
							| 
									
										
										
										
											2010-02-21 04:39:40 +00:00
										 |  |  |         self._fp.write(payload) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |     # This used to be a module level function; we use a classmethod for this | 
					
						
							|  |  |  |     # and _compile_re so we can continue to provide the module level function | 
					
						
							|  |  |  |     # for backward compatibility by doing | 
					
						
							| 
									
										
										
										
											2013-08-10 18:47:07 +03:00
										 |  |  |     #   _make_boundary = Generator._make_boundary | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |     # at the end of the module.  It *is* internal, so we could drop that... | 
					
						
							|  |  |  |     @classmethod | 
					
						
							|  |  |  |     def _make_boundary(cls, text=None): | 
					
						
							|  |  |  |         # Craft a random boundary.  If text is given, ensure that the chosen | 
					
						
							|  |  |  |         # boundary doesn't appear in the text. | 
					
						
							|  |  |  |         token = random.randrange(sys.maxsize) | 
					
						
							|  |  |  |         boundary = ('=' * 15) + (_fmt % token) + '==' | 
					
						
							|  |  |  |         if text is None: | 
					
						
							|  |  |  |             return boundary | 
					
						
							|  |  |  |         b = boundary | 
					
						
							|  |  |  |         counter = 0 | 
					
						
							|  |  |  |         while True: | 
					
						
							|  |  |  |             cre = cls._compile_re('^--' + re.escape(b) + '(--)?$', re.MULTILINE) | 
					
						
							|  |  |  |             if not cre.search(text): | 
					
						
							|  |  |  |                 break | 
					
						
							|  |  |  |             b = boundary + '.' + str(counter) | 
					
						
							|  |  |  |             counter += 1 | 
					
						
							|  |  |  |         return b | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     @classmethod | 
					
						
							|  |  |  |     def _compile_re(cls, s, flags): | 
					
						
							|  |  |  |         return re.compile(s, flags) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2023-03-08 13:58:14 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | class BytesGenerator(Generator): | 
					
						
							|  |  |  |     """Generates a bytes version of a Message object tree.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     Functionally identical to the base Generator except that the output is | 
					
						
							|  |  |  |     bytes and not string.  When surrogates were used in the input to encode | 
					
						
							| 
									
										
										
										
											2011-04-18 13:59:37 -04:00
										 |  |  |     bytes, these are decoded back to bytes for output.  If the policy has | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |     cte_type set to 7bit, then the message is transformed such that the | 
					
						
							|  |  |  |     non-ASCII bytes are properly content transfer encoded, using the charset | 
					
						
							|  |  |  |     unknown-8bit. | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     The outfp object must accept bytes in its write method. | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def write(self, s): | 
					
						
							|  |  |  |         self._fp.write(s.encode('ascii', 'surrogateescape')) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _new_buffer(self): | 
					
						
							|  |  |  |         return BytesIO() | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |     def _encode(self, s): | 
					
						
							|  |  |  |         return s.encode('ascii') | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |     def _write_headers(self, msg): | 
					
						
							|  |  |  |         # This is almost the same as the string version, except for handling | 
					
						
							|  |  |  |         # strings with 8bit bytes. | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         for h, v in msg.raw_items(): | 
					
						
							|  |  |  |             self._fp.write(self.policy.fold_binary(h, v)) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |         # A blank line always separates headers from body | 
					
						
							| 
									
										
										
										
											2010-10-23 22:19:56 +00:00
										 |  |  |         self.write(self._NL) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     def _handle_text(self, msg): | 
					
						
							|  |  |  |         # If the string has surrogates the original source was bytes, so | 
					
						
							|  |  |  |         # just write it back out. | 
					
						
							| 
									
										
										
										
											2011-01-26 21:21:32 +00:00
										 |  |  |         if msg._payload is None: | 
					
						
							|  |  |  |             return | 
					
						
							| 
									
										
										
										
											2012-05-25 15:01:48 -04:00
										 |  |  |         if _has_surrogates(msg._payload) and not self.policy.cte_type=='7bit': | 
					
						
							| 
									
										
										
										
											2012-08-24 11:14:13 -04:00
										 |  |  |             if self._mangle_from_: | 
					
						
							|  |  |  |                 msg._payload = fcre.sub(">From ", msg._payload) | 
					
						
							| 
									
										
										
										
											2013-03-07 16:38:03 -05:00
										 |  |  |             self._write_lines(msg._payload) | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |         else: | 
					
						
							|  |  |  |             super(BytesGenerator,self)._handle_text(msg) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2013-02-09 13:02:58 -05:00
										 |  |  |     # Default body handler | 
					
						
							|  |  |  |     _writeBody = _handle_text | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  |     @classmethod | 
					
						
							|  |  |  |     def _compile_re(cls, s, flags): | 
					
						
							|  |  |  |         return re.compile(s.encode('ascii'), flags) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | _FMT = '[Non-text (%(type)s) part of message omitted, filename %(filename)s]' | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | class DecodedGenerator(Generator): | 
					
						
							| 
									
										
										
										
											2010-10-01 20:38:33 +00:00
										 |  |  |     """Generates a text representation of a message.
 | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |     Like the Generator base class, except that non-text parts are substituted | 
					
						
							|  |  |  |     with a format string representing the part. | 
					
						
							|  |  |  |     """
 | 
					
						
							| 
									
										
										
										
											2016-09-08 17:57:06 -04:00
										 |  |  |     def __init__(self, outfp, mangle_from_=None, maxheaderlen=None, fmt=None, *, | 
					
						
							|  |  |  |                  policy=None): | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         """Like Generator.__init__() except that an additional optional
 | 
					
						
							|  |  |  |         argument is allowed. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         Walks through all subparts of a message.  If the subpart is of main | 
					
						
							| 
									
										
										
										
											2024-05-22 12:35:18 -04:00
										 |  |  |         type 'text', then it prints the decoded payload of the subpart. | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |         Otherwise, fmt is a format string that is used instead of the message | 
					
						
							|  |  |  |         payload.  fmt is expanded with the following keywords (in | 
					
						
							|  |  |  |         %(keyword)s format): | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         type       : Full MIME type of the non-text part | 
					
						
							|  |  |  |         maintype   : Main MIME type of the non-text part | 
					
						
							|  |  |  |         subtype    : Sub-MIME type of the non-text part | 
					
						
							|  |  |  |         filename   : Filename of the non-text part | 
					
						
							|  |  |  |         description: Description associated with the non-text part | 
					
						
							|  |  |  |         encoding   : Content transfer encoding of the non-text part | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         The default value for fmt is None, meaning | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         [Non-text (%(type)s) part of message omitted, filename %(filename)s] | 
					
						
							|  |  |  |         """
 | 
					
						
							| 
									
										
										
										
											2016-09-08 17:57:06 -04:00
										 |  |  |         Generator.__init__(self, outfp, mangle_from_, maxheaderlen, | 
					
						
							|  |  |  |                            policy=policy) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |         if fmt is None: | 
					
						
							|  |  |  |             self._fmt = _FMT | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             self._fmt = fmt | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _dispatch(self, msg): | 
					
						
							|  |  |  |         for part in msg.walk(): | 
					
						
							|  |  |  |             maintype = part.get_content_maintype() | 
					
						
							|  |  |  |             if maintype == 'text': | 
					
						
							| 
									
										
										
										
											2007-10-16 18:12:55 +00:00
										 |  |  |                 print(part.get_payload(decode=False), file=self) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  |             elif maintype == 'multipart': | 
					
						
							|  |  |  |                 # Just skip this | 
					
						
							|  |  |  |                 pass | 
					
						
							|  |  |  |             else: | 
					
						
							|  |  |  |                 print(self._fmt % { | 
					
						
							|  |  |  |                     'type'       : part.get_content_type(), | 
					
						
							|  |  |  |                     'maintype'   : part.get_content_maintype(), | 
					
						
							|  |  |  |                     'subtype'    : part.get_content_subtype(), | 
					
						
							|  |  |  |                     'filename'   : part.get_filename('[no filename]'), | 
					
						
							|  |  |  |                     'description': part.get('Content-Description', | 
					
						
							|  |  |  |                                             '[no description]'), | 
					
						
							|  |  |  |                     'encoding'   : part.get('Content-Transfer-Encoding', | 
					
						
							|  |  |  |                                             '[no encoding]'), | 
					
						
							|  |  |  |                     }, file=self) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | # Helper used by Generator._make_boundary | 
					
						
							| 
									
										
										
										
											2007-12-04 23:02:19 +00:00
										 |  |  | _width = len(repr(sys.maxsize-1)) | 
					
						
							| 
									
										
										
										
											2007-08-30 01:15:14 +00:00
										 |  |  | _fmt = '%%0%dd' % _width | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-10-08 15:55:28 +00:00
										 |  |  | # Backward compatibility | 
					
						
							|  |  |  | _make_boundary = Generator._make_boundary |