# Authors: Baxter, Wouters and Warsaw
# Contact: email-sig@python.org

"""FeedParser - An email feed parser.

The feed parser implements an interface for incrementally parsing an email
message, line by line. This has advantages for certain applications, such as
those reading email messages off a socket.

FeedParser.feed() is the primary interface for pushing new data into the
parser. It returns when there's nothing more it can do with the available
data. When you have no more data to push into the parser, call .close().
This completes the parsing and returns the root message object.

The other advantage of this parser is that it will never raise a parsing
exception. Instead, when it finds something unexpected, it adds a 'defect' to
the current message. Defects are just instances that live on the message
object's .defects attribute.
"""

[19] Fix | Delete

[20] Fix | Delete

__all__ = ['FeedParser', 'BytesFeedParser']

[21] Fix | Delete

[22] Fix | Delete

import re

[23] Fix | Delete

[24] Fix | Delete

from email import errors

[25] Fix | Delete

from email._policybase import compat32

[26] Fix | Delete

from collections import deque

[27] Fix | Delete

from io import StringIO

[28] Fix | Delete

[29] Fix | Delete

# Line-ending patterns.  Each one accepts all three newline conventions
# (CRLF, bare CR, bare LF); CRLF is listed first so it is matched as a unit.
NLCRE = re.compile(r'\r\n|\r|\n')
NLCRE_bol = re.compile(r'(\r\n|\r|\n)')
# Anchored with \Z: only matches a line ending at the very end of the string.
NLCRE_eol = re.compile(r'(\r\n|\r|\n)\Z')
NLCRE_crack = re.compile(r'(\r\n|\r|\n)')
# RFC 2822 $3.6.8 Optional fields. ftext is %d33-57 / %d59-126, Any character
# except controls, SP, and ":".
# The pattern also accepts a unix-from line ("From ") and a continuation line
# (leading tab or space).
headerRE = re.compile(r'^(From |[\041-\071\073-\176]*:|[\t ])')
EMPTYSTRING = ''
NL = '\n'

# Unique sentinel, compared by identity, that signals "no complete line is
# available yet" as opposed to '' which signals end of file.
NeedMoreData = object()

[40] Fix | Delete

[41] Fix | Delete

[42] Fix | Delete

[43] Fix | Delete

class BufferedSubFile(object):
    """A file-ish object that can have new data loaded into it.

    You can also push and pop line-matching predicates onto a stack. When the
    current predicate matches the current line, a false EOF response
    (i.e. empty string) is returned instead. This lets the parser adhere to a
    simple abstraction -- it parses until EOF closes the current message.
    """

    def __init__(self):
        # Text stream of the last partial line pushed into this object.
        # See issue 22233 for why this is a text stream and not a list.
        # newline='' keeps the original line endings untranslated.
        self._partial = StringIO(newline='')
        # A deque of full, pushed lines
        self._lines = deque()
        # The stack of false-EOF checking predicates.
        self._eofstack = []
        # A flag indicating whether the file has been closed or not.
        self._closed = False

    def push_eof_matcher(self, pred):
        """Push a false-EOF predicate (a callable taking a line)."""
        self._eofstack.append(pred)

    def pop_eof_matcher(self):
        """Remove and return the most recently pushed false-EOF predicate."""
        return self._eofstack.pop()

    def close(self):
        """Flush any buffered partial line and mark the file as closed."""
        # Don't forget any trailing partial line.
        self._partial.seek(0)
        self.pushlines(self._partial.readlines())
        self._partial.seek(0)
        self._partial.truncate()
        self._closed = True

    def readline(self):
        """Return the next line, '' at (real or false) EOF, or NeedMoreData.

        NeedMoreData is returned when no complete line is buffered and the
        file has not been closed yet.
        """
        if not self._lines:
            if self._closed:
                return ''
            return NeedMoreData
        # Pop the line off the stack and see if it matches the current
        # false-EOF predicate.
        line = self._lines.popleft()
        # RFC 2046, section 5.1.2 requires us to recognize outer level
        # boundaries at any level of inner nesting. Do this, but be sure it's
        # in the order of most to least nested.
        for ateof in reversed(self._eofstack):
            if ateof(line):
                # We're at the false EOF. But push the last line back first.
                self._lines.appendleft(line)
                return ''
        return line

    def unreadline(self, line):
        """Push *line* back so that it is the next one returned."""
        # Let the consumer push a line back into the buffer.
        assert line is not NeedMoreData
        self._lines.appendleft(line)

    def push(self, data):
        """Push some new data into this object."""
        self._partial.write(data)
        if '\n' not in data and '\r' not in data:
            # No new complete lines, wait for more.
            return

        # Crack into lines, preserving the linesep characters.
        self._partial.seek(0)
        parts = self._partial.readlines()
        self._partial.seek(0)
        self._partial.truncate()

        # If the last element of the list does not end in a newline, then treat
        # it as a partial line. We only check for '\n' here because a line
        # ending with '\r' might be a line that was split in the middle of a
        # '\r\n' sequence (see bugs 1555570 and 1721862).
        if not parts[-1].endswith('\n'):
            self._partial.write(parts.pop())
        self.pushlines(parts)

    def pushlines(self, lines):
        """Append already-split complete lines to the line queue."""
        self._lines.extend(lines)

    def __iter__(self):
        return self

    def __next__(self):
        # Iteration stops at '' (EOF or false EOF); NeedMoreData is passed
        # through to the consumer as an ordinary item.
        line = self.readline()
        if line == '':
            raise StopIteration
        return line

[131] Fix | Delete

[132] Fix | Delete

[133] Fix | Delete

[134] Fix | Delete

class FeedParser:

[135] Fix | Delete

"""A feed-style parser of email."""

[136] Fix | Delete

[137] Fix | Delete

def __init__(self, _factory=None, *, policy=compat32):
    """Set up a parser that builds messages with _factory.

    If _factory is None, the policy's message_factory is used, falling back
    to email.message.Message when the policy does not define one.  An
    explicitly supplied _factory is probed once with a ``policy`` keyword
    argument; if that raises TypeError it is treated as an old-style factory
    and will be called with no arguments to create each new message object.

    The policy keyword specifies a policy object that controls a number of
    aspects of the parser's operation. The default policy maintains
    backward compatibility.

    """
    self.policy = policy
    self._old_style_factory = False
    if _factory is None:
        if policy.message_factory is None:
            from email.message import Message
            self._factory = Message
        else:
            self._factory = policy.message_factory
    else:
        self._factory = _factory
        try:
            # Probe call only; the message it creates is discarded.
            _factory(policy=self.policy)
        except TypeError:
            # Assume this is an old-style factory
            self._old_style_factory = True
    self._input = BufferedSubFile()
    self._msgstack = []
    # Bound __next__ of the parsing generator; each call resumes the parse.
    self._parse = self._parsegen().__next__
    self._cur = None
    self._last = None
    self._headersonly = False

[166] Fix | Delete

[167] Fix | Delete

# Non-public interface for supporting Parser's headersonly flag

[168] Fix | Delete

def _set_headersonly(self):

[169] Fix | Delete

self._headersonly = True

[170] Fix | Delete

[171] Fix | Delete

def feed(self, data):
    """Push more data into the parser."""
    # Buffer the data first, then let the parser consume whatever complete
    # lines are now available.
    self._input.push(data)
    self._call_parse()

[175] Fix | Delete

[176] Fix | Delete

def _call_parse(self):

[177] Fix | Delete

try:

[178] Fix | Delete

self._parse()

[179] Fix | Delete

except StopIteration:

[180] Fix | Delete

pass

[181] Fix | Delete

[182] Fix | Delete

def close(self):
    """Parse all remaining data and return the root message object."""
    self._input.close()
    self._call_parse()
    root = self._pop_message()
    assert not self._msgstack
    # Look for final set of defects
    if (root.get_content_maintype() == 'multipart'
            and not root.is_multipart()):
        # Declared as multipart but no subparts were attached.
        defect = errors.MultipartInvariantViolationDefect()
        self.policy.handle_defect(root, defect)
    return root

[194] Fix | Delete

[195] Fix | Delete

def _new_message(self):

[196] Fix | Delete

if self._old_style_factory:

[197] Fix | Delete

msg = self._factory()

[198] Fix | Delete

else:

[199] Fix | Delete

msg = self._factory(policy=self.policy)

[200] Fix | Delete

if self._cur and self._cur.get_content_type() == 'multipart/digest':

[201] Fix | Delete

msg.set_default_type('message/rfc822')

[202] Fix | Delete

if self._msgstack:

[203] Fix | Delete

self._msgstack[-1].attach(msg)

[204] Fix | Delete

self._msgstack.append(msg)

[205] Fix | Delete

self._cur = msg

[206] Fix | Delete

self._last = msg

[207] Fix | Delete

[208] Fix | Delete

def _pop_message(self):

[209] Fix | Delete

retval = self._msgstack.pop()

[210] Fix | Delete

if self._msgstack:

[211] Fix | Delete

self._cur = self._msgstack[-1]

[212] Fix | Delete

else:

[213] Fix | Delete

self._cur = None

[214] Fix | Delete

return retval

[215] Fix | Delete

[216] Fix | Delete

def _parsegen(self):
    """Generator that parses one message (recursing for nested parts).

    Yields NeedMoreData whenever the input buffer has no complete line
    available; the caller resumes the generator after more data has been
    pushed.  The generator finishes when the current message has been fully
    parsed, leaving that message on top of the message stack.
    """
    # Create a new message and start by parsing headers.
    self._new_message()
    headers = []
    # Collect the headers, searching for a line that doesn't match the RFC
    # 2822 header or continuation pattern (including an empty line).
    for line in self._input:
        if line is NeedMoreData:
            yield NeedMoreData
            continue
        if not headerRE.match(line):
            # If we saw the RFC defined header/body separator
            # (i.e. newline), just throw it away. Otherwise the line is
            # part of the body so push it back.
            if not NLCRE.match(line):
                defect = errors.MissingHeaderBodySeparatorDefect()
                self.policy.handle_defect(self._cur, defect)
                self._input.unreadline(line)
            break
        headers.append(line)
    # Done with the headers, so parse them and figure out what we're
    # supposed to see in the body of the message.
    self._parse_headers(headers)
    # Headers-only parsing is a backwards compatibility hack, which was
    # necessary in the older parser, which could raise errors. All
    # remaining lines in the input are thrown into the message body.
    if self._headersonly:
        lines = []
        while True:
            line = self._input.readline()
            if line is NeedMoreData:
                yield NeedMoreData
                continue
            if line == '':
                break
            lines.append(line)
        self._cur.set_payload(EMPTYSTRING.join(lines))
        return
    if self._cur.get_content_type() == 'message/delivery-status':
        # message/delivery-status contains blocks of headers separated by
        # a blank line. We'll represent each header block as a separate
        # nested message object, but the processing is a bit different
        # than standard message/* types because there is no body for the
        # nested messages. A blank line separates the subparts.
        while True:
            self._input.push_eof_matcher(NLCRE.match)
            for retval in self._parsegen():
                if retval is NeedMoreData:
                    yield NeedMoreData
                    continue
                break
            self._pop_message()
            # We need to pop the EOF matcher in order to tell if we're at
            # the end of the current file, not the end of the last block
            # of message headers.
            self._input.pop_eof_matcher()
            # The input stream must be sitting at the newline or at the
            # EOF. We want to see if we're at the end of this subpart, so
            # first consume the blank line, then test the next line to see
            # if we're at this subpart's EOF.
            while True:
                line = self._input.readline()
                if line is NeedMoreData:
                    yield NeedMoreData
                    continue
                break
            while True:
                line = self._input.readline()
                if line is NeedMoreData:
                    yield NeedMoreData
                    continue
                break
            if line == '':
                break
            # Not at EOF so this is a line we're going to need.
            self._input.unreadline(line)
        return
    if self._cur.get_content_maintype() == 'message':
        # The message claims to be a message/* type, then what follows is
        # another RFC 2822 message.
        for retval in self._parsegen():
            if retval is NeedMoreData:
                yield NeedMoreData
                continue
            break
        self._pop_message()
        return
    if self._cur.get_content_maintype() == 'multipart':
        boundary = self._cur.get_boundary()
        if boundary is None:
            # The message /claims/ to be a multipart but it has not
            # defined a boundary. That's a problem which we'll handle by
            # reading everything until the EOF and marking the message as
            # defective.
            defect = errors.NoBoundaryInMultipartDefect()
            self.policy.handle_defect(self._cur, defect)
            lines = []
            for line in self._input:
                if line is NeedMoreData:
                    yield NeedMoreData
                    continue
                lines.append(line)
            self._cur.set_payload(EMPTYSTRING.join(lines))
            return
        # Make sure a valid content type was specified per RFC 2045:6.4.
        if (self._cur.get('content-transfer-encoding', '8bit').lower()
                not in ('7bit', '8bit', 'binary')):
            defect = errors.InvalidMultipartContentTransferEncodingDefect()
            self.policy.handle_defect(self._cur, defect)
        # Create a line match predicate which matches the inter-part
        # boundary as well as the end-of-multipart boundary. Don't push
        # this onto the input stream until we've scanned past the
        # preamble.
        separator = '--' + boundary
        boundaryre = re.compile(
            '(?P<sep>' + re.escape(separator) +
            r')(?P<end>--)?(?P<ws>[ \t]*)(?P<linesep>\r\n|\r|\n)?$')
        capturing_preamble = True
        preamble = []
        linesep = False
        close_boundary_seen = False
        while True:
            line = self._input.readline()
            if line is NeedMoreData:
                yield NeedMoreData
                continue
            if line == '':
                break
            mo = boundaryre.match(line)
            if mo:
                # If we're looking at the end boundary, we're done with
                # this multipart. If there was a newline at the end of
                # the closing boundary, then we need to initialize the
                # epilogue with the empty string (see below).
                if mo.group('end'):
                    close_boundary_seen = True
                    linesep = mo.group('linesep')
                    break
                # We saw an inter-part boundary. Were we in the preamble?
                if capturing_preamble:
                    if preamble:
                        # According to RFC 2046, the last newline belongs
                        # to the boundary.
                        lastline = preamble[-1]
                        eolmo = NLCRE_eol.search(lastline)
                        if eolmo:
                            preamble[-1] = lastline[:-len(eolmo.group(0))]
                        self._cur.preamble = EMPTYSTRING.join(preamble)
                    capturing_preamble = False
                    self._input.unreadline(line)
                    continue
                # We saw a boundary separating two parts. Consume any
                # multiple boundary lines that may be following. Our
                # interpretation of RFC 2046 BNF grammar does not produce
                # body parts within such double boundaries.
                while True:
                    line = self._input.readline()
                    if line is NeedMoreData:
                        yield NeedMoreData
                        continue
                    mo = boundaryre.match(line)
                    if not mo:
                        self._input.unreadline(line)
                        break
                # Recurse to parse this subpart; the input stream points
                # at the subpart's first line.
                self._input.push_eof_matcher(boundaryre.match)
                for retval in self._parsegen():
                    if retval is NeedMoreData:
                        yield NeedMoreData
                        continue
                    break
                # Because of RFC 2046, the newline preceding the boundary
                # separator actually belongs to the boundary, not the
                # previous subpart's payload (or epilogue if the previous
                # part is a multipart).
                if self._last.get_content_maintype() == 'multipart':
                    epilogue = self._last.epilogue
                    if epilogue == '':
                        self._last.epilogue = None
                    elif epilogue is not None:
                        mo = NLCRE_eol.search(epilogue)
                        if mo:
                            end = len(mo.group(0))
                            self._last.epilogue = epilogue[:-end]
                else:
                    payload = self._last._payload
                    if isinstance(payload, str):
                        mo = NLCRE_eol.search(payload)
                        if mo:
                            payload = payload[:-len(mo.group(0))]
                            self._last._payload = payload
                self._input.pop_eof_matcher()
                self._pop_message()
                # Set the multipart up for newline cleansing, which will
                # happen if we're in a nested multipart.
                self._last = self._cur
            else:
                # I think we must be in the preamble
                assert capturing_preamble
                preamble.append(line)
        # We've seen either the EOF or the end boundary. If we're still
        # capturing the preamble, we never saw the start boundary. Note
        # that as a defect and store the captured text as the payload.
        if capturing_preamble:
            defect = errors.StartBoundaryNotFoundDefect()
            self.policy.handle_defect(self._cur, defect)
            self._cur.set_payload(EMPTYSTRING.join(preamble))
            # Drain the rest of the input; nothing is collected here, so
            # the epilogue ends up as the empty string.
            epilogue = []
            for line in self._input:
                if line is NeedMoreData:
                    yield NeedMoreData
                    continue
            self._cur.epilogue = EMPTYSTRING.join(epilogue)
            return
        # If we're not processing the preamble, then we might have seen
        # EOF without seeing that end boundary...that is also a defect.
        if not close_boundary_seen:
            defect = errors.CloseBoundaryNotFoundDefect()
            self.policy.handle_defect(self._cur, defect)
            return
        # Everything from here to the EOF is epilogue. If the end boundary
        # ended in a newline, we'll need to make sure the epilogue isn't
        # None
        if linesep:
            epilogue = ['']
        else:
            epilogue = []
        for line in self._input:
            if line is NeedMoreData:
                yield NeedMoreData
                continue
            epilogue.append(line)
        # Any CRLF at the front of the epilogue is not technically part of
        # the epilogue. Also, watch out for an empty string epilogue,
        # which means a single newline.
        if epilogue:
            firstline = epilogue[0]
            bolmo = NLCRE_bol.match(firstline)
            if bolmo:
                epilogue[0] = firstline[len(bolmo.group(0)):]
        self._cur.epilogue = EMPTYSTRING.join(epilogue)
        return
    # Otherwise, it's some non-multipart type, so the entire rest of the
    # file contents becomes the payload.
    lines = []
    for line in self._input:
        if line is NeedMoreData:
            yield NeedMoreData
            continue
        lines.append(line)
    self._cur.set_payload(EMPTYSTRING.join(lines))

[468] Fix | Delete

[469] Fix | Delete

def _parse_headers(self, lines):

[470] Fix | Delete

# Passed a list of lines that make up the headers for the current msg

[471] Fix | Delete

lastheader = ''

[472] Fix | Delete

lastvalue = []

[473] Fix | Delete

for lineno, line in enumerate(lines):

[474] Fix | Delete

# Check for continuation

[475] Fix | Delete

if line[0] in ' \t':

[476] Fix | Delete

if not lastheader:

[477] Fix | Delete

# The first line of the headers was a continuation. This

[478] Fix | Delete

# is illegal, so let's note the defect, store the illegal

[479] Fix | Delete

# line, and ignore it for purposes of headers.

[480] Fix | Delete

defect = errors.FirstHeaderLineIsContinuationDefect(line)

[481] Fix | Delete

self.policy.handle_defect(self._cur, defect)

[482] Fix | Delete

continue

[483] Fix | Delete

lastvalue.append(line)

[484] Fix | Delete

continue

[485] Fix | Delete

if lastheader:

[486] Fix | Delete

self._cur.set_raw(*self.policy.header_source_parse(lastvalue))

[487] Fix | Delete

lastheader, lastvalue = '', []

[488] Fix | Delete

# Check for envelope header, i.e. unix-from

[489] Fix | Delete

if line.startswith('From '):

[490] Fix | Delete

if lineno == 0:

[491] Fix | Delete

# Strip off the trailing newline

[492] Fix | Delete

mo = NLCRE_eol.search(line)

[493] Fix | Delete

if mo:

[494] Fix | Delete

line = line[:-len(mo.group(0))]

[495] Fix | Delete

self._cur.set_unixfrom(line)

[496] Fix | Delete

continue

[497] Fix | Delete

elif lineno == len(lines) - 1:

[498] Fix | Delete

# Something looking like a unix-from at the end - it's

[499] Fix | Delete