mirror of
https://github.com/python/cpython.git
synced 2024-11-21 21:09:37 +01:00
303aac8c56
I am re-submitting an older PR which was abandoned but is still relevant, #10783 by @timb07. The issue being solved () is still relevant. The original PR #10783 was closed as the final request changes were not applied and since abandoned. In this new PR I have re-used the original patch plus applied both comments from the review, by @maxking and @pganssle. For reference, here is the original PR description: In email.utils.parsedate_to_datetime(), a failure to parse the date, or invalid date components (such as hour outside 0..23) raises an exception. Document this behaviour, and add tests to test_email/test_utils.py to confirm this behaviour. In email.headerregistry.DateHeader.parse(), check when parsedate_to_datetime() raises an exception and add a new defect InvalidDateDefect; preserve the invalid value as the string value of the header, but set the datetime attribute to None. Add tests to test_email/test_headerregistry.py to confirm this behaviour; also added test to test_email/test_inversion.py to confirm emails with such defective date headers round trip successfully. This pull request incorporates feedback gratefully received from @bitdancer, @brettcannon, @Mariatta and @warsaw, and replaces the earlier PR #2254. Automerge-Triggered-By: GH:warsaw
79 lines
2.2 KiB
Python
79 lines
2.2 KiB
Python
"""Test the parser and generator are inverses.
|
|
|
|
Note that this is only strictly true if we are parsing RFC valid messages and
|
|
producing RFC valid messages.
|
|
"""
|
|
|
|
import io
|
|
import unittest
|
|
from email import policy, message_from_bytes
|
|
from email.message import EmailMessage
|
|
from email.generator import BytesGenerator
|
|
from test.test_email import TestEmailBase, parameterize
|
|
|
|
# This is like textwrap.dedent for bytes, except that it uses \r\n for the line
|
|
# separators on the rebuilt string.
|
|
def dedent(bstr):
|
|
lines = bstr.splitlines()
|
|
if not lines[0].strip():
|
|
raise ValueError("First line must contain text")
|
|
stripamt = len(lines[0]) - len(lines[0].lstrip())
|
|
return b'\r\n'.join(
|
|
[x[stripamt:] if len(x)>=stripamt else b''
|
|
for x in lines])
|
|
|
|
|
|
@parameterize
|
|
class TestInversion(TestEmailBase):
|
|
|
|
policy = policy.default
|
|
message = EmailMessage
|
|
|
|
def msg_as_input(self, msg):
|
|
m = message_from_bytes(msg, policy=policy.SMTP)
|
|
b = io.BytesIO()
|
|
g = BytesGenerator(b)
|
|
g.flatten(m)
|
|
self.assertEqual(b.getvalue(), msg)
|
|
|
|
# XXX: spaces are not preserved correctly here yet in the general case.
|
|
msg_params = {
|
|
'header_with_one_space_body': (dedent(b"""\
|
|
From: abc@xyz.com
|
|
X-Status:\x20
|
|
Subject: test
|
|
|
|
foo
|
|
"""),),
|
|
|
|
'header_with_invalid_date': (dedent(b"""\
|
|
Date: Tue, 06 Jun 2017 27:39:33 +0600
|
|
From: abc@xyz.com
|
|
Subject: timezones
|
|
|
|
How do they work even?
|
|
"""),),
|
|
|
|
}
|
|
|
|
payload_params = {
|
|
'plain_text': dict(payload='This is a test\n'*20),
|
|
'base64_text': dict(payload=(('xy a'*40+'\n')*5), cte='base64'),
|
|
'qp_text': dict(payload=(('xy a'*40+'\n')*5), cte='quoted-printable'),
|
|
}
|
|
|
|
def payload_as_body(self, payload, **kw):
|
|
msg = self._make_message()
|
|
msg['From'] = 'foo'
|
|
msg['To'] = 'bar'
|
|
msg['Subject'] = 'payload round trip test'
|
|
msg.set_content(payload, **kw)
|
|
b = bytes(msg)
|
|
msg2 = message_from_bytes(b, policy=self.policy)
|
|
self.assertEqual(bytes(msg2), b)
|
|
self.assertEqual(msg2.get_content(), payload)
|
|
|
|
|
|
if __name__ == '__main__':
|
|
unittest.main()
|