summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
authorAbhilash Raj <maxking@users.noreply.github.com>2019-12-09 01:35:38 (GMT)
committerGitHub <noreply@github.com>2019-12-09 01:35:38 (GMT)
commit68157da8b42b26408af5d157d2dba4fcf29c6320 (patch)
tree24b6efbd34f13ad32d02ac4981b8f97b5156d027
parent080ee5a88406fb68aaab741145cd5d2a7c5f2ad6 (diff)
downloadcpython-68157da8b42b26408af5d157d2dba4fcf29c6320.zip
cpython-68157da8b42b26408af5d157d2dba4fcf29c6320.tar.gz
cpython-68157da8b42b26408af5d157d2dba4fcf29c6320.tar.bz2
bpo-38698: Add a new InvalidMessageID token to email header parser. (GH-17503)
This adds a new InvalidMessageID token to the email header parser which can be used to represent invalid message-id headers in the parse tree.
-rw-r--r--Lib/email/_header_value_parser.py20
-rw-r--r--Lib/test/test_email/test__header_value_parser.py40
-rw-r--r--Misc/NEWS.d/next/Library/2019-12-07-21-49-50.bpo-38698.HxoSym.rst3
3 files changed, 56 insertions, 7 deletions
diff --git a/Lib/email/_header_value_parser.py b/Lib/email/_header_value_parser.py
index abdef81..cb01322 100644
--- a/Lib/email/_header_value_parser.py
+++ b/Lib/email/_header_value_parser.py
@@ -850,10 +850,15 @@ class MsgID(TokenList):
# message-id tokens may not be folded.
return str(self) + policy.linesep
+
class MessageID(MsgID):
token_type = 'message-id'
+class InvalidMessageID(MessageID):
+ token_type = 'invalid-message-id'
+
+
class Header(TokenList):
token_type = 'header'
@@ -2110,11 +2115,18 @@ def parse_message_id(value):
message_id = MessageID()
try:
token, value = get_msg_id(value)
- except errors.HeaderParseError:
- message_id.defects.append(errors.InvalidHeaderDefect(
- "Expected msg-id but found {!r}".format(value)))
- else:
message_id.append(token)
+ except errors.HeaderParseError as ex:
+ token = get_unstructured(value)
+ message_id = InvalidMessageID(token)
+ message_id.defects.append(
+ errors.InvalidHeaderDefect("Invalid msg-id: {!r}".format(ex)))
+ else:
+ # Value after parsing a valid msg_id should be None.
+ if value:
+ message_id.defects.append(errors.InvalidHeaderDefect(
+ "Unexpected {!r}".format(value)))
+
return message_id
#
diff --git a/Lib/test/test_email/test__header_value_parser.py b/Lib/test/test_email/test__header_value_parser.py
index 71168f3..d59d701 100644
--- a/Lib/test/test_email/test__header_value_parser.py
+++ b/Lib/test/test_email/test__header_value_parser.py
@@ -2639,10 +2639,44 @@ class TestParser(TestParserMixin, TestEmailBase):
self.assertEqual(msg_id.token_type, 'msg-id')
def test_get_msg_id_invalid_expected_msg_id_not_found(self):
- text = "Message-Id: 935-XPB-567:0:86089:180874:0:45327:9:90305:17843586-40@example.com"
+ text = "935-XPB-567:0:45327:9:90305:17843586-40@example.com"
msg_id = parser.parse_message_id(text)
- self.assertDefectsEqual(msg_id.all_defects,
- [errors.InvalidHeaderDefect])
+ self.assertDefectsEqual(
+ msg_id.all_defects,
+ [errors.InvalidHeaderDefect])
+
+ def test_parse_invalid_message_id(self):
+ message_id = self._test_parse_x(
+ parser.parse_message_id,
+ "935-XPB-567:0:45327:9:90305:17843586-40@example.com",
+ "935-XPB-567:0:45327:9:90305:17843586-40@example.com",
+ "935-XPB-567:0:45327:9:90305:17843586-40@example.com",
+ [errors.InvalidHeaderDefect],
+ )
+ self.assertEqual(message_id.token_type, 'invalid-message-id')
+
+ def test_parse_valid_message_id(self):
+ message_id = self._test_parse_x(
+ parser.parse_message_id,
+ "<aperson@somedomain>",
+ "<aperson@somedomain>",
+ "<aperson@somedomain>",
+ [],
+ )
+ self.assertEqual(message_id.token_type, 'message-id')
+
+ def test_parse_message_id_with_remaining(self):
+ message_id = self._test_parse_x(
+ parser.parse_message_id,
+ "<validmessageid@example>thensomething",
+ "<validmessageid@example>",
+ "<validmessageid@example>",
+ [errors.InvalidHeaderDefect],
+ [],
+ )
+ self.assertEqual(message_id.token_type, 'message-id')
+ self.assertEqual(str(message_id.all_defects[0]),
+ "Unexpected 'thensomething'")
def test_get_msg_id_no_angle_start(self):
with self.assertRaises(errors.HeaderParseError):
diff --git a/Misc/NEWS.d/next/Library/2019-12-07-21-49-50.bpo-38698.HxoSym.rst b/Misc/NEWS.d/next/Library/2019-12-07-21-49-50.bpo-38698.HxoSym.rst
new file mode 100644
index 0000000..b930dea
--- /dev/null
+++ b/Misc/NEWS.d/next/Library/2019-12-07-21-49-50.bpo-38698.HxoSym.rst
@@ -0,0 +1,3 @@
+Add a new ``InvalidMessageID`` token to email parser to represent invalid
+Message-ID headers. Also, add defects when there is remaining value after
+parsing the header.