python
diff --git a/‎Lib/email/_header_value_parser.py
Lines changed: 9 additions & 1 deletion b/‎Lib/email/_header_value_parser.py
Lines changed: 9 additions & 1 deletion
diff --git a/‎Lib/test/test_email/test__header_value_parser.py
Lines changed: 22 additions & 2 deletions b/‎Lib/test/test_email/test__header_value_parser.py
Lines changed: 22 additions & 2 deletions
diff --git a/‎Lib/test/test_email/test_headerregistry.py
Lines changed: 2 additions & 1 deletion b/‎Lib/test/test_email/test_headerregistry.py
Lines changed: 2 additions & 1 deletion
diff --git a/‎Misc/NEWS.d/next/Library/2019-05-19-10-48-46.bpo-21315.PgXVqF.rst
Lines changed: 3 additions & 0 deletions b/‎Misc/NEWS.d/next/Library/2019-05-19-10-48-46.bpo-21315.PgXVqF.rst
Lines changed: 3 additions & 0 deletions
@@ -75,7 +75,7 @@
 from email import _encoded_words as _ew
 from email import errors
 from email import utils
-
+from email.header import ecre as rfc2047_matcher
 #
 # Useful constants and functions
 #
@@ -1049,6 +1049,10 @@ def get_encoded_word(value):
         _validate_xtext(vtext)
         ew.append(vtext)
         text = ''.join(remainder)
+    # An encoded word should be followed by linear whitespace (LWS).
+    if value and value[0] != ' ':
+        ew.defects.append(errors.InvalidHeaderDefect(
+            "missing trailing whitespace after encoded-word"))
     return ew, value
 
 def get_unstructured(value):
@@ -1101,6 +1105,10 @@ def get_unstructured(value):
                 unstructured.append(token)
                 continue
         tok, *remainder = _wsp_splitter(value, 1)
+        # Split in the middle of an atom if it contains an RFC 2047 encoded
+        # word that does not have whitespace on both sides.
+        if rfc2047_matcher.search(tok):
+            tok, *remainder = value.partition('=?')
         vtext = ValueTerminal(tok, 'vtext')
         _validate_xtext(vtext)
         unstructured.append(vtext)
 
@@ -118,7 +118,7 @@ def test_get_encoded_word_gets_first_even_if_no_space(self):
                          '=?us-ascii?q?first?==?utf-8?q?second?=',
                          'first',
                          'first',
-                         [],
+                         [errors.InvalidHeaderDefect],
                          '=?utf-8?q?second?=')
 
     def test_get_encoded_word_sets_extra_attributes(self):
@@ -361,6 +361,25 @@ def test_get_unstructured_no_whitespace_between_ews(self):
             '=?utf-8?q?foo?==?utf-8?q?bar?=',
             'foobar',
             'foobar',
+            [errors.InvalidHeaderDefect,
+            errors.InvalidHeaderDefect],
+            '')
+
+    def test_get_unstructured_ew_without_leading_whitespace(self):
+        self._test_get_x(
+            self._get_unst,
+            'nowhitespace=?utf-8?q?somevalue?=',
+            'nowhitespacesomevalue',
+            'nowhitespacesomevalue',
+            [errors.InvalidHeaderDefect],
+            '')
+
+    def test_get_unstructured_ew_without_trailing_whitespace(self):
+        self._test_get_x(
+            self._get_unst,
+            '=?utf-8?q?somevalue?=nowhitespace',
+            'somevaluenowhitespace',
+            'somevaluenowhitespace',
             [errors.InvalidHeaderDefect],
             '')
 
@@ -546,7 +565,8 @@ def test_encoded_word_inside_quotes(self):
             '"=?utf-8?Q?not_really_valid?="',
             '"not really valid"',
             'not really valid',
-            [errors.InvalidHeaderDefect],
+            [errors.InvalidHeaderDefect,
+             errors.InvalidHeaderDefect],
             '')
 
     # get_comment
 
@@ -1180,7 +1180,8 @@ class TestAddressHeader(TestHeaderBase):
 
         'rfc2047_atom_in_quoted_string_is_decoded':
             ('"=?utf-8?q?=C3=89ric?=" <foo@example.com>',
-            [errors.InvalidHeaderDefect],
+            [errors.InvalidHeaderDefect,
+            errors.InvalidHeaderDefect],
             'Éric <foo@example.com>',
             'Éric',
             'foo@example.com',
 
@@ -0,0 +1,3 @@
+Email headers containing RFC 2047 encoded words with no leading whitespace are
+now parsed correctly. Also, missing trailing whitespace now registers a defect
+instead of being silently ignored.
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+Email headers containing RFC 2047 encoded words with no leading whitespace are`
	`2`	`+now parsed correctly. Also, missing trailing whitespace now registers a defect`
	`3`	`+instead of being silently ignored.`