Sign Up
Log In
Log In
or
Sign Up
Places
All Projects
Status Monitor
Collapse sidebar
SUSE:SLE-12-SP1:GA
python3-doc.30641
CVE-2023-27043-email-parsing-errors.patch
Overview
Repositories
Revisions
Requests
Users
Attributes
Meta
File CVE-2023-27043-email-parsing-errors.patch of Package python3-doc.30641
--- Doc/library/email.util.rst | 26 +++ Lib/email/utils.py | 62 ++++++- Lib/test/test_email/test_email.py | 81 +++++++++- Misc/NEWS.d/next/Security/2023-06-13-20-52-24.gh-issue-102988.Kei7Vf.rst | 4 4 files changed, 163 insertions(+), 10 deletions(-) --- a/Doc/library/email.util.rst +++ b/Doc/library/email.util.rst @@ -28,6 +28,11 @@ There are several useful utilities provi *email address* parts. Returns a tuple of that information, unless the parse fails, in which case a 2-tuple of ``('', '')`` is returned. + .. versionchanged:: 3.12 + For security reasons, addresses that were ambiguous and could parse into + multiple different addresses now cause ``('', '')`` to be returned + instead of only one of the *potential* addresses. + .. function:: formataddr(pair, charset='utf-8') @@ -50,7 +55,7 @@ There are several useful utilities provi This method returns a list of 2-tuples of the form returned by ``parseaddr()``. *fieldvalues* is a sequence of header field values as might be returned by :meth:`Message.get_all <email.message.Message.get_all>`. Here's a simple - example that gets all the recipients of a message:: + example that gets all the recipients of a message: from email.utils import getaddresses @@ -60,6 +65,25 @@ There are several useful utilities provi resent_ccs = msg.get_all('resent-cc', []) all_recipients = getaddresses(tos + ccs + resent_tos + resent_ccs) + When parsing fails for a single fieldvalue, a 2-tuple of ``('', '')`` + is returned in its place. Other errors in parsing the list of + addresses such as a fieldvalue seemingly parsing into multiple + addresses may result in a list containing a single empty 2-tuple + ``[('', '')]`` being returned rather than returning potentially + invalid output. + + Example malformed input parsing: + + .. doctest:: + + >>> from email.utils import getaddresses + >>> getaddresses(['alice@example.com <bob@example.com>', 'me@example.com']) + [('', '')] + + .. 
versionchanged:: 3.12 + The 2-tuple of ``('', '')`` in the returned values when parsing + fails was added to address a security issue. + .. function:: parsedate(date) --- a/Lib/email/utils.py +++ b/Lib/email/utils.py @@ -106,13 +106,54 @@ def formataddr(pair, charset='utf-8'): return address +def _pre_parse_validation(email_header_fields): + accepted_values = [] + for v in email_header_fields: + s = v.replace('\\(', '').replace('\\)', '') + if s.count('(') != s.count(')'): + v = "('', '')" + accepted_values.append(v) + + return accepted_values + + +def _post_parse_validation(parsed_email_header_tuples): + accepted_values = [] + # The parser would have parsed a correctly formatted domain-literal + # The existence of an [ after parsing indicates a parsing failure + for v in parsed_email_header_tuples: + if '[' in v[1]: + v = ('', '') + accepted_values.append(v) + + return accepted_values + def getaddresses(fieldvalues): - """Return a list of (REALNAME, EMAIL) for each fieldvalue.""" - all = COMMASPACE.join(fieldvalues) + """Return a list of (REALNAME, EMAIL) or ('','') for each fieldvalue. + + When parsing fails for a fieldvalue, a 2-tuple of ('', '') is returned in + its place. + + If the length of the resulting list of parsed addresses is not the same as the number of + fieldvalues in the input list, a parsing error has occurred. A list + containing a single empty 2-tuple [('', '')] is returned in its place. + This is done to avoid invalid output. 
+ """ + fieldvalues = [str(v) for v in fieldvalues] + fieldvalues = _pre_parse_validation(fieldvalues) + all = COMMASPACE.join(v for v in fieldvalues) a = _AddressList(all) - return a.addresslist + result = _post_parse_validation(a.addresslist) + + n = 0 + for v in fieldvalues: + n += v.count(',') + 1 + if len(result) != n: + return [('', '')] + + return result ecre = re.compile(r''' @@ -215,9 +256,18 @@ def parsedate_to_datetime(data): def parseaddr(addr): - addrs = _AddressList(addr).addresslist - if not addrs: - return '', '' + if isinstance(addr, list): + addr = addr[0] + + if not isinstance(addr, str): + return ('', '') + + addr = _pre_parse_validation([addr])[0] + addrs = _post_parse_validation(_AddressList(addr).addresslist) + + if not addrs or len(addrs) > 1: + return ('', '') + return addrs[0] --- a/Lib/test/test_email/test_email.py +++ b/Lib/test/test_email/test_email.py @@ -3154,15 +3154,90 @@ Foo [('Al Person', 'aperson@dom.ain'), ('Bud Person', 'bperson@dom.ain')]) + def test_getaddresses_parsing_errors(self): + """Test for parsing errors from CVE-2023-27043""" + eq = self.assertEqual + eq(utils.getaddresses(['alice@example.org(<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org)<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org<<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org><bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org@<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org,<bob@example.com>']), + [('', 'alice@example.org'), ('', 'bob@example.com')]) + eq(utils.getaddresses(['alice@example.org;<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org:<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org.<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org"<bob@example.com>']), + [('', '')]) + 
eq(utils.getaddresses(['alice@example.org[<bob@example.com>']), + [('', '')]) + eq(utils.getaddresses(['alice@example.org]<bob@example.com>']), + [('', '')]) + + def test_parseaddr_parsing_errors(self): + """Test for parsing errors from CVE-2023-27043""" + eq = self.assertEqual + eq(utils.parseaddr(['alice@example.org(<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org)<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org<<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org><bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org@<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org,<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org;<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org:<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org.<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org"<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org[<bob@example.com>']), + ('', '')) + eq(utils.parseaddr(['alice@example.org]<bob@example.com>']), + ('', '')) + def test_getaddresses_nasty(self): eq = self.assertEqual eq(utils.getaddresses(['foo: ;']), [('', '')]) - eq(utils.getaddresses( - ['[]*-- =~$']), - [('', ''), ('', ''), ('', '*--')]) + eq(utils.getaddresses(['[]*-- =~$']), [('', '')]) eq(utils.getaddresses( ['foo: ;', '"Jason R. Mastaler" <jason@dom.ain>']), [('', ''), ('Jason R. Mastaler', 'jason@dom.ain')]) + eq(utils.getaddresses( + [r'Pete(A nice \) chap) <pete(his account)@silly.test(his host)>']), + [('Pete (A nice ) chap his account his host)', 'pete@silly.test')]) + eq(utils.getaddresses( + ['(Empty list)(start)Undisclosed recipients :(nobody(I know))']), + [('', '')]) + eq(utils.getaddresses( + ['Mary <@machine.tld:mary@example.net>, , jdoe@test . 
example']), + [('Mary', 'mary@example.net'), ('', ''), ('', 'jdoe@test.example')]) + eq(utils.getaddresses( + ['John Doe <jdoe@machine(comment). example>']), + [('John Doe (comment)', 'jdoe@machine.example')]) + eq(utils.getaddresses( + ['"Mary Smith: Personal Account" <smith@home.example>']), + [('Mary Smith: Personal Account', 'smith@home.example')]) + eq(utils.getaddresses( + ['Undisclosed recipients:;']), + [('', '')]) + eq(utils.getaddresses( + [r'<boss@nil.test>, "Giant; \"Big\" Box" <bob@example.net>']), + [('', 'boss@nil.test'), ('Giant; "Big" Box', 'bob@example.net')]) def test_getaddresses_embedded_comment(self): """Test proper handling of a nested comment""" --- /dev/null +++ b/Misc/NEWS.d/next/Security/2023-06-13-20-52-24.gh-issue-102988.Kei7Vf.rst @@ -0,0 +1,4 @@ +CVE-2023-27043: Prevent :func:`email.utils.parseaddr` +and :func:`email.utils.getaddresses` from returning the realname portion of an +invalid RFC2822 email header in the email address portion of the 2-tuple +returned after being parsed by :class:`email._parseaddr.AddressList`.
Locations
Projects
Search
Status Monitor
Help
OpenBuildService.org
Documentation
API Documentation
Code of Conduct
Contact
Support
@OBShq
Terms
openSUSE Build Service is sponsored by
The Open Build Service is an
openSUSE project
.
Sign Up
Log In
Places
Places
All Projects
Status Monitor