From python-checkins at python.org Sat Nov 1 00:49:04 2014 From: python-checkins at python.org (ethan.furman) Date: Fri, 31 Oct 2014 23:49:04 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_issue22780=3A_update_NotIm?= =?utf-8?q?plemented_description?= Message-ID: <20141031234904.120736.58013@psf.io> https://hg.python.org/cpython/rev/26d0a17affb5 changeset: 93327:26d0a17affb5 parent: 93325:c95ce9b0a085 user: Ethan Furman date: Fri Oct 31 16:48:41 2014 -0700 summary: issue22780: update NotImplemented description files: Doc/library/constants.rst | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Doc/library/constants.rst b/Doc/library/constants.rst --- a/Doc/library/constants.rst +++ b/Doc/library/constants.rst @@ -26,9 +26,9 @@ .. data:: NotImplemented - Special value which can be returned by the "rich comparison" special methods - (:meth:`__eq__`, :meth:`__lt__`, and friends), to indicate that the comparison - is not implemented with respect to the other type. + Special value which should be returned by the special methods + (:meth:`__eq__`, :meth:`__lt__`, :meth:`__add__`, etc.) to indicate + that the operation is not implemented with respect to the other type. .. data:: Ellipsis -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 00:54:33 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 31 Oct 2014 23:54:33 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_2=2E7=2E9_concrete_dates?= Message-ID: <20141031235433.109256.52937@psf.io> https://hg.python.org/peps/rev/8df0058f32cc changeset: 5591:8df0058f32cc user: Benjamin Peterson date: Fri Oct 31 19:54:32 2014 -0400 summary: 2.7.9 concrete dates files: pep-0373.txt | 3 ++- 1 files changed, 2 insertions(+), 1 deletions(-) diff --git a/pep-0373.txt b/pep-0373.txt --- a/pep-0373.txt +++ b/pep-0373.txt @@ -71,7 +71,8 @@ Planned future release dates: -- 2.7.9 December 2014 +- 2.7.9rc1 2014-11-22 +- 2.7.9 2014-12-05 - 2.7.10 June 2015 - beyond this date, releases as needed -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sat Nov 1 09:46:01 2014 From: python-checkins at python.org (berker.peksag) Date: Sat, 01 Nov 2014 08:46:01 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=236623=3A_Remove_de?= =?utf-8?q?precated_Netrc_class_in_the_ftplib_module=2E?= Message-ID: <20141101084600.101688.80686@psf.io> https://hg.python.org/cpython/rev/ec196a99af8d changeset: 93328:ec196a99af8d user: Berker Peksag date: Sat Nov 01 10:45:57 2014 +0200 summary: Issue #6623: Remove deprecated Netrc class in the ftplib module. Patch by Matt Chaput. files: Doc/whatsnew/3.5.rst | 8 + Lib/ftplib.py | 117 +-------------------------- Lib/test/test_ftplib.py | 23 +---- Misc/ACKS | 1 + Misc/NEWS | 3 + 5 files changed, 23 insertions(+), 129 deletions(-) diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -369,10 +369,18 @@ Removed ======= +API and Feature Removals +------------------------ + +The following obsolete and previously deprecated APIs and features have been +removed: + * The ``__version__`` attribute has been dropped from the email package. The email code hasn't been shipped separately from the stdlib for a long time, and the ``__version__`` string was not updated in the last few releases. +* The internal ``Netrc`` class in the :mod:`ftplib` module was deprecated in + 3.4, and has now been removed. (Contributed by Matt Chaput in :issue:`6623`.) 
Porting to Python 3.5 ===================== diff --git a/Lib/ftplib.py b/Lib/ftplib.py --- a/Lib/ftplib.py +++ b/Lib/ftplib.py @@ -42,7 +42,7 @@ import warnings from socket import _GLOBAL_DEFAULT_TIMEOUT -__all__ = ["FTP", "Netrc"] +__all__ = ["FTP"] # Magic number from MSG_OOB = 0x1 # Process data out of band @@ -920,115 +920,6 @@ target.voidresp() -class Netrc: - """Class to parse & provide access to 'netrc' format files. - - See the netrc(4) man page for information on the file format. - - WARNING: This class is obsolete -- use module netrc instead. - - """ - __defuser = None - __defpasswd = None - __defacct = None - - def __init__(self, filename=None): - warnings.warn("This class is deprecated, use the netrc module instead", - DeprecationWarning, 2) - if filename is None: - if "HOME" in os.environ: - filename = os.path.join(os.environ["HOME"], - ".netrc") - else: - raise OSError("specify file to load or set $HOME") - self.__hosts = {} - self.__macros = {} - fp = open(filename, "r") - in_macro = 0 - while 1: - line = fp.readline() - if not line: - break - if in_macro and line.strip(): - macro_lines.append(line) - continue - elif in_macro: - self.__macros[macro_name] = tuple(macro_lines) - in_macro = 0 - words = line.split() - host = user = passwd = acct = None - default = 0 - i = 0 - while i < len(words): - w1 = words[i] - if i+1 < len(words): - w2 = words[i + 1] - else: - w2 = None - if w1 == 'default': - default = 1 - elif w1 == 'machine' and w2: - host = w2.lower() - i = i + 1 - elif w1 == 'login' and w2: - user = w2 - i = i + 1 - elif w1 == 'password' and w2: - passwd = w2 - i = i + 1 - elif w1 == 'account' and w2: - acct = w2 - i = i + 1 - elif w1 == 'macdef' and w2: - macro_name = w2 - macro_lines = [] - in_macro = 1 - break - i = i + 1 - if default: - self.__defuser = user or self.__defuser - self.__defpasswd = passwd or self.__defpasswd - self.__defacct = acct or self.__defacct - if host: - if host in self.__hosts: - ouser, opasswd, oacct = \ - self.__hosts[host] - user = user or ouser - passwd = passwd or opasswd - acct = acct or oacct - self.__hosts[host] = user, passwd, acct - fp.close() - - def get_hosts(self): - """Return a list of hosts mentioned in the .netrc file.""" - return self.__hosts.keys() - - def get_account(self, host): - """Returns login information for the named host. - - The return value is a triple containing userid, - password, and the accounting field. - - """ - host = host.lower() - user = passwd = acct = None - if host in self.__hosts: - user, passwd, acct = self.__hosts[host] - user = user or self.__defuser - passwd = passwd or self.__defpasswd - acct = acct or self.__defacct - return user, passwd, acct - - def get_macros(self): - """Return a list of all defined macro names.""" - return self.__macros.keys() - - def get_macro(self, macro): - """Return a sequence of lines which define a named macro.""" - return self.__macros[macro] - - - def test(): '''Test program. Usage: ftp [-d] [-r[file]] host [-l[dir]] [-d[dir]] [-p] [file] ... 
@@ -1042,6 +933,8 @@ print(test.__doc__) sys.exit(0) + import netrc + debugging = 0 rcfile = None while sys.argv[1] == '-d': @@ -1056,14 +949,14 @@ ftp.set_debuglevel(debugging) userid = passwd = acct = '' try: - netrc = Netrc(rcfile) + netrcobj = netrc.netrc(rcfile) except OSError: if rcfile is not None: sys.stderr.write("Could not open account file" " -- using anonymous login.") else: try: - userid, passwd, acct = netrc.get_account(host) + userid, acct, passwd = netrcobj.authenticators(host) except KeyError: # no account for host sys.stderr.write( diff --git a/Lib/test/test_ftplib.py b/Lib/test/test_ftplib.py --- a/Lib/test/test_ftplib.py +++ b/Lib/test/test_ftplib.py @@ -76,7 +76,7 @@ super(DummyDTPHandler, self).push(what.encode('ascii')) def handle_error(self): - raise + raise Exception class DummyFTPHandler(asynchat.async_chat): @@ -121,7 +121,7 @@ self.push('550 command "%s" not understood.' %cmd) def handle_error(self): - raise + raise Exception def push(self, data): asynchat.async_chat.push(self, data.encode('ascii') + b'\r\n') @@ -299,7 +299,7 @@ return 0 def handle_error(self): - raise + raise Exception if ssl is not None: @@ -397,7 +397,7 @@ raise def handle_error(self): - raise + raise Exception def close(self): if (isinstance(self.socket, ssl.SSLSocket) and @@ -673,7 +673,7 @@ self.assertRaises(StopIteration, next, self.client.mlsd()) set_data('') for x in self.client.mlsd(): - self.fail("unexpected data %s" % data) + self.fail("unexpected data %s" % x) def test_makeport(self): with self.client.makeport(): @@ -1053,19 +1053,8 @@ ftp.close() -class TestNetrcDeprecation(TestCase): - - def test_deprecation(self): - with support.temp_cwd(), support.EnvironmentVarGuard() as env: - env['HOME'] = os.getcwd() - open('.netrc', 'w').close() - with self.assertWarns(DeprecationWarning): - ftplib.Netrc() - - - def test_main(): - tests = [TestFTPClass, TestTimeouts, TestNetrcDeprecation, + tests = [TestFTPClass, TestTimeouts, TestIPv6Environment, TestTLS_FTPClassMixin, TestTLS_FTPClass] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -233,6 +233,7 @@ Brad Chapman Greg Chapman Mitch Chapman +Matt Chaput Yogesh Chaudhari David Chaum Nicolas Chauvat diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -180,6 +180,9 @@ Library ------- +- Issue #6623: Remove deprecated Netrc class in the ftplib module. Patch by + Matt Chaput. + - Issue #17381: Fixed handling of case-insensitive ranges in regular expressions. 
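The updated test() helper above already shows the migration path away from the removed ftplib.Netrc class: parse the file with the stdlib netrc module and read credentials with authenticators(). A minimal sketch of that pattern (the netrc file path and host name below are placeholders):

    import netrc
    from ftplib import FTP

    # The stdlib netrc module replaces the removed ftplib.Netrc class.
    info = netrc.netrc()                           # or netrc.netrc('/path/to/netrc')
    auth = info.authenticators('ftp.example.com')  # (login, account, password) or None
    if auth is not None:
        userid, acct, passwd = auth
        ftp = FTP('ftp.example.com')
        ftp.login(userid, passwd, acct or '')
        ftp.quit()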
-- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sat Nov 1 10:05:40 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sat, 01 Nov 2014 10:05:40 +0100 Subject: [Python-checkins] Daily reference leaks (26d0a17affb5): sum=3 Message-ID: results for 26d0a17affb5 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogP2wzaR', '-x'] From python-checkins at python.org Sat Nov 1 10:05:39 2014 From: python-checkins at python.org (berker.peksag) Date: Sat, 01 Nov 2014 09:05:39 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322665=3A_Add_missing_get=5Fterminal=5Fsize_and_?= =?utf-8?q?SameFileError_to_shutil=2E=5F=5Fall=5F=5F=2E?= Message-ID: <20141101090538.120714.80210@psf.io> https://hg.python.org/cpython/rev/193ac288bc7f changeset: 93330:193ac288bc7f parent: 93328:ec196a99af8d parent: 93329:232520144c6c user: Berker Peksag date: Sat Nov 01 11:05:36 2014 +0200 summary: Issue #22665: Add missing get_terminal_size and SameFileError to shutil.__all__. files: Lib/shutil.py | 3 ++- Lib/test/test_shutil.py | 18 ++++++++++++++++++ Misc/NEWS | 3 +++ 3 files changed, 23 insertions(+), 1 deletions(-) diff --git a/Lib/shutil.py b/Lib/shutil.py --- a/Lib/shutil.py +++ b/Lib/shutil.py @@ -42,7 +42,8 @@ "register_archive_format", "unregister_archive_format", "get_unpack_formats", "register_unpack_format", "unregister_unpack_format", "unpack_archive", - "ignore_patterns", "chown", "which"] + "ignore_patterns", "chown", "which", "get_terminal_size", + "SameFileError"] # disk_usage is added later, if available on the platform class Error(OSError): diff --git a/Lib/test/test_shutil.py b/Lib/test/test_shutil.py --- a/Lib/test/test_shutil.py +++ b/Lib/test/test_shutil.py @@ -1788,5 +1788,23 @@ self.assertEqual(expected, actual) +class PublicAPITests(unittest.TestCase): + """Ensures that the correct values are exposed in the public API.""" + + def test_module_all_attribute(self): + self.assertTrue(hasattr(shutil, '__all__')) + target_api = ['copyfileobj', 'copyfile', 'copymode', 'copystat', + 'copy', 'copy2', 'copytree', 'move', 'rmtree', 'Error', + 'SpecialFileError', 'ExecError', 'make_archive', + 'get_archive_formats', 'register_archive_format', + 'unregister_archive_format', 'get_unpack_formats', + 'register_unpack_format', 'unregister_unpack_format', + 'unpack_archive', 'ignore_patterns', 'chown', 'which', + 'get_terminal_size', 'SameFileError'] + if hasattr(os, 'statvfs') or os.name == 'nt': + target_api.append('disk_usage') + self.assertEqual(set(shutil.__all__), set(target_api)) + + if __name__ == '__main__': unittest.main() diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -180,6 +180,9 @@ Library ------- +- Issue #22665: Add missing get_terminal_size and SameFileError to + shutil.__all__. + - Issue #6623: Remove deprecated Netrc class in the ftplib module. Patch by Matt Chaput. 
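A quick check of what the fix delivers, assuming an interpreter that includes this change: the two previously missing names are now listed in shutil.__all__ and therefore survive a star import.

    import shutil

    # Both names are now part of the documented public API.
    assert 'get_terminal_size' in shutil.__all__
    assert 'SameFileError' in shutil.__all__

    from shutil import *            # illustrative only
    print(get_terminal_size())      # e.g. os.terminal_size(columns=80, lines=24)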
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 10:05:39 2014 From: python-checkins at python.org (berker.peksag) Date: Sat, 01 Nov 2014 09:05:39 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjY1?= =?utf-8?q?=3A_Add_missing_get=5Fterminal=5Fsize_and_SameFileError_to_shut?= =?utf-8?b?aWwuX19hbGxfXy4=?= Message-ID: <20141101090538.109280.86646@psf.io> https://hg.python.org/cpython/rev/232520144c6c changeset: 93329:232520144c6c branch: 3.4 parent: 93324:147518a95b60 user: Berker Peksag date: Sat Nov 01 11:04:06 2014 +0200 summary: Issue #22665: Add missing get_terminal_size and SameFileError to shutil.__all__. files: Lib/shutil.py | 3 ++- Lib/test/test_shutil.py | 18 ++++++++++++++++++ Misc/NEWS | 3 +++ 3 files changed, 23 insertions(+), 1 deletions(-) diff --git a/Lib/shutil.py b/Lib/shutil.py --- a/Lib/shutil.py +++ b/Lib/shutil.py @@ -36,7 +36,8 @@ "register_archive_format", "unregister_archive_format", "get_unpack_formats", "register_unpack_format", "unregister_unpack_format", "unpack_archive", - "ignore_patterns", "chown", "which"] + "ignore_patterns", "chown", "which", "get_terminal_size", + "SameFileError"] # disk_usage is added later, if available on the platform class Error(OSError): diff --git a/Lib/test/test_shutil.py b/Lib/test/test_shutil.py --- a/Lib/test/test_shutil.py +++ b/Lib/test/test_shutil.py @@ -1762,5 +1762,23 @@ self.assertEqual(expected, actual) +class PublicAPITests(unittest.TestCase): + """Ensures that the correct values are exposed in the public API.""" + + def test_module_all_attribute(self): + self.assertTrue(hasattr(shutil, '__all__')) + target_api = ['copyfileobj', 'copyfile', 'copymode', 'copystat', + 'copy', 'copy2', 'copytree', 'move', 'rmtree', 'Error', + 'SpecialFileError', 'ExecError', 'make_archive', + 'get_archive_formats', 'register_archive_format', + 'unregister_archive_format', 'get_unpack_formats', + 'register_unpack_format', 'unregister_unpack_format', + 'unpack_archive', 'ignore_patterns', 'chown', 'which', + 'get_terminal_size', 'SameFileError'] + if hasattr(os, 'statvfs') or os.name == 'nt': + target_api.append('disk_usage') + self.assertEqual(set(shutil.__all__), set(target_api)) + + if __name__ == '__main__': unittest.main() diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -33,6 +33,9 @@ Library ------- +- Issue #22665: Add missing get_terminal_size and SameFileError to + shutil.__all__. + - Issue #17381: Fixed handling of case-insensitive ranges in regular expressions. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 15:40:47 2014 From: python-checkins at python.org (ethan.furman) Date: Sat, 01 Nov 2014 14:40:47 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_standardize_Enum_docs_by_r?= =?utf-8?q?eferring_to_=27special_methods=27_instead_of_=5F=5Fdunder=5F=5F?= Message-ID: <20141101144044.101698.67174@psf.io> https://hg.python.org/cpython/rev/149490bbd260 changeset: 93331:149490bbd260 user: Ethan Furman date: Sat Nov 01 07:40:22 2014 -0700 summary: standardize Enum docs by referring to 'special methods' instead of __dunder__ methods files: Doc/library/enum.rst | 10 +++++----- 1 files changed, 5 insertions(+), 5 deletions(-) diff --git a/Doc/library/enum.rst b/Doc/library/enum.rst --- a/Doc/library/enum.rst +++ b/Doc/library/enum.rst @@ -314,11 +314,11 @@ >>> str(Mood.funky) 'my custom str! 
1' -The rules for what is allowed are as follows: _sunder_ names (starting and -ending with a single underscore) are reserved by enum and cannot be used; -all other attributes defined within an enumeration will become members of this -enumeration, with the exception of *__dunder__* names and descriptors (methods -are also descriptors). +The rules for what is allowed are as follows: names that start and end with a +with a single underscore are reserved by enum and cannot be used; all other +attributes defined within an enumeration will become members of this +enumeration, with the exception of special methods (:meth:`__str__`, +:meth:`__add__`, etc.) and descriptors (methods are also descriptors). Note: if your enumeration defines :meth:`__new__` and/or :meth:`__init__` then whatever value(s) were given to the enum member will be passed into those -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 21:01:12 2014 From: python-checkins at python.org (vinay.sajip) Date: Sat, 01 Nov 2014 20:01:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Brought_exclud?= =?utf-8?q?ed_code_into_the_scope_of_a_try_block_in_SysLogHandler=2Eemit?= =?utf-8?b?KCku?= Message-ID: <20141101200109.120724.27785@psf.io> https://hg.python.org/cpython/rev/f6a906541476 changeset: 93333:f6a906541476 branch: 3.4 parent: 93329:232520144c6c user: Vinay Sajip date: Sat Nov 01 19:58:47 2014 +0000 summary: Brought excluded code into the scope of a try block in SysLogHandler.emit(). files: Lib/logging/handlers.py | 28 ++++++++++++++-------------- Misc/NEWS | 3 +++ 2 files changed, 17 insertions(+), 14 deletions(-) diff --git a/Lib/logging/handlers.py b/Lib/logging/handlers.py --- a/Lib/logging/handlers.py +++ b/Lib/logging/handlers.py @@ -879,21 +879,21 @@ The record is formatted, and then sent to the syslog server. If exception information is present, it is NOT sent to the server. """ - msg = self.format(record) - if self.ident: - msg = self.ident + msg - if self.append_nul: - msg += '\000' + try: + msg = self.format(record) + if self.ident: + msg = self.ident + msg + if self.append_nul: + msg += '\000' - # We need to convert record level to lowercase, maybe this will - # change in the future. - prio = '<%d>' % self.encodePriority(self.facility, - self.mapPriority(record.levelname)) - prio = prio.encode('utf-8') - # Message is a string. Convert to bytes as required by RFC 5424 - msg = msg.encode('utf-8') - msg = prio + msg - try: + # We need to convert record level to lowercase, maybe this will + # change in the future. + prio = '<%d>' % self.encodePriority(self.facility, + self.mapPriority(record.levelname)) + prio = prio.encode('utf-8') + # Message is a string. Convert to bytes as required by RFC 5424 + msg = msg.encode('utf-8') + msg = prio + msg if self.unixsocket: try: self.socket.send(msg) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -33,6 +33,9 @@ Library ------- +- Issue #22776: Brought excluded code into the scope of a try block in + SysLogHandler.emit(). + - Issue #22665: Add missing get_terminal_size and SameFileError to shutil.__all__. 
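The practical effect of moving the formatting code inside the try block: an exception raised while the message is being built is now routed to handleError() instead of escaping from emit(). A small sketch (the syslog socket address is an assumption; adjust it for your system):

    import logging
    import logging.handlers

    logger = logging.getLogger('syslog-demo')
    # '/dev/log' is the usual local syslog socket on Linux.
    handler = logging.handlers.SysLogHandler(address='/dev/log')
    logger.addHandler(handler)

    # Bad arguments make format() raise inside emit(); with this change the
    # error is handled via handler.handleError(record) rather than propagating.
    logger.error('%d items failed', 'not-a-number')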
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 21:01:12 2014 From: python-checkins at python.org (vinay.sajip) Date: Sat, 01 Nov 2014 20:01:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Closes_=2322776=3A_Merged_fix_from_3=2E4=2E?= Message-ID: <20141101200109.101682.22068@psf.io> https://hg.python.org/cpython/rev/54549f9b2ecc changeset: 93334:54549f9b2ecc parent: 93331:149490bbd260 parent: 93333:f6a906541476 user: Vinay Sajip date: Sat Nov 01 20:00:56 2014 +0000 summary: Closes #22776: Merged fix from 3.4. files: Lib/logging/handlers.py | 28 ++++++++++++++-------------- Misc/NEWS | 3 +++ 2 files changed, 17 insertions(+), 14 deletions(-) diff --git a/Lib/logging/handlers.py b/Lib/logging/handlers.py --- a/Lib/logging/handlers.py +++ b/Lib/logging/handlers.py @@ -879,21 +879,21 @@ The record is formatted, and then sent to the syslog server. If exception information is present, it is NOT sent to the server. """ - msg = self.format(record) - if self.ident: - msg = self.ident + msg - if self.append_nul: - msg += '\000' + try: + msg = self.format(record) + if self.ident: + msg = self.ident + msg + if self.append_nul: + msg += '\000' - # We need to convert record level to lowercase, maybe this will - # change in the future. - prio = '<%d>' % self.encodePriority(self.facility, - self.mapPriority(record.levelname)) - prio = prio.encode('utf-8') - # Message is a string. Convert to bytes as required by RFC 5424 - msg = msg.encode('utf-8') - msg = prio + msg - try: + # We need to convert record level to lowercase, maybe this will + # change in the future. + prio = '<%d>' % self.encodePriority(self.facility, + self.mapPriority(record.levelname)) + prio = prio.encode('utf-8') + # Message is a string. Convert to bytes as required by RFC 5424 + msg = msg.encode('utf-8') + msg = prio + msg if self.unixsocket: try: self.socket.send(msg) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -180,6 +180,9 @@ Library ------- +- Issue #22776: Brought excluded code into the scope of a try block in + SysLogHandler.emit(). + - Issue #22665: Add missing get_terminal_size and SameFileError to shutil.__all__. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 21:01:12 2014 From: python-checkins at python.org (vinay.sajip) Date: Sat, 01 Nov 2014 20:01:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Brought_exclud?= =?utf-8?q?ed_code_into_the_scope_of_a_try_block_in_SysLogHandler=2Eemit?= =?utf-8?b?KCku?= Message-ID: <20141101200108.109268.11270@psf.io> https://hg.python.org/cpython/rev/ea7b64406396 changeset: 93332:ea7b64406396 branch: 2.7 parent: 93326:3f13f1620d70 user: Vinay Sajip date: Sat Nov 01 19:56:13 2014 +0000 summary: Brought excluded code into the scope of a try block in SysLogHandler.emit(). files: Lib/logging/handlers.py | 22 +++++++++++----------- Misc/NEWS | 3 +++ 2 files changed, 14 insertions(+), 11 deletions(-) diff --git a/Lib/logging/handlers.py b/Lib/logging/handlers.py --- a/Lib/logging/handlers.py +++ b/Lib/logging/handlers.py @@ -840,18 +840,18 @@ The record is formatted, and then sent to the syslog server. If exception information is present, it is NOT sent to the server. """ - msg = self.format(record) + '\000' - """ - We need to convert record level to lowercase, maybe this will - change in the future. 
- """ - prio = '<%d>' % self.encodePriority(self.facility, - self.mapPriority(record.levelname)) - # Message is a string. Convert to bytes as required by RFC 5424 - if type(msg) is unicode: - msg = msg.encode('utf-8') - msg = prio + msg try: + msg = self.format(record) + '\000' + """ + We need to convert record level to lowercase, maybe this will + change in the future. + """ + prio = '<%d>' % self.encodePriority(self.facility, + self.mapPriority(record.levelname)) + # Message is a string. Convert to bytes as required by RFC 5424 + if type(msg) is unicode: + msg = msg.encode('utf-8') + msg = prio + msg if self.unixsocket: try: self.socket.send(msg) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #22776: Brought excluded code into the scope of a try block in + SysLogHandler.emit(). + - Issue #17381: Fixed ranges handling in case-insensitive regular expressions. - Issue #19329: Optimized compiling charsets in regular expressions. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 23:11:38 2014 From: python-checkins at python.org (steve.dower) Date: Sat, 01 Nov 2014 22:11:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_=2322731_test=5Fcapi_test_?= =?utf-8?q?fails_because_of_mismatched_newlines?= Message-ID: <20141101221136.109258.64289@psf.io> https://hg.python.org/cpython/rev/edb270e5c9c3 changeset: 93335:edb270e5c9c3 user: Steve Dower date: Sat Nov 01 15:11:05 2014 -0700 summary: #22731 test_capi test fails because of mismatched newlines files: Lib/test/test_capi.py | 7 ++++--- 1 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_capi.py b/Lib/test/test_capi.py --- a/Lib/test/test_capi.py +++ b/Lib/test/test_capi.py @@ -304,12 +304,13 @@ cmd.extend(args) p = subprocess.Popen(cmd, stdout=subprocess.PIPE, - stderr=subprocess.PIPE) + stderr=subprocess.PIPE, + universal_newlines=True) (out, err) = p.communicate() self.assertEqual(p.returncode, 0, "bad returncode %d, stderr is %r" % (p.returncode, err)) - return out.decode("latin1"), err.decode("latin1") + return out, err def test_subinterps(self): # This is just a "don't crash" test @@ -339,7 +340,7 @@ expected_errors = sys.__stdout__.errors expected_stdin_encoding = sys.__stdin__.encoding expected_pipe_encoding = self._get_default_pipe_encoding() - expected_output = os.linesep.join([ + expected_output = '\n'.join([ "--- Use defaults ---", "Expected encoding: default", "Expected errors: default", -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 23:16:09 2014 From: python-checkins at python.org (steve.dower) Date: Sat, 01 Nov 2014 22:16:09 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_=2322732_ctypes_tests_don?= =?utf-8?q?=27t_set_correct_restype_for_intptr=5Ft_functions?= Message-ID: <20141101221607.111420.13171@psf.io> https://hg.python.org/cpython/rev/a944fe09fae8 changeset: 93336:a944fe09fae8 user: Steve Dower date: Sat Nov 01 15:14:27 2014 -0700 summary: #22732 ctypes tests don't set correct restype for intptr_t functions files: Lib/ctypes/test/test_pointers.py | 5 ++++- Lib/ctypes/test/test_prototypes.py | 5 ++++- 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/Lib/ctypes/test/test_pointers.py b/Lib/ctypes/test/test_pointers.py --- a/Lib/ctypes/test/test_pointers.py +++ b/Lib/ctypes/test/test_pointers.py @@ -24,7 +24,10 @@ def test_pass_pointers(self): dll = CDLL(_ctypes_test.__file__) func = dll._testfunc_p_p - func.restype = c_long + if 
sizeof(c_longlong) == sizeof(c_void_p): + func.restype = c_longlong + else: + func.restype = c_long i = c_int(12345678) ## func.argtypes = (POINTER(c_int),) diff --git a/Lib/ctypes/test/test_prototypes.py b/Lib/ctypes/test/test_prototypes.py --- a/Lib/ctypes/test/test_prototypes.py +++ b/Lib/ctypes/test/test_prototypes.py @@ -69,7 +69,10 @@ def test_int_pointer_arg(self): func = testdll._testfunc_p_p - func.restype = c_long + if sizeof(c_longlong) == sizeof(c_void_p): + func.restype = c_longlong + else: + func.restype = c_long self.assertEqual(0, func(0)) ci = c_int(0) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 1 23:16:09 2014 From: python-checkins at python.org (steve.dower) Date: Sat, 01 Nov 2014 22:16:09 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_=2322734_marshal_needs_a_l?= =?utf-8?q?ower_stack_depth_for_debug_builds_on_Windows?= Message-ID: <20141101221608.111404.71617@psf.io> https://hg.python.org/cpython/rev/c2a3865a59f4 changeset: 93337:c2a3865a59f4 user: Steve Dower date: Sat Nov 01 15:15:16 2014 -0700 summary: #22734 marshal needs a lower stack depth for debug builds on Windows files: Lib/test/test_marshal.py | 2 +- Python/marshal.c | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_marshal.py b/Lib/test/test_marshal.py --- a/Lib/test/test_marshal.py +++ b/Lib/test/test_marshal.py @@ -188,7 +188,7 @@ head = last = [] # The max stack depth should match the value in Python/marshal.c. if os.name == 'nt' and hasattr(sys, 'gettotalrefcount'): - MAX_MARSHAL_STACK_DEPTH = 1500 + MAX_MARSHAL_STACK_DEPTH = 1000 else: MAX_MARSHAL_STACK_DEPTH = 2000 for i in range(MAX_MARSHAL_STACK_DEPTH - 2): diff --git a/Python/marshal.c b/Python/marshal.c --- a/Python/marshal.c +++ b/Python/marshal.c @@ -19,7 +19,7 @@ * On Windows debug builds, reduce this value. */ #if defined(MS_WINDOWS) && defined(_DEBUG) -#define MAX_MARSHAL_STACK_DEPTH 1500 +#define MAX_MARSHAL_STACK_DEPTH 1000 #else #define MAX_MARSHAL_STACK_DEPTH 2000 #endif -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 00:43:50 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 01 Nov 2014 23:43:50 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE3NzE3?= =?utf-8?q?=3A_Pull_NASM_from_svn=2Epython=2Eorg_for_OpenSSL_build=2E?= Message-ID: <20141101234349.35248.64114@psf.io> https://hg.python.org/cpython/rev/f7ed3e058fca changeset: 93339:f7ed3e058fca branch: 3.4 parent: 93333:f6a906541476 user: Zachary Ware date: Sat Nov 01 17:11:08 2014 -0500 summary: Issue #17717: Pull NASM from svn.python.org for OpenSSL build. files: Misc/NEWS | 3 +++ PCbuild/build_ssl.py | 11 +++++++++++ PCbuild/readme.txt | 4 +++- Tools/buildbot/external-common.bat | 4 ++++ 4 files changed, 21 insertions(+), 1 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -126,6 +126,9 @@ Windows ------- +- Issue #17717: The Windows build scripts now use a copy of NASM pulled from + svn.python.org to build OpenSSL. + - Issue #22644: The bundled version of OpenSSL has been updated to 1.0.1j. What's New in Python 3.4.2? diff --git a/PCbuild/build_ssl.py b/PCbuild/build_ssl.py --- a/PCbuild/build_ssl.py +++ b/PCbuild/build_ssl.py @@ -182,6 +182,17 @@ if ssl_dir is None: sys.exit(1) + # add our copy of NASM to PATH. 
It will be on the same level as openssl + for dir in os.listdir(os.path.join(ssl_dir, os.pardir)): + if dir.startswith('nasm'): + nasm_dir = os.path.join(ssl_dir, os.pardir, dir) + nasm_dir = os.path.abspath(nasm_dir) + os.environ['PATH'] += os.pathsep.join(['', nasm_dir]) + break + else: + print('NASM was not found, make sure it is on PATH') + + old_cd = os.getcwd() try: os.chdir(ssl_dir) diff --git a/PCbuild/readme.txt b/PCbuild/readme.txt --- a/PCbuild/readme.txt +++ b/PCbuild/readme.txt @@ -182,7 +182,9 @@ to be somewhere on your PATH. More recent versions of OpenSSL may need a later version of NASM. If OpenSSL's self tests don't pass, you should first try to update NASM and do a full rebuild of - OpenSSL. + OpenSSL. If you use the Tools\buildbot\external(-amd64).bat method + for getting sources, it also downloads a version of NASM which the + ssl build script will add to PATH. If you like to use the official sources instead of the files from python.org's subversion repository, Perl is required to build the diff --git a/Tools/buildbot/external-common.bat b/Tools/buildbot/external-common.bat --- a/Tools/buildbot/external-common.bat +++ b/Tools/buildbot/external-common.bat @@ -20,6 +20,10 @@ svn export http://svn.python.org/projects/external/bzip2-1.0.6 ) + at rem NASM, for OpenSSL build + at rem if exist nasm-2.11.06 rd /s/q nasm-2.11.06 +if not exist nasm-2.11.06 svn export http://svn.python.org/projects/external/nasm-2.11.06 + @rem OpenSSL if not exist openssl-1.0.1j ( rd /s/q openssl-1.0.1i -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 00:43:49 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 01 Nov 2014 23:43:49 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE3NzE3?= =?utf-8?q?=3A_Pull_NASM_from_svn=2Epython=2Eorg_for_OpenSSL_build=2E?= Message-ID: <20141101234349.35258.89627@psf.io> https://hg.python.org/cpython/rev/28d18fdc52c4 changeset: 93338:28d18fdc52c4 branch: 2.7 parent: 93332:ea7b64406396 user: Zachary Ware date: Sat Nov 01 17:11:08 2014 -0500 summary: Issue #17717: Pull NASM from svn.python.org for OpenSSL build. files: Misc/NEWS | 3 +++ PCbuild/build_ssl.py | 11 +++++++++++ PCbuild/readme.txt | 4 +++- Tools/buildbot/external-common.bat | 4 ++++ 4 files changed, 21 insertions(+), 1 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -305,6 +305,9 @@ Windows ------- +- Issue #17717: The Windows build scripts now use a copy of NASM pulled from + svn.python.org to build OpenSSL. + - Issue #22644: The bundled version of OpenSSL has been updated to 1.0.1j. diff --git a/PCbuild/build_ssl.py b/PCbuild/build_ssl.py --- a/PCbuild/build_ssl.py +++ b/PCbuild/build_ssl.py @@ -170,6 +170,17 @@ if ssl_dir is None: sys.exit(1) + # add our copy of NASM to PATH. It will be on the same level as openssl + for dir in os.listdir(os.path.join(ssl_dir, os.pardir)): + if dir.startswith('nasm'): + nasm_dir = os.path.join(ssl_dir, os.pardir, dir) + nasm_dir = os.path.abspath(nasm_dir) + os.environ['PATH'] += os.pathsep.join(['', nasm_dir]) + break + else: + print('NASM was not found, make sure it is on PATH') + + old_cd = os.getcwd() try: os.chdir(ssl_dir) diff --git a/PCbuild/readme.txt b/PCbuild/readme.txt --- a/PCbuild/readme.txt +++ b/PCbuild/readme.txt @@ -144,7 +144,9 @@ You must install the NASM assembler from http://nasm.sf.net - for x86 builds. Put nasm.exe anywhere in your PATH. + for x86 builds. Put nasm.exe anywhere in your PATH. 
If you use the + Tools\buildbot\external(-amd64).bat method for getting sources, it also + downloads a version of NASM, which the ssl build script will add to PATH. You can also install ActivePerl from http://www.activestate.com/activeperl/ diff --git a/Tools/buildbot/external-common.bat b/Tools/buildbot/external-common.bat --- a/Tools/buildbot/external-common.bat +++ b/Tools/buildbot/external-common.bat @@ -37,6 +37,10 @@ if exist db-4.4.20 rd /s/q db-4.4.20 if not exist db-4.7.25.0 svn export http://svn.python.org/projects/external/db-4.7.25.0 + at rem NASM, for OpenSSL build + at rem if exist nasm-2.11.06 rd /s/q nasm-2.11.06 +if not exist nasm-2.11.06 svn export http://svn.python.org/projects/external/nasm-2.11.06 + @rem OpenSSL if exist openssl-1.0.1i rd /s/q openssl-1.0.1i if not exist openssl-1.0.1j svn export http://svn.python.org/projects/external/openssl-1.0.1j -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 00:43:50 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 01 Nov 2014 23:43:50 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Null_merge_with_3=2E4?= Message-ID: <20141101234350.101680.86997@psf.io> https://hg.python.org/cpython/rev/58b1426981c4 changeset: 93340:58b1426981c4 parent: 93337:c2a3865a59f4 parent: 93339:f7ed3e058fca user: Zachary Ware date: Sat Nov 01 18:33:52 2014 -0500 summary: Null merge with 3.4 files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 00:43:53 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 01 Nov 2014 23:43:53 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2317717=3A_Pull_NAS?= =?utf-8?q?M_from_svn=2Epython=2Eorg_for_OpenSSL_build=2E?= Message-ID: <20141101234350.101684.64168@psf.io> https://hg.python.org/cpython/rev/ef15b51d59fb changeset: 93341:ef15b51d59fb user: Zachary Ware date: Sat Nov 01 18:42:46 2014 -0500 summary: Issue #17717: Pull NASM from svn.python.org for OpenSSL build. files: Misc/NEWS | 3 +++ PCbuild/get_externals.bat | 8 +++++--- PCbuild/pyproject.props | 4 ++++ PCbuild/readme.txt | 8 ++++---- PCbuild/ssl.vcxproj | 8 ++++++++ 5 files changed, 24 insertions(+), 7 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -1383,6 +1383,9 @@ Windows ------- +- Issue #17717: The Windows build scripts now use a copy of NASM pulled from + svn.python.org to build OpenSSL. + - Issue #21907: Improved the batch scripts provided for building Python. - Issue #22644: The bundled version of OpenSSL has been updated to 1.0.1j. diff --git a/PCbuild/get_externals.bat b/PCbuild/get_externals.bat --- a/PCbuild/get_externals.bat +++ b/PCbuild/get_externals.bat @@ -20,6 +20,7 @@ for /D %%d in ( bzip2-* db-* + nasm-* openssl-* tcl-* tcltk* @@ -51,6 +52,7 @@ for %%e in ( bzip2-1.0.6 + nasm-2.11.06 openssl-1.0.1j tcl-8.6.1.0 tk-8.6.1.0 @@ -87,9 +89,9 @@ echo.**WARNING**: the cleaning options unconditionally remove any directory echo.that is a child of echo. %CD% -echo.and matches wildcard patterns beginning with bzip2-, db-, openssl-, tcl-, -echo.tcltk, tk-, tix-, sqlite-, or xz-, and as such has the potential to be -echo.very destructive if you are not aware of what it is doing. Use with +echo.and matches wildcard patterns beginning with bzip2-, db-, nasm-, openssl-, +echo.tcl-, tcltk, tk-, tix-, sqlite-, or xz-, and as such has the potential +echo.to be very destructive if you are not aware of what it is doing. Use with echo.caution! 
popd exit /b -1 diff --git a/PCbuild/pyproject.props b/PCbuild/pyproject.props --- a/PCbuild/pyproject.props +++ b/PCbuild/pyproject.props @@ -20,6 +20,7 @@ $(externalsDir)\sqlite-3.8.3.1 $(externalsDir)\bzip2-1.0.6 $(externalsDir)\xz-5.0.5 + $(externalsDir)\nasm-2.11.06 $(externalsDir)\openssl-1.0.1j $(externalsDir)\tcl-8.6.1.0 $(externalsDir)\tk-8.6.1.0 @@ -77,6 +78,9 @@ $(lzmaDir) + + $(nasmDir) + $(opensslDir) diff --git a/PCbuild/readme.txt b/PCbuild/readme.txt --- a/PCbuild/readme.txt +++ b/PCbuild/readme.txt @@ -3,9 +3,8 @@ 1. Install Microsoft Visual C++ 2010 SP1, any edition. 2. Install Subversion, and make sure 'svn.exe' is on your PATH. -3. Install NASM, and make sure 'nasm.exe' is on your PATH. -4. Run "build.bat -e" to build Python in 32-bit Release configuration. -5. (Optional, but recommended) Run the test suite with "rt.bat -q". +3. Run "build.bat -e" to build Python in 32-bit Release configuration. +4. (Optional, but recommended) Run the test suite with "rt.bat -q". Building Python using Microsoft Visual C++ @@ -225,7 +224,8 @@ to be somewhere on your PATH. More recent versions of OpenSSL may need a later version of NASM. If OpenSSL's self tests don't pass, you should first try to update NASM and do a full rebuild of - OpenSSL. + OpenSSL. get_externals.py also downloads a snapshot of NASM, and the + ssl sub-project includes that version of nasm.exe on PATH. The ssl sub-project expects your OpenSSL sources to have already been configured and be ready to build. If you get your sources diff --git a/PCbuild/ssl.vcxproj b/PCbuild/ssl.vcxproj --- a/PCbuild/ssl.vcxproj +++ b/PCbuild/ssl.vcxproj @@ -119,6 +119,7 @@ <_ProjectFileVersion>10.0.30319.1 +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" copy /Y crypto\buildinf_x86.h crypto\buildinf.h copy /Y crypto\opensslconf_x86.h crypto\opensslconf.h @@ -133,6 +134,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" nasm -f win64 -DNEAR -Ox -g ms\\uptable.asm || echo nasm failed! && exit copy /Y crypto\buildinf_amd64.h crypto\buildinf.h @@ -148,6 +150,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" copy /Y crypto\buildinf_x86.h crypto\buildinf.h copy /Y crypto\opensslconf_x86.h crypto\opensslconf.h @@ -162,6 +165,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" nasm -f win64 -DNEAR -Ox -g ms\\uptable.asm || echo nasm failed! && exit copy /Y crypto\buildinf_amd64.h crypto\buildinf.h @@ -177,6 +181,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" copy /Y crypto\buildinf_x86.h crypto\buildinf.h copy /Y crypto\opensslconf_x86.h crypto\opensslconf.h @@ -191,6 +196,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" nasm -f win64 -DNEAR -Ox -g ms\\uptable.asm || echo nasm failed! 
&& exit copy /Y crypto\buildinf_amd64.h crypto\buildinf.h @@ -206,6 +212,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" copy /Y crypto\buildinf_x86.h crypto\buildinf.h copy /Y crypto\opensslconf_x86.h crypto\opensslconf.h @@ -220,6 +227,7 @@ $(NMakeAssemblySearchPath) $(NMakeForcedUsingAssemblies) +path %PATH%;$(SolutionDir)$(nasmDir) cd "$(SolutionDir)$(opensslDir)" nasm -f win64 -DNEAR -Ox -g ms\\uptable.asm || echo nasm failed! && exit copy /Y crypto\buildinf_amd64.h crypto\buildinf.h -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 03:34:01 2014 From: python-checkins at python.org (ned.deily) Date: Sun, 02 Nov 2014 02:34:01 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNzcw?= =?utf-8?q?=3A_Prevent_some_Tk_segfaults_on_OS_X_when_running_gui_tests=2E?= Message-ID: <20141102023400.111410.59186@psf.io> https://hg.python.org/cpython/rev/bd4dc351d670 changeset: 93342:bd4dc351d670 branch: 2.7 parent: 93338:28d18fdc52c4 user: Ned Deily date: Sat Nov 01 19:26:45 2014 -0700 summary: Issue #22770: Prevent some Tk segfaults on OS X when running gui tests. When running tests in subprocesses with the regrtest -j option, a bug in Cocoa Tk can result in a Tcl segfault. Avoid the problem by forcing Tk to fully initialize as an OS X gui process before destroying the Tcl instance and creating another. (Original patch by Serhiy Storchaka) files: Lib/test/test_support.py | 5 ++--- Misc/NEWS | 2 ++ 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_support.py b/Lib/test/test_support.py --- a/Lib/test/test_support.py +++ b/Lib/test/test_support.py @@ -326,12 +326,11 @@ reason = "cannot run without OS X gui process" # check on every platform whether tkinter can actually do anything - # but skip the test on OS X because it can cause segfaults in Cocoa Tk - # when running regrtest with the -j option (multiple threads/subprocesses) - if (not reason) and (sys.platform != 'darwin'): + if not reason: try: from Tkinter import Tk root = Tk() + root.update() root.destroy() except Exception as e: err_string = str(e) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -277,6 +277,8 @@ - Issue #21976: Fix test_ssl to accept LibreSSL version strings. Thanks to William Orr. +- Issue #22770: Prevent some Tk segfaults on OS X when running gui tests. 
+ Build ----- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 03:34:01 2014 From: python-checkins at python.org (ned.deily) Date: Sun, 02 Nov 2014 02:34:01 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322770=3A_merge_from_3=2E4?= Message-ID: <20141102023401.101684.26236@psf.io> https://hg.python.org/cpython/rev/e119343bc3ec changeset: 93344:e119343bc3ec parent: 93341:ef15b51d59fb parent: 93343:121517deb318 user: Ned Deily date: Sat Nov 01 19:33:25 2014 -0700 summary: Issue #22770: merge from 3.4 files: Lib/test/support/__init__.py | 5 ++--- Misc/NEWS | 2 ++ 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -461,12 +461,11 @@ reason = "cannot run without OS X gui process" # check on every platform whether tkinter can actually do anything - # but skip the test on OS X because it can cause segfaults in Cocoa Tk - # when running regrtest with the -j option (multiple threads/subprocesses) - if (not reason) and (sys.platform != 'darwin'): + if not reason: try: from tkinter import Tk root = Tk() + root.update() root.destroy() except Exception as e: err_string = str(e) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -1342,6 +1342,8 @@ - Issue #21093: Prevent failures of ctypes test_macholib on OS X if a copy of libz exists in $HOME/lib or /usr/local/lib. +- Issue #22770: Prevent some Tk segfaults on OS X when running gui tests. + Tools/Demos ----------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 03:34:01 2014 From: python-checkins at python.org (ned.deily) Date: Sun, 02 Nov 2014 02:34:01 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNzcw?= =?utf-8?q?=3A_Prevent_some_Tk_segfaults_on_OS_X_when_running_gui_tests=2E?= Message-ID: <20141102023401.109276.44229@psf.io> https://hg.python.org/cpython/rev/121517deb318 changeset: 93343:121517deb318 branch: 3.4 parent: 93339:f7ed3e058fca user: Ned Deily date: Sat Nov 01 19:29:22 2014 -0700 summary: Issue #22770: Prevent some Tk segfaults on OS X when running gui tests. When running tests in subprocesses with the regrtest -j option, a bug in Cocoa Tk can result in a Tcl segfault. Avoid the problem by forcing Tk to fully initialize as an OS X gui process before destroying the Tcl instance and creating another. (Original patch by Serhiy Storchaka) files: Lib/test/support/__init__.py | 5 ++--- Misc/NEWS | 2 ++ 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -461,12 +461,11 @@ reason = "cannot run without OS X gui process" # check on every platform whether tkinter can actually do anything - # but skip the test on OS X because it can cause segfaults in Cocoa Tk - # when running regrtest with the -j option (multiple threads/subprocesses) - if (not reason) and (sys.platform != 'darwin'): + if not reason: try: from tkinter import Tk root = Tk() + root.update() root.destroy() except Exception as e: err_string = str(e) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -113,6 +113,8 @@ - Issue #21456: Skip two tests in test_urllib2net.py if _ssl module not present. Patch by Remi Pointel. 
+- Issue #22770: Prevent some Tk segfaults on OS X when running gui tests. + Build ----- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 04:50:08 2014 From: python-checkins at python.org (zach.ware) Date: Sun, 02 Nov 2014 03:50:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE3ODk2?= =?utf-8?q?=3A_Move_Windows_external_lib_sources_from_=2E=2E_to_externals?= =?utf-8?q?=2E?= Message-ID: <20141102035008.101682.70902@psf.io> https://hg.python.org/cpython/rev/b5e9bc4352e1 changeset: 93346:b5e9bc4352e1 branch: 3.4 parent: 93343:121517deb318 user: Zachary Ware date: Sat Nov 01 22:39:21 2014 -0500 summary: Issue #17896: Move Windows external lib sources from .. to externals. files: .gitignore | 1 + .hgignore | 1 + Lib/tkinter/_fix.py | 4 ++-- Misc/NEWS | 3 +++ PCbuild/build_ssl.py | 2 +- PCbuild/pyproject.props | 2 +- PCbuild/readme.txt | 13 +++++++------ PCbuild/rt.bat | 2 +- Tools/buildbot/external-common.bat | 3 ++- 9 files changed, 19 insertions(+), 12 deletions(-) diff --git a/.gitignore b/.gitignore --- a/.gitignore +++ b/.gitignore @@ -70,4 +70,5 @@ TAGS .coverage coverage/ +externals/ htmlcov/ diff --git a/.hgignore b/.hgignore --- a/.hgignore +++ b/.hgignore @@ -92,6 +92,7 @@ Modules/_testembed .coverage coverage/ +externals/ htmlcov/ *.gcda *.gcno diff --git a/Lib/tkinter/_fix.py b/Lib/tkinter/_fix.py --- a/Lib/tkinter/_fix.py +++ b/Lib/tkinter/_fix.py @@ -48,8 +48,8 @@ prefix = os.path.join(sys.base_prefix,"tcl") if not os.path.exists(prefix): - # devdir/../tcltk/lib - prefix = os.path.join(sys.base_prefix, os.path.pardir, "tcltk", "lib") + # devdir/externals/tcltk/lib + prefix = os.path.join(sys.base_prefix, "externals", "tcltk", "lib") prefix = os.path.abspath(prefix) # if this does not exist, no further search is needed if os.path.exists(prefix): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -128,6 +128,9 @@ Windows ------- +- Issue #17896: The Windows build scripts now expect external library sources + to be in ``PCbuild\..\externals`` rather than ``PCbuild\..\..``. + - Issue #17717: The Windows build scripts now use a copy of NASM pulled from svn.python.org to build OpenSSL. diff --git a/PCbuild/build_ssl.py b/PCbuild/build_ssl.py --- a/PCbuild/build_ssl.py +++ b/PCbuild/build_ssl.py @@ -68,7 +68,7 @@ propfile = (os.path.join(os.path.dirname(__file__), 'pyproject.props')) with open(propfile, encoding='utf-8-sig') as f: m = re.search('openssl-([^<]+)<', f.read()) - return "..\..\openssl-"+m.group(1) + return "..\externals\openssl-"+m.group(1) def create_makefile64(makefile, m32): diff --git a/PCbuild/pyproject.props b/PCbuild/pyproject.props --- a/PCbuild/pyproject.props +++ b/PCbuild/pyproject.props @@ -16,7 +16,7 @@ python34$(PyDebugExt) $(OutDir)python$(PyDebugExt).exe $(OutDir)kill_python$(PyDebugExt).exe - ..\.. + ..\externals $(externalsDir)\sqlite-3.8.3.1 $(externalsDir)\bzip2-1.0.6 $(externalsDir)\xz-5.0.5 diff --git a/PCbuild/readme.txt b/PCbuild/readme.txt --- a/PCbuild/readme.txt +++ b/PCbuild/readme.txt @@ -224,9 +224,10 @@ Unlike the other external libraries listed above, Tk must be built separately before the _tkinter module can be built. This means that - a pre-built Tcl/Tk installation is expected in ..\..\tcltk (tcltk64 - for 64-bit) relative to this directory. See "Getting External - Sources" below for the easiest method to ensure Tcl/Tk is built. + a pre-built Tcl/Tk installation is expected in ..\externals\tcltk + (tcltk64 for 64-bit) relative to this directory. 
See "Getting + External Sources" below for the easiest method to ensure Tcl/Tk is + built. Getting External Sources @@ -246,12 +247,12 @@ This extracts all the external sub-projects from http://svn.python.org/projects/external via Subversion (so you'll need an svn.exe on your PATH) and places them -in ..\.. (relative to this directory). +in ..\externals (relative to this directory). It is also possible to download sources from each project's homepage, though you may have to change the names of some folders in order to make things work. For instance, if you were to download a version 5.0.7 of -XZ Utils, you would need to extract the archive into ..\..\xz-5.0.5 +XZ Utils, you would need to extract the archive into ..\externals\xz-5.0.5 anyway, since that is where the solution is set to look for xz. The same is true for all other external projects. @@ -268,7 +269,7 @@ So for a release build, you'd call it as: nmake -f makefile.vc MACHINE=AMD64 INSTALLDIR=..\..\tcltk64 clean all install -Note that the above command is called from within ..\..\tcl-8.6.1.0\win +Note that the above command is called from within ..\externals\tcl-8.6.1.0\win (relative to this directory); don't forget to build Tk as well as Tcl! This will be cleaned up in the future; http://bugs.python.org/issue15968 diff --git a/PCbuild/rt.bat b/PCbuild/rt.bat --- a/PCbuild/rt.bat +++ b/PCbuild/rt.bat @@ -38,7 +38,7 @@ if "%1"=="-d" (set suffix=_d) & shift & goto CheckOpts if "%1"=="-x64" (set prefix=amd64) & (set tcltk=tcltk64) & shift & goto CheckOpts -PATH %PATH%;%~dp0..\..\%tcltk%\bin +PATH %PATH%;%~dp0..\externals\%tcltk%\bin set exe=%prefix%\python%suffix% set cmd=%exe% %dashO% -Wd -E -bb ../lib/test/regrtest.py %1 %2 %3 %4 %5 %6 %7 %8 %9 if defined qmode goto Qmode diff --git a/Tools/buildbot/external-common.bat b/Tools/buildbot/external-common.bat --- a/Tools/buildbot/external-common.bat +++ b/Tools/buildbot/external-common.bat @@ -1,7 +1,8 @@ @rem Common file shared between external.bat and external-amd64.bat. Responsible for @rem fetching external components into the root\.. buildbot directories. -cd .. +if not exist externals mkdir externals +cd externals @rem XXX: If you need to force the buildbots to start from a fresh environment, uncomment @rem the following, check it in, then check it out, comment it out, then check it back in. @rem if exist bzip2-1.0.6 rd /s/q bzip2-1.0.6 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 04:50:08 2014 From: python-checkins at python.org (zach.ware) Date: Sun, 02 Nov 2014 03:50:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE3ODk2?= =?utf-8?q?=3A_Move_Windows_external_lib_sources_from_=2E=2E_to_externals?= =?utf-8?q?=2E?= Message-ID: <20141102035008.109258.13410@psf.io> https://hg.python.org/cpython/rev/62ce0f623154 changeset: 93345:62ce0f623154 branch: 2.7 parent: 93342:bd4dc351d670 user: Zachary Ware date: Sat Nov 01 22:34:09 2014 -0500 summary: Issue #17896: Move Windows external lib sources from .. to externals. 
files: .gitignore | 1 + .hgignore | 1 + Lib/lib-tk/FixTk.py | 4 +- Misc/NEWS | 3 + PCbuild/build_ssl.py | 2 +- PCbuild/pyproject.vsprops | 2 +- PCbuild/readme.txt | 40 ++--------------- PCbuild/rt.bat | 2 +- Tools/buildbot/external-common.bat | 5 +- 9 files changed, 18 insertions(+), 42 deletions(-) diff --git a/.gitignore b/.gitignore --- a/.gitignore +++ b/.gitignore @@ -43,4 +43,5 @@ tags .coverage coverage/ +externals/ htmlcov/ diff --git a/.hgignore b/.hgignore --- a/.hgignore +++ b/.hgignore @@ -61,4 +61,5 @@ PCbuild/Win32-temp-* .coverage coverage/ +externals/ htmlcov/ diff --git a/Lib/lib-tk/FixTk.py b/Lib/lib-tk/FixTk.py --- a/Lib/lib-tk/FixTk.py +++ b/Lib/lib-tk/FixTk.py @@ -48,8 +48,8 @@ prefix = os.path.join(sys.prefix,"tcl") if not os.path.exists(prefix): - # devdir/../tcltk/lib - prefix = os.path.join(sys.prefix, os.path.pardir, "tcltk", "lib") + # devdir/externals/tcltk/lib + prefix = os.path.join(sys.prefix, "externals", "tcltk", "lib") prefix = os.path.abspath(prefix) # if this does not exist, no further search is needed if os.path.exists(prefix): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -307,6 +307,9 @@ Windows ------- +- Issue #17896: The Windows build scripts now expect external library sources + to be in ``PCbuild\..\externals`` rather than ``PCbuild\..\..``. + - Issue #17717: The Windows build scripts now use a copy of NASM pulled from svn.python.org to build OpenSSL. diff --git a/PCbuild/build_ssl.py b/PCbuild/build_ssl.py --- a/PCbuild/build_ssl.py +++ b/PCbuild/build_ssl.py @@ -69,7 +69,7 @@ propfile = (os.path.join(os.path.dirname(__file__), 'pyproject.vsprops')) with open(propfile) as f: m = re.search('openssl-([^"]+)"', f.read()) - return "..\..\openssl-"+m.group(1) + return "..\externals\openssl-"+m.group(1) def create_makefile64(makefile, m32): diff --git a/PCbuild/pyproject.vsprops b/PCbuild/pyproject.vsprops --- a/PCbuild/pyproject.vsprops +++ b/PCbuild/pyproject.vsprops @@ -46,7 +46,7 @@ /> linkd.exe external ..\..\trunk\external - Link created at: external - - Only a slight tweak would be needed to the buildbots such that bots - building trunk and py3k could make use of the same facility. (2.5.x - builds need to be kept separate as they're using Visual Studio 7.1.) -/XXX trent.nelson 02-Apr-08 - Building for Itanium -------------------- diff --git a/PCbuild/rt.bat b/PCbuild/rt.bat --- a/PCbuild/rt.bat +++ b/PCbuild/rt.bat @@ -38,7 +38,7 @@ if "%1"=="-d" (set suffix=_d) & shift & goto CheckOpts if "%1"=="-x64" (set prefix=amd64) & (set tcltk=tcltk64) & shift & goto CheckOpts -PATH %PATH%;%~dp0..\..\%tcltk%\bin +PATH %PATH%;%~dp0..\externals\%tcltk%\bin set exe=%prefix%\python%suffix% set cmd=%exe% %dashO% -Wd -3 -E -tt ../lib/test/regrtest.py %1 %2 %3 %4 %5 %6 %7 %8 %9 if defined qmode goto Qmode diff --git a/Tools/buildbot/external-common.bat b/Tools/buildbot/external-common.bat --- a/Tools/buildbot/external-common.bat +++ b/Tools/buildbot/external-common.bat @@ -1,7 +1,8 @@ @rem Common file shared between external.bat and external-amd64.bat. Responsible for - at rem fetching external components into the root\.. buildbot directories. + at rem fetching external components into the root\externals directory. -cd .. +if not exist externals mkdir externals +cd externals @rem XXX: If you need to force the buildbots to start from a fresh environment, uncomment @rem the following, check it in, then check it out, comment it out, then check it back in. 
@rem if exist bzip2-1.0.6 rd /s/q bzip2-1.0.6 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 04:50:12 2014 From: python-checkins at python.org (zach.ware) Date: Sun, 02 Nov 2014 03:50:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2317896=3A_Move_Windows_external_lib_sources_from?= =?utf-8?q?_=2E=2E_to_externals=2E?= Message-ID: <20141102035008.109264.23418@psf.io> https://hg.python.org/cpython/rev/64a54f0c87d7 changeset: 93347:64a54f0c87d7 parent: 93344:e119343bc3ec parent: 93346:b5e9bc4352e1 user: Zachary Ware date: Sat Nov 01 22:48:24 2014 -0500 summary: Issue #17896: Move Windows external lib sources from .. to externals. files: .gitignore | 1 + .hgignore | 1 + Lib/tkinter/_fix.py | 4 ++-- Misc/NEWS | 3 +++ PCbuild/get_externals.bat | 3 ++- PCbuild/pyproject.props | 2 +- PCbuild/readme.txt | 2 +- Tools/buildbot/test-amd64.bat | 2 +- Tools/buildbot/test.bat | 2 +- 9 files changed, 13 insertions(+), 7 deletions(-) diff --git a/.gitignore b/.gitignore --- a/.gitignore +++ b/.gitignore @@ -80,4 +80,5 @@ TAGS .coverage coverage/ +externals/ htmlcov/ diff --git a/.hgignore b/.hgignore --- a/.hgignore +++ b/.hgignore @@ -93,6 +93,7 @@ Programs/_testembed .coverage coverage/ +externals/ htmlcov/ *.gcda *.gcno diff --git a/Lib/tkinter/_fix.py b/Lib/tkinter/_fix.py --- a/Lib/tkinter/_fix.py +++ b/Lib/tkinter/_fix.py @@ -48,8 +48,8 @@ prefix = os.path.join(sys.base_prefix,"tcl") if not os.path.exists(prefix): - # devdir/../tcltk/lib - prefix = os.path.join(sys.base_prefix, os.path.pardir, "tcltk", "lib") + # devdir/externals/tcltk/lib + prefix = os.path.join(sys.base_prefix, "externals", "tcltk", "lib") prefix = os.path.abspath(prefix) # if this does not exist, no further search is needed if os.path.exists(prefix): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -1385,6 +1385,9 @@ Windows ------- +- Issue #17896: The Windows build scripts now expect external library sources + to be in ``PCbuild\..\externals`` rather than ``PCbuild\..\..``. + - Issue #17717: The Windows build scripts now use a copy of NASM pulled from svn.python.org to build OpenSSL. diff --git a/PCbuild/get_externals.bat b/PCbuild/get_externals.bat --- a/PCbuild/get_externals.bat +++ b/PCbuild/get_externals.bat @@ -2,7 +2,8 @@ setlocal rem Simple script to fetch source for external libraries -pushd "%~dp0..\.." +if not exist "%~dp0..\externals" mkdir "%~dp0..\externals" +pushd "%~dp0..\externals" if "%SVNROOT%"=="" set SVNROOT=http://svn.python.org/projects/external/ diff --git a/PCbuild/pyproject.props b/PCbuild/pyproject.props --- a/PCbuild/pyproject.props +++ b/PCbuild/pyproject.props @@ -16,7 +16,7 @@ python35$(PyDebugExt) $(OutDir)python$(PyDebugExt).exe $(OutDir)kill_python$(PyDebugExt).exe - ..\.. + ..\externals $(externalsDir)\sqlite-3.8.3.1 $(externalsDir)\bzip2-1.0.6 $(externalsDir)\xz-5.0.5 diff --git a/PCbuild/readme.txt b/PCbuild/readme.txt --- a/PCbuild/readme.txt +++ b/PCbuild/readme.txt @@ -278,7 +278,7 @@ directory. This script extracts all the external sub-projects from http://svn.python.org/projects/external via Subversion (so you'll need svn.exe on your PATH) and places them -in ..\.. (relative to this directory). +in ..\externals (relative to this directory). 
It is also possible to download sources from each project's homepage, though you may have to change folder names or pass the names to MSBuild diff --git a/Tools/buildbot/test-amd64.bat b/Tools/buildbot/test-amd64.bat --- a/Tools/buildbot/test-amd64.bat +++ b/Tools/buildbot/test-amd64.bat @@ -2,6 +2,6 @@ setlocal rem The following line should be removed before #20035 is closed -set TCL_LIBRARY=%~dp0..\..\..\tcltk64\lib\tcl8.6 +set TCL_LIBRARY=%~dp0..\..\externals\tcltk64\lib\tcl8.6 call "%~dp0..\..\PCbuild\rt.bat" -d -q -x64 -uall -rwW -n --timeout=3600 %* diff --git a/Tools/buildbot/test.bat b/Tools/buildbot/test.bat --- a/Tools/buildbot/test.bat +++ b/Tools/buildbot/test.bat @@ -2,6 +2,6 @@ setlocal rem The following line should be removed before #20035 is closed -set TCL_LIBRARY=%~dp0..\..\..\tcltk\lib\tcl8.6 +set TCL_LIBRARY=%~dp0..\..\externals\tcltk\lib\tcl8.6 call "%~dp0..\..\PCbuild\rt.bat" -d -q -uall -rwW -n --timeout=3600 %* -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sun Nov 2 10:04:17 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sun, 02 Nov 2014 10:04:17 +0100 Subject: [Python-checkins] Daily reference leaks (ef15b51d59fb): sum=3 Message-ID: results for ef15b51d59fb on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogLigs4a', '-x'] From python-checkins at python.org Sun Nov 2 17:13:57 2014 From: python-checkins at python.org (ezio.melotti) Date: Sun, 02 Nov 2014 16:13:57 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Fix_commas_and_whitespace_in_?= =?utf-8?q?PEP_473=2E?= Message-ID: <20141102161355.35250.45664@psf.io> https://hg.python.org/peps/rev/8e9097a145dd changeset: 5592:8e9097a145dd user: Ezio Melotti date: Sun Nov 02 18:13:45 2014 +0200 summary: Fix commas and whitespace in PEP 473. files: pep-0473.txt | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/pep-0473.txt b/pep-0473.txt --- a/pep-0473.txt +++ b/pep-0473.txt @@ -14,7 +14,7 @@ ======== Exceptions like ``AttributeError``, ``IndexError``, ``KeyError``, -``LookupError``, ``NameError``, , ``TypeError`` and ``ValueError`` do not +``LookupError``, ``NameError``, ``TypeError``, and ``ValueError`` do not provide all information required by programmers to debug and better understand what caused them. Furthermore, in some cases the messages even have slightly different formats, @@ -47,7 +47,7 @@ A similar proposal [2]_ has been implemented for ``ImportError`` and in the same fashion this idea has received support [3]_. Additionally, almost 10 years ago Guido asked in [11]_ to have a clean API to access the affected objects in -Exceptions like ``KeyError``, ``AttributeError``, ``NameError`` and +Exceptions like ``KeyError``, ``AttributeError``, ``NameError``, and ``IndexError``. Similar issues and proposals ideas have been written in the last year. Some other issues have been created, but despite receiving support they finally get abandoned. 
References to the created issues are listed below: @@ -157,7 +157,7 @@ ======== Extend the exceptions ``AttributeError``, ``IndexError``, ``KeyError``, -``LookupError``, ``NameError``, , ``TypeError`` and ``ValueError`` with the +``LookupError``, ``NameError``, ``TypeError``, and ``ValueError`` with the following: * ``AttributeError``: target :sup:`w`, attribute -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 2 18:15:42 2014 From: python-checkins at python.org (ezio.melotti) Date: Sun, 02 Nov 2014 17:15:42 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogIzIyNzUxOiBmaXgg?= =?utf-8?q?test=5F=5F=5Fall=5F=5F_warning_about_modified_environment_in_th?= =?utf-8?q?e_tests=2E?= Message-ID: <20141102171539.109268.76886@psf.io> https://hg.python.org/cpython/rev/16dfefe67c1f changeset: 93349:16dfefe67c1f branch: 2.7 parent: 93345:62ce0f623154 user: Ezio Melotti date: Sun Nov 02 19:08:35 2014 +0200 summary: #22751: fix test___all__ warning about modified environment in the tests. Patch by Michael Cetrulo. files: Lib/test/test___all__.py | 7 ++++--- Misc/ACKS | 1 + 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Lib/test/test___all__.py b/Lib/test/test___all__.py --- a/Lib/test/test___all__.py +++ b/Lib/test/test___all__.py @@ -75,13 +75,14 @@ # rlcompleter needs special consideration; it imports readline which # initializes GNU readline which calls setlocale(LC_CTYPE, "")... :-( + import locale + locale_tuple = locale.getlocale(locale.LC_CTYPE) try: import rlcompleter - import locale except ImportError: pass - else: - locale.setlocale(locale.LC_CTYPE, 'C') + finally: + locale.setlocale(locale.LC_CTYPE, locale_tuple) ignored = [] failed_imports = [] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -218,6 +218,7 @@ Matej Cepl Carl Cerecke Octavian Cerna +Michael Cetrulo Dave Chambers Pascal Chambon John Chandler -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:15:43 2014 From: python-checkins at python.org (ezio.melotti) Date: Sun, 02 Nov 2014 17:15:43 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogIzIyNzUxOiBtZXJnZSB3aXRoIDMuNC4=?= Message-ID: <20141102171539.120722.54329@psf.io> https://hg.python.org/cpython/rev/3c030e4da7c6 changeset: 93350:3c030e4da7c6 parent: 93347:64a54f0c87d7 parent: 93348:37ed6eed0595 user: Ezio Melotti date: Sun Nov 02 19:14:54 2014 +0200 summary: #22751: merge with 3.4. files: Lib/test/test___all__.py | 7 ++++--- Misc/ACKS | 1 + 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Lib/test/test___all__.py b/Lib/test/test___all__.py --- a/Lib/test/test___all__.py +++ b/Lib/test/test___all__.py @@ -72,13 +72,14 @@ # rlcompleter needs special consideration; it import readline which # initializes GNU readline which calls setlocale(LC_CTYPE, "")... 
:-( + import locale + locale_tuple = locale.getlocale(locale.LC_CTYPE) try: import rlcompleter - import locale except ImportError: pass - else: - locale.setlocale(locale.LC_CTYPE, 'C') + finally: + locale.setlocale(locale.LC_CTYPE, locale_tuple) ignored = [] failed_imports = [] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -224,6 +224,7 @@ Matej Cepl Carl Cerecke Octavian Cerna +Michael Cetrulo Dave Chambers Pascal Chambon John Chandler -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:15:43 2014 From: python-checkins at python.org (ezio.melotti) Date: Sun, 02 Nov 2014 17:15:43 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogIzIyNzUxOiBmaXgg?= =?utf-8?q?test=5F=5F=5Fall=5F=5F_warning_about_modified_environment_in_th?= =?utf-8?q?e_tests=2E?= Message-ID: <20141102171539.101688.28249@psf.io> https://hg.python.org/cpython/rev/37ed6eed0595 changeset: 93348:37ed6eed0595 branch: 3.4 parent: 93346:b5e9bc4352e1 user: Ezio Melotti date: Sun Nov 02 19:08:35 2014 +0200 summary: #22751: fix test___all__ warning about modified environment in the tests. Patch by Michael Cetrulo. files: Lib/test/test___all__.py | 7 ++++--- Misc/ACKS | 1 + 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Lib/test/test___all__.py b/Lib/test/test___all__.py --- a/Lib/test/test___all__.py +++ b/Lib/test/test___all__.py @@ -72,13 +72,14 @@ # rlcompleter needs special consideration; it import readline which # initializes GNU readline which calls setlocale(LC_CTYPE, "")... :-( + import locale + locale_tuple = locale.getlocale(locale.LC_CTYPE) try: import rlcompleter - import locale except ImportError: pass - else: - locale.setlocale(locale.LC_CTYPE, 'C') + finally: + locale.setlocale(locale.LC_CTYPE, locale_tuple) ignored = [] failed_imports = [] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -222,6 +222,7 @@ Matej Cepl Carl Cerecke Octavian Cerna +Michael Cetrulo Dave Chambers Pascal Chambon John Chandler -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:29:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 17:29:27 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMy40IC0+IDMuNCk6?= =?utf-8?q?_Merge_heads?= Message-ID: <20141102172927.35248.50233@psf.io> https://hg.python.org/cpython/rev/a5dd8e89d4da changeset: 93353:a5dd8e89d4da branch: 3.4 parent: 93351:e3825486da53 parent: 93348:37ed6eed0595 user: Serhiy Storchaka date: Sun Nov 02 19:26:23 2014 +0200 summary: Merge heads files: Lib/test/test___all__.py | 7 ++++--- Misc/ACKS | 1 + 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Lib/test/test___all__.py b/Lib/test/test___all__.py --- a/Lib/test/test___all__.py +++ b/Lib/test/test___all__.py @@ -72,13 +72,14 @@ # rlcompleter needs special consideration; it import readline which # initializes GNU readline which calls setlocale(LC_CTYPE, "")... 
:-( + import locale + locale_tuple = locale.getlocale(locale.LC_CTYPE) try: import rlcompleter - import locale except ImportError: pass - else: - locale.setlocale(locale.LC_CTYPE, 'C') + finally: + locale.setlocale(locale.LC_CTYPE, locale_tuple) ignored = [] failed_imports = [] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -222,6 +222,7 @@ Matej Cepl Carl Cerecke Octavian Cerna +Michael Cetrulo Dave Chambers Pascal Chambon John Chandler -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:29:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 17:29:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Null_merge?= Message-ID: <20141102172927.120714.44184@psf.io> https://hg.python.org/cpython/rev/769a217764f2 changeset: 93355:769a217764f2 parent: 93354:0ea8a5bdc2f0 parent: 93353:a5dd8e89d4da user: Serhiy Storchaka date: Sun Nov 02 19:26:48 2014 +0200 summary: Null merge files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:29:28 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 17:29:28 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_default_-=3E_default?= =?utf-8?q?=29=3A_Merge_heads?= Message-ID: <20141102172927.35270.83839@psf.io> https://hg.python.org/cpython/rev/0ea8a5bdc2f0 changeset: 93354:0ea8a5bdc2f0 parent: 93352:5f10a4a1e4df parent: 93350:3c030e4da7c6 user: Serhiy Storchaka date: Sun Nov 02 19:26:28 2014 +0200 summary: Merge heads files: Lib/test/test___all__.py | 7 ++++--- Misc/ACKS | 1 + 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Lib/test/test___all__.py b/Lib/test/test___all__.py --- a/Lib/test/test___all__.py +++ b/Lib/test/test___all__.py @@ -72,13 +72,14 @@ # rlcompleter needs special consideration; it import readline which # initializes GNU readline which calls setlocale(LC_CTYPE, "")... :-( + import locale + locale_tuple = locale.getlocale(locale.LC_CTYPE) try: import rlcompleter - import locale except ImportError: pass - else: - locale.setlocale(locale.LC_CTYPE, 'C') + finally: + locale.setlocale(locale.LC_CTYPE, locale_tuple) ignored = [] failed_imports = [] diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -224,6 +224,7 @@ Matej Cepl Carl Cerecke Octavian Cerna +Michael Cetrulo Dave Chambers Pascal Chambon John Chandler -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:29:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 17:29:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322388=3A_Unified_the_style_of_=22Contributed_by?= =?utf-8?q?=22_sentences_in_What=27s_New=2E?= Message-ID: <20141102172926.35260.88422@psf.io> https://hg.python.org/cpython/rev/5f10a4a1e4df changeset: 93352:5f10a4a1e4df parent: 93347:64a54f0c87d7 parent: 93351:e3825486da53 user: Serhiy Storchaka date: Sun Nov 02 19:22:02 2014 +0200 summary: Issue #22388: Unified the style of "Contributed by" sentences in What's New. 
files: Doc/whatsnew/3.3.rst | 102 ++++++++++++++-------------- Doc/whatsnew/3.4.rst | 112 +++++++++++++++--------------- Doc/whatsnew/3.5.rst | 61 ++++++++-------- 3 files changed, 138 insertions(+), 137 deletions(-) diff --git a/Doc/whatsnew/3.3.rst b/Doc/whatsnew/3.3.rst --- a/Doc/whatsnew/3.3.rst +++ b/Doc/whatsnew/3.3.rst @@ -171,7 +171,7 @@ * Multi-dimensional comparisons are supported for any array type. * One-dimensional memoryviews of hashable (read-only) types with formats B, - b or c are now hashable. (Contributed by Antoine Pitrou in :issue:`13411`) + b or c are now hashable. (Contributed by Antoine Pitrou in :issue:`13411`.) * Arbitrary slicing of any 1-D arrays type is supported. For example, it is now possible to reverse a memoryview in O(1) by using a negative step. @@ -196,7 +196,7 @@ * For further changes see `Build and C API Changes`_ and `Porting C code`_. -(Contributed by Stefan Krah in :issue:`10181`) +(Contributed by Stefan Krah in :issue:`10181`.) .. seealso:: @@ -307,8 +307,8 @@ Python version when a more recent version is installed). In addition to the launcher, the Windows installer now includes an -option to add the newly installed Python to the system PATH (contributed -by Brian Curtin in :issue:`3561`). +option to add the newly installed Python to the system PATH. (Contributed +by Brian Curtin in :issue:`3561`.) .. seealso:: @@ -781,7 +781,7 @@ Both :func:`unicodedata.lookup()` and ``'\N{...}'`` now resolve name aliases, and :func:`unicodedata.lookup()` resolves named sequences too. - (Contributed by Ezio Melotti in :issue:`12753`) + (Contributed by Ezio Melotti in :issue:`12753`.) * Unicode database updated to UCD version 6.1.0 @@ -793,7 +793,7 @@ methods of :class:`bytes` and :class:`bytearray` objects now accept an integer between 0 and 255 as their first argument. - (Contributed by Petri Lehtinen in :issue:`12170`) + (Contributed by Petri Lehtinen in :issue:`12170`.) * The ``rjust()``, ``ljust()``, and ``center()`` methods of :class:`bytes` and :class:`bytearray` now accept a :class:`bytearray` for the ``fill`` @@ -854,7 +854,7 @@ * The sequence documentation has been substantially rewritten to better explain the binary/text sequence distinction and to provide specific documentation sections for the individual builtin sequence types - (:issue:`4966`) + (:issue:`4966`). New Modules @@ -891,7 +891,7 @@ objects representing IPv4 and IPv6 addresses, networks and interfaces (i.e. an IP address associated with a specific IP subnet). -(Contributed by Google and Peter Moody in :pep:`3144`) +(Contributed by Google and Peter Moody in :pep:`3144`.) lzma ---- @@ -900,7 +900,7 @@ using the LZMA algorithm, including support for the ``.xz`` and ``.lzma`` file formats. -(Contributed by Nadeem Vawda and Per ?yvind Karlsen in :issue:`6715`) +(Contributed by Nadeem Vawda and Per ?yvind Karlsen in :issue:`6715`.) Improved Modules @@ -921,7 +921,7 @@ * :class:`abc.abstractstaticmethod` has been deprecated, use :class:`staticmethod` with :func:`abc.abstractmethod` instead. -(Contributed by Darren Dale in :issue:`11610`) +(Contributed by Darren Dale in :issue:`11610`.) :meth:`abc.ABCMeta.register` now returns the registered subclass, which means it can now be used as a class decorator (:issue:`10868`). @@ -933,7 +933,7 @@ The :mod:`array` module supports the :c:type:`long long` type using ``q`` and ``Q`` type codes. -(Contributed by Oren Tirosh and Hirokazu Yamamoto in :issue:`1172711`) +(Contributed by Oren Tirosh and Hirokazu Yamamoto in :issue:`1172711`.) 
base64 @@ -964,14 +964,14 @@ * :class:`bz2.BZ2File` can now read from and write to arbitrary file-like objects, by means of its constructor's *fileobj* argument. - (Contributed by Nadeem Vawda in :issue:`5863`) + (Contributed by Nadeem Vawda in :issue:`5863`.) * :class:`bz2.BZ2File` and :func:`bz2.decompress` can now decompress multi-stream inputs (such as those produced by the :program:`pbzip2` tool). :class:`bz2.BZ2File` can now also be used to create this type of file, using the ``'a'`` (append) mode. - (Contributed by Nir Aides in :issue:`1625`) + (Contributed by Nir Aides in :issue:`1625`.) * :class:`bz2.BZ2File` now implements all of the :class:`io.BufferedIOBase` API, except for the :meth:`detach` and :meth:`truncate` methods. @@ -1018,7 +1018,7 @@ Addition of a new :class:`~collections.ChainMap` class to allow treating a number of mappings as a single unit. (Written by Raymond Hettinger for -:issue:`11089`, made public in :issue:`11297`) +:issue:`11089`, made public in :issue:`11297`.) The abstract base classes have been moved in a new :mod:`collections.abc` module, to better differentiate between the abstract and the concrete @@ -1069,7 +1069,7 @@ push a wide character so the next :meth:`~curses.window.get_wch` will return it -(Contributed by I?igo Serna in :issue:`6755`) +(Contributed by I?igo Serna in :issue:`6755`.) datetime -------- @@ -1376,11 +1376,11 @@ :func:`~ftplib.FTP_TLS.ccc` function to revert control channel back to plaintext. This can be useful to take advantage of firewalls that know how to handle NAT with non-secure FTP without opening fixed ports. (Contributed - by Giampaolo Rodol? in :issue:`12139`) + by Giampaolo Rodol? in :issue:`12139`.) * Added :meth:`ftplib.FTP.mlsd` method which provides a parsable directory listing format and deprecates :meth:`ftplib.FTP.nlst` and - :meth:`ftplib.FTP.dir`. (Contributed by Giampaolo Rodol? in :issue:`11072`) + :meth:`ftplib.FTP.dir`. (Contributed by Giampaolo Rodol? in :issue:`11072`.) functools @@ -1404,7 +1404,7 @@ A new :func:`~hmac.compare_digest` function has been added to prevent side channel attacks on digests through timing analysis. (Contributed by Nick -Coghlan and Christian Heimes in :issue:`15061`) +Coghlan and Christian Heimes in :issue:`15061`.) http @@ -1436,13 +1436,13 @@ (Contributed by Ezio Melotti in :issue:`15114`, and :issue:`14538`, :issue:`13993`, :issue:`13960`, :issue:`13358`, :issue:`1745761`, :issue:`755670`, :issue:`13357`, :issue:`12629`, :issue:`1200313`, -:issue:`670664`, :issue:`13273`, :issue:`12888`, :issue:`7311`) +:issue:`670664`, :issue:`13273`, :issue:`12888`, :issue:`7311`.) A new :data:`~html.entities.html5` dictionary that maps HTML5 named character references to the equivalent Unicode character(s) (e.g. ``html5['gt;'] == '>'``) has been added to the :mod:`html.entities` module. The dictionary is now also used by :class:`~html.parser.HTMLParser`. (Contributed by Ezio -Melotti in :issue:`11113` and :issue:`15156`) +Melotti in :issue:`11113` and :issue:`15156`.) imaplib @@ -1451,7 +1451,7 @@ The :class:`~imaplib.IMAP4_SSL` constructor now accepts an SSLContext parameter to control parameters of the secure channel. -(Contributed by Sijin Joseph in :issue:`8808`) +(Contributed by Sijin Joseph in :issue:`8808`.) inspect @@ -1462,14 +1462,14 @@ where those names were resolved, making it easier to verify correct internal state when testing code that relies on stateful closures. 
-(Contributed by Meador Inge and Nick Coghlan in :issue:`13062`) +(Contributed by Meador Inge and Nick Coghlan in :issue:`13062`.) A new :func:`~inspect.getgeneratorlocals` function has been added. This function reports the current binding of local variables in the generator's stack frame, making it easier to verify correct internal state when testing generators. -(Contributed by Meador Inge in :issue:`15153`) +(Contributed by Meador Inge in :issue:`15153`.) io -- @@ -1478,7 +1478,7 @@ exclusively create a new file, and raise a :exc:`FileExistsError` if the file already exists. It is based on the C11 'x' mode to fopen(). -(Contributed by David Townshend in :issue:`12760`) +(Contributed by David Townshend in :issue:`12760`.) The constructor of the :class:`~io.TextIOWrapper` class has a new *write_through* optional argument. If *write_through* is ``True``, calls to @@ -1513,7 +1513,7 @@ The :mod:`math` module has a new function, :func:`~math.log2`, which returns the base-2 logarithm of *x*. -(Written by Mark Dickinson in :issue:`11888`). +(Written by Mark Dickinson in :issue:`11888`.) mmap @@ -1567,7 +1567,7 @@ ('211 1755 1 1755 gmane.comp.python.committers', 1755, 1, 1755, 'gmane.comp.python.committers') >>> -(Contributed by Giampaolo Rodol? in :issue:`9795`) +(Contributed by Giampaolo Rodol? in :issue:`9795`.) os @@ -1744,24 +1744,24 @@ set to False makes the method execute the scheduled events due to expire soonest (if any) and then return immediately. This is useful in case you want to use the :class:`~sched.scheduler` in - non-blocking applications. (Contributed by Giampaolo Rodol? in :issue:`13449`) + non-blocking applications. (Contributed by Giampaolo Rodol? in :issue:`13449`.) * :class:`~sched.scheduler` class can now be safely used in multi-threaded environments. (Contributed by Josiah Carlson and Giampaolo Rodol? in - :issue:`8684`) + :issue:`8684`.) * *timefunc* and *delayfunct* parameters of :class:`~sched.scheduler` class constructor are now optional and defaults to :func:`time.time` and :func:`time.sleep` respectively. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) * :meth:`~sched.scheduler.enter` and :meth:`~sched.scheduler.enterabs` *argument* parameter is now optional. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) * :meth:`~sched.scheduler.enter` and :meth:`~sched.scheduler.enterabs` now accept a *kwargs* parameter. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) select @@ -1787,10 +1787,10 @@ * New functions: * :func:`~shutil.disk_usage`: provides total, used and free disk space - statistics. (Contributed by Giampaolo Rodol? in :issue:`12442`) + statistics. (Contributed by Giampaolo Rodol? in :issue:`12442`.) * :func:`~shutil.chown`: allows one to change user and/or group of the given path also specifying the user/group names and not only their numeric - ids. (Contributed by Sandro Tosi in :issue:`12191`) + ids. (Contributed by Sandro Tosi in :issue:`12191`.) * :func:`shutil.get_terminal_size`: returns the size of the terminal window to which the interpreter is attached. (Contributed by Zbigniew J?drzejewski-Szmek in :issue:`13609`.) @@ -1813,7 +1813,7 @@ * :func:`~shutil.rmtree` is now resistant to symlink attacks on platforms which support the new ``dir_fd`` parameter in :func:`os.open` and - :func:`os.unlink`. (Contributed by Martin von L?wis and Hynek Schlawack + :func:`os.unlink`. (Contributed by Martin von L?wis and Hynek Schlawack in :issue:`4489`.) 
@@ -1867,7 +1867,7 @@ The :class:`~smtplib.SMTP_SSL` constructor and the :meth:`~smtplib.SMTP.starttls` method now accept an SSLContext parameter to control parameters of the secure -channel. (Contributed by Kasun Herath in :issue:`8809`) +channel. (Contributed by Kasun Herath in :issue:`8809`.) socket @@ -1887,7 +1887,7 @@ (http://en.wikipedia.org/wiki/Socketcan), on Linux (http://lwn.net/Articles/253425). - (Contributed by Matthias Fuchs, updated by Tiago Gon?alves in :issue:`10141`) + (Contributed by Matthias Fuchs, updated by Tiago Gon?alves in :issue:`10141`.) * The :class:`~socket.socket` class now supports the PF_RDS protocol family (http://en.wikipedia.org/wiki/Reliable_Datagram_Sockets and @@ -1929,37 +1929,37 @@ pseudo-random bytes. * :func:`~ssl.RAND_pseudo_bytes`: generate pseudo-random bytes. - (Contributed by Victor Stinner in :issue:`12049`) + (Contributed by Victor Stinner in :issue:`12049`.) * The :mod:`ssl` module now exposes a finer-grained exception hierarchy in order to make it easier to inspect the various kinds of errors. - (Contributed by Antoine Pitrou in :issue:`11183`) + (Contributed by Antoine Pitrou in :issue:`11183`.) * :meth:`~ssl.SSLContext.load_cert_chain` now accepts a *password* argument to be used if the private key is encrypted. - (Contributed by Adam Simpkins in :issue:`12803`) + (Contributed by Adam Simpkins in :issue:`12803`.) * Diffie-Hellman key exchange, both regular and Elliptic Curve-based, is now supported through the :meth:`~ssl.SSLContext.load_dh_params` and :meth:`~ssl.SSLContext.set_ecdh_curve` methods. - (Contributed by Antoine Pitrou in :issue:`13626` and :issue:`13627`) + (Contributed by Antoine Pitrou in :issue:`13626` and :issue:`13627`.) * SSL sockets have a new :meth:`~ssl.SSLSocket.get_channel_binding` method allowing the implementation of certain authentication mechanisms such as - SCRAM-SHA-1-PLUS. (Contributed by Jacek Konieczny in :issue:`12551`) + SCRAM-SHA-1-PLUS. (Contributed by Jacek Konieczny in :issue:`12551`.) * You can query the SSL compression algorithm used by an SSL socket, thanks to its new :meth:`~ssl.SSLSocket.compression` method. The new attribute :attr:`~ssl.OP_NO_COMPRESSION` can be used to disable compression. - (Contributed by Antoine Pitrou in :issue:`13634`) + (Contributed by Antoine Pitrou in :issue:`13634`.) * Support has been added for the Next Procotol Negotiation extension using the :meth:`ssl.SSLContext.set_npn_protocols` method. - (Contributed by Colin Marc in :issue:`14204`) + (Contributed by Colin Marc in :issue:`14204`.) * SSL errors can now be introspected more easily thanks to :attr:`~ssl.SSLError.library` and :attr:`~ssl.SSLError.reason` attributes. - (Contributed by Antoine Pitrou in :issue:`14837`) + (Contributed by Antoine Pitrou in :issue:`14837`.) * The :func:`~ssl.get_server_certificate` function now supports IPv6. (Contributed by Charles-Fran?ois Natali in :issue:`11811`.) @@ -1976,7 +1976,7 @@ :func:`stat.filemode`. It can be used to convert a file's mode to a string of the form '-rwxrwxrwx'. -(Contributed by Giampaolo Rodol? in :issue:`14807`) +(Contributed by Giampaolo Rodol? in :issue:`14807`.) struct @@ -2035,8 +2035,8 @@ :class:`threading.Condition`, :class:`threading.Semaphore`, :class:`threading.BoundedSemaphore`, :class:`threading.Event`, and :class:`threading.Timer`, all of which used to be factory functions returning a -class instance, are now classes and may be subclassed. (Contributed by ?ric -Araujo in :issue:`10968`). +class instance, are now classes and may be subclassed. 
(Contributed by ?ric +Araujo in :issue:`10968`.) The :class:`threading.Thread` constructor now accepts a ``daemon`` keyword argument to override the default behavior of inheriting the ``deamon`` flag @@ -2066,7 +2066,7 @@ * :func:`~time.clock_getres`, :func:`~time.clock_gettime` and :func:`~time.clock_settime` functions with ``CLOCK_xxx`` constants. - (Contributed by Victor Stinner in :issue:`10278`) + (Contributed by Victor Stinner in :issue:`10278`.) To improve cross platform consistency, :func:`~time.sleep` now raises a :exc:`ValueError` when passed a negative sleep value. Previously this was an @@ -2090,7 +2090,7 @@ :meth:`.assertRaises`, :meth:`.assertRaisesRegex`, :meth:`.assertWarns`, and :meth:`.assertWarnsRegex` now accept a keyword argument *msg* when used as context managers. (Contributed by Ezio Melotti and Winston Ewert in -:issue:`10775`) +:issue:`10775`.) :meth:`unittest.TestCase.run` now returns the :class:`~unittest.TestResult` object. @@ -2117,7 +2117,7 @@ and the generic launchers :program:`xdg-open`, from the FreeDesktop.org project, and :program:`gvfs-open`, which is the default URI handler for GNOME 3. (The former contributed by Arnaud Calmettes in :issue:`13620`, the latter -by Matthias Klose in :issue:`14493`) +by Matthias Klose in :issue:`14493`.) xml.etree.ElementTree @@ -2160,7 +2160,7 @@ * UTF-8 is now 2x to 4x faster. UTF-16 encoding is now up to 10x faster. - (contributed by Serhiy Storchaka, :issue:`14624`, :issue:`14738` and + (Contributed by Serhiy Storchaka, :issue:`14624`, :issue:`14738` and :issue:`15026`.) diff --git a/Doc/whatsnew/3.4.rst b/Doc/whatsnew/3.4.rst --- a/Doc/whatsnew/3.4.rst +++ b/Doc/whatsnew/3.4.rst @@ -52,7 +52,7 @@ * It's helpful to add the bug/patch number as a comment: The :ref:`~socket.transmogrify()` function was added to the - :mod:`socket` module. (Contributed by P.Y. Developer in :issue:`12345`.) + :mod:`socket` module. (Contributed by P.Y. Developer in :issue:`12345`.) This saves the maintainer the effort of going through the Mercurial log when researching a change. @@ -372,7 +372,7 @@ in :ref:`binary-transforms` and :ref:`text-transforms`. (Contributed by Nick Coghlan in :issue:`7475`, :issue:`17827`, -:issue:`17828` and :issue:`19619`) +:issue:`17828` and :issue:`19619`.) .. _whatsnew-pep-451: @@ -414,14 +414,14 @@ * Module ``__file__`` attributes (and related values) should now always contain absolute paths by default, with the sole exception of ``__main__.__file__`` when a script has been executed directly using - a relative path (Contributed by Brett Cannon in :issue:`18416`). + a relative path. (Contributed by Brett Cannon in :issue:`18416`.) * All the UTF-\* codecs (except UTF-7) now reject surrogates during both encoding and decoding unless the ``surrogatepass`` error handler is used, with the exception of the UTF-16 decoder (which accepts valid surrogate pairs) and the UTF-16 encoder (which produces them while encoding non-BMP characters). - Contributed by Victor Stinner, Kang-Hao (Kenny) Lu and Serhiy Storchaka in - :issue:`12892`. + (Contributed by Victor Stinner, Kang-Hao (Kenny) Lu and Serhiy Storchaka in + :issue:`12892`.) * New German EBCDIC :ref:`codec ` ``cp273``. (Contributed by Michael Bierenfeld and Andrew Kuchling in :issue:`1097797`.) @@ -633,8 +633,8 @@ in :issue:`12866`.) New :func:`~audioop.byteswap` function converts big-endian samples to -little-endian and vice versa (Contributed by Serhiy Storchaka in -:issue:`19641`). +little-endian and vice versa. 
(Contributed by Serhiy Storchaka in +:issue:`19641`.) All :mod:`audioop` functions now accept any :term:`bytes-like object`. Strings are not accepted: they didn't work before, now they raise an error right away. @@ -681,8 +681,8 @@ The new :class:`contextlib.suppress` context manager helps to clarify the intent of code that deliberately suppresses exceptions from a single -statement. (Contributed by Raymond Hettinger in :issue:`15806` and -Zero Piraeus in :issue:`19266`) +statement. (Contributed by Raymond Hettinger in :issue:`15806` and +Zero Piraeus in :issue:`19266`.) The new :func:`contextlib.redirect_stdout` context manager makes it easier for utility scripts to handle inflexible APIs that write their output to @@ -693,7 +693,7 @@ from a function that was written to implement a command line interface. It is recommended only for utility scripts because it affects the global state of :data:`sys.stdout`. (Contributed by Raymond Hettinger -in :issue:`15805`) +in :issue:`15805`.) The :mod:`contextlib` documentation has also been updated to include a :ref:`discussion ` of the @@ -765,7 +765,7 @@ to ``distb(tb)``). (Contributed by Nick Coghlan, Ryan Kelly and Thomas Kluyver in :issue:`11816` -and Claudiu Popa in :issue:`17916`) +and Claudiu Popa in :issue:`17916`.) New function :func:`~dis.stack_effect` computes the effect on the Python stack of a given opcode and argument, information that is not otherwise available. @@ -855,7 +855,7 @@ for normal callables. The new descriptor also makes it easier to get arbitrary callables (including :func:`~functools.partial` instances) to behave like normal instance methods when included in a class definition. -(Contributed by Alon Horev and Nick Coghlan in :issue:`4331`) +(Contributed by Alon Horev and Nick Coghlan in :issue:`4331`.) .. _whatsnew-singledispatch: @@ -903,7 +903,7 @@ A new :func:`hashlib.pbkdf2_hmac` function provides the `PKCS#5 password-based key derivation function 2 `_. (Contributed by Christian -Heimes in :issue:`18582`) +Heimes in :issue:`18582`.) The :attr:`~hashlib.hash.name` attribute of :mod:`hashlib` hash objects is now a formally supported interface. It has always existed in CPython's @@ -939,17 +939,17 @@ New function :func:`~html.unescape` function converts HTML5 character references to the corresponding Unicode characters. (Contributed by Ezio Melotti in -:issue:`2927`) +:issue:`2927`.) :class:`~html.parser.HTMLParser` accepts a new keyword argument *convert_charrefs* that, when ``True``, automatically converts all character references. For backward-compatibility, its value defaults to ``False``, but it will change to ``True`` in a future version of Python, so you are invited to set it explicitly and update your code to use this new feature. (Contributed -by Ezio Melotti in :issue:`13633`) +by Ezio Melotti in :issue:`13633`.) The *strict* argument of :class:`~html.parser.HTMLParser` is now deprecated. -(Contributed by Ezio Melotti in :issue:`15114`) +(Contributed by Ezio Melotti in :issue:`15114`.) http @@ -1015,19 +1015,19 @@ The :mod:`inspect` module now offers a basic :ref:`command line interface ` to quickly display source code and other -information for modules, classes and functions. (Contributed by Claudiu Popa -and Nick Coghlan in :issue:`18626`) +information for modules, classes and functions. (Contributed by Claudiu Popa +and Nick Coghlan in :issue:`18626`.) 
:func:`~inspect.unwrap` makes it easy to unravel wrapper function chains created by :func:`functools.wraps` (and any other API that sets the -``__wrapped__`` attribute on a wrapper function). (Contributed by -Daniel Urban, Aaron Iles and Nick Coghlan in :issue:`13266`) +``__wrapped__`` attribute on a wrapper function). (Contributed by +Daniel Urban, Aaron Iles and Nick Coghlan in :issue:`13266`.) As part of the implementation of the new :mod:`enum` module, the :mod:`inspect` module now has substantially better support for custom ``__dir__`` methods and dynamic class attributes provided through -metaclasses (Contributed by Ethan Furman in :issue:`18929` and -:issue:`19030`) +metaclasses. (Contributed by Ethan Furman in :issue:`18929` and +:issue:`19030`.) :func:`~inspect.getfullargspec` and :func:`~inspect.getargspec` now use the :func:`~inspect.signature` API. This allows them to @@ -1038,11 +1038,11 @@ attributes, and report the already bound first argument for bound methods, so it is still necessary to update your code to use :func:`~inspect.signature` directly if those features are desired. -(Contributed by Yury Selivanov in :issue:`17481`) +(Contributed by Yury Selivanov in :issue:`17481`.) :func:`~inspect.signature` now supports duck types of CPython functions, -which adds support for functions compiled with Cython. (Contributed -by Stefan Behnel and Yury Selivanov in :issue:`17159`) +which adds support for functions compiled with Cython. (Contributed +by Stefan Behnel and Yury Selivanov in :issue:`17159`.) ipaddress @@ -1082,7 +1082,7 @@ Logging configuration data received from a socket via the :func:`logging.config.listen` function can now be validated before being processed by supplying a verification function as the argument to the new -*verify* keyword argument. (Contributed by Vinay Sajip in :issue:`15452`.) +*verify* keyword argument. (Contributed by Vinay Sajip in :issue:`15452`.) .. _whatsnew-marshal-3: @@ -1120,7 +1120,7 @@ :func:`~multiprocessing.get_all_start_methods` reports all start methods available on the platform, :func:`~multiprocessing.get_start_method` reports the current start method, and :func:`~multiprocessing.set_start_method` sets -the start method. (Contributed by Richard Oudkerk in :issue:`8713`). +the start method. (Contributed by Richard Oudkerk in :issue:`8713`.) :mod:`multiprocessing` also now has the concept of a ``context``, which determines how child processes are created. New function @@ -1141,7 +1141,7 @@ when using the ``spawn`` or ``forkserver`` start methods. This resolves some edge cases where combining multiprocessing, the ``-m`` command line switch, and explicit relative imports could cause obscure failures in child -processes. (Contributed by Nick Coghlan in :issue:`19946`) +processes. (Contributed by Nick Coghlan in :issue:`19946`.) operator @@ -1176,7 +1176,7 @@ Windows). (Contributed by Brian Curtin in :issue:`11939`.) :func:`os.path.ismount` now recognizes volumes mounted below a drive -root on Windows. (Contributed by Tim Golden in :issue:`9035`.) +root on Windows. (Contributed by Tim Golden in :issue:`9035`.) :func:`os.open` supports two new flags on platforms that provide them, :data:`~os.O_PATH` (un-opened file descriptor), and :data:`~os.O_TMPFILE` @@ -1230,7 +1230,7 @@ functions. (The older API is now deprecated.) In addition to the already supported XML plist format (:data:`~plistlib.FMT_XML`), it also now supports the binary plist format (:data:`~plistlib.FMT_BINARY`). 
(Contributed by Ronald -Oussoren and others in :issue:`14455`). +Oussoren and others in :issue:`14455`.) poplib @@ -1254,7 +1254,7 @@ (Contributed by Serhiy Storchaka in :issue:`19132`.) Long strings are now wrapped using Python's normal line continuation -syntax. (Contributed by Antoine Pitrou in :issue:`17150`). +syntax. (Contributed by Antoine Pitrou in :issue:`17150`.) pty @@ -1270,13 +1270,13 @@ The :mod:`pydoc` module is now based directly on the :func:`inspect.signature` introspection API, allowing it to provide signature information for a wider variety of callable objects. This change also means that ``__wrapped__`` -attributes are now taken into account when displaying help information -(Contributed by Larry Hastings in :issue:`19674`) +attributes are now taken into account when displaying help information. +(Contributed by Larry Hastings in :issue:`19674`.) The :mod:`pydoc` module no longer displays the ``self`` parameter for already bound methods. Instead, it aims to always display the exact current -signature of the supplied callable (Contributed by Larry Hastings in -:issue:`20710`) +signature of the supplied callable. (Contributed by Larry Hastings in +:issue:`20710`.) In addition to the changes that have been made to :mod:`pydoc` directly, its handling of custom ``__dir__`` methods and various descriptor @@ -1372,7 +1372,7 @@ :exc:`~smtplib.SMTPException` is now a subclass of :exc:`OSError`, which allows both socket level errors and SMTP protocol level errors to be caught in one try/except statement by code that only cares whether or not an error occurred. -(Contributed by Ned Jackson Lovely in :issue:`2118`). +(Contributed by Ned Jackson Lovely in :issue:`2118`.) socket @@ -1412,7 +1412,7 @@ :data:`~ssl.PROTOCOL_TLSv1_1` and :data:`~ssl.PROTOCOL_TLSv1_2` (TLSv1.1 and TLSv1.2 support) have been added; support for these protocols is only available if Python is linked with OpenSSL 1.0.1 or later. (Contributed by Michele Orr? and -Antoine Pitrou in :issue:`16692`) +Antoine Pitrou in :issue:`16692`.) .. _whatsnew34-sslcontext: @@ -1596,7 +1596,7 @@ A new :func:`traceback.clear_frames` function takes a traceback object and clears the local variables in all of the frames it references, reducing the amount of memory consumed. (Contributed by Andrew Kuchling in -:issue:`1565525`). +:issue:`1565525`.) types @@ -1619,7 +1619,7 @@ The http method that will be used by a :class:`~urllib.request.Request` class can now be specified by setting a :class:`~urllib.request.Request.method` -class attribute on the subclass. (Contributed by Jason R Coombs in +class attribute on the subclass. (Contributed by Jason R Coombs in :issue:`18978`.) :class:`~urllib.request.Request` objects are now reusable: if the @@ -1701,14 +1701,14 @@ :issue:`17015`.) :func:`~mock.mock_open` objects now have ``readline`` and ``readlines`` -methods. (Contributed by Toshio Kuratomi in :issue:`17467`.) +methods. (Contributed by Toshio Kuratomi in :issue:`17467`.) venv ---- :mod:`venv` now includes activation scripts for the ``csh`` and ``fish`` -shells (Contributed by Andrew Svetlov in :issue:`15417`.) +shells. (Contributed by Andrew Svetlov in :issue:`15417`.) :class:`~venv.EnvBuilder` and the :func:`~venv.create` convenience function take a new keyword argument *with_pip*, which defaults to ``False``, that @@ -1739,12 +1739,12 @@ ------- New :class:`~weakref.WeakMethod` class simulates weak references to bound -methods. (Contributed by Antoine Pitrou in :issue:`14631`.) +methods. 
(Contributed by Antoine Pitrou in :issue:`14631`.) New :class:`~weakref.finalize` class makes it possible to register a callback to be invoked when an object is garbage collected, without needing to -carefully manage the lifecycle of the weak reference itself. (Contributed by -Richard Oudkerk in :issue:`15528`) +carefully manage the lifecycle of the weak reference itself. (Contributed by +Richard Oudkerk in :issue:`15528`.) The callback, if any, associated with a :class:`~weakref.ref` is now exposed via the :attr:`~weakref.ref.__callback__` attribute. (Contributed @@ -1879,16 +1879,16 @@ * The new :c:func:`PyType_GetSlot` function has been added to the stable ABI, allowing retrieval of function pointers from named type slots when using - the limited API. (Contributed by Martin von L?wis in :issue:`17162`) + the limited API. (Contributed by Martin von L?wis in :issue:`17162`.) * The new :c:func:`Py_SetStandardStreamEncoding` pre-initialization API allows applications embedding the CPython interpreter to reliably force - a particular encoding and error handler for the standard streams - (Contributed by Bastien Montagne and Nick Coghlan in :issue:`16129`) + a particular encoding and error handler for the standard streams. + (Contributed by Bastien Montagne and Nick Coghlan in :issue:`16129`.) * Most Python C APIs that don't mutate string arguments are now correctly - marked as accepting ``const char *`` rather than ``char *`` (Contributed - by Serhiy Storchaka in :issue:`1772673`). + marked as accepting ``const char *`` rather than ``char *``. (Contributed + by Serhiy Storchaka in :issue:`1772673`.) * A new shell version of ``python-config`` can be used even when a python interpreter is not available (for example, in cross compilation scenarios). @@ -1958,7 +1958,7 @@ * The ``-R`` option to the :ref:`python regression test suite ` now also checks for memory allocation leaks, using :func:`sys.getallocatedblocks()`. (Contributed by Antoine Pitrou in - :issue:`13390`). + :issue:`13390`.) * ``python -m`` now works with namespace packages. @@ -2021,14 +2021,14 @@ longer imported by default. The marshal module has been improved to load compiled Python code faster. (Contributed by Antoine Pitrou, Christian Heimes and Victor Stinner in :issue:`19219`, :issue:`19218`, :issue:`19209`, - :issue:`19205` and :issue:`9548`) + :issue:`19205` and :issue:`9548`.) * :class:`bz2.BZ2File` is now as fast or faster than the Python2 version for most cases. :class:`lzma.LZMAFile` has also been optimized. (Contributed by Serhiy Storchaka and Nadeem Vawda in :issue:`16034`.) * :func:`random.getrandbits` is 20%-40% faster for small integers (the most - common use case). (Contributed by Serhiy Storchaka in :issue:`16674`). + common use case). (Contributed by Serhiy Storchaka in :issue:`16674`.) * By taking advantage of the new storage format for strings, pickling of strings is now significantly faster. (Contributed by Victor Stinner and @@ -2048,7 +2048,7 @@ * :func:`os.urandom` now uses a lazily-opened persistent file descriptor so as to avoid using many file descriptors when run in parallel from - multiple threads. (Contributed by Antoine Pitrou in :issue:`18756`.) + multiple threads. (Contributed by Antoine Pitrou in :issue:`18756`.) .. _deprecated-3.4: @@ -2246,7 +2246,7 @@ * The [X refs, Y blocks] output of a debug (``--with-pydebug``) build of the CPython interpreter is now off by default. It can be re-enabled using the - ``-X showrefcount`` option. (Contributed by Ezio Melotti in :issue:`17323`.) 
+ ``-X showrefcount`` option. (Contributed by Ezio Melotti in :issue:`17323`.) * The python command and most stdlib scripts (as well as :mod:`argparse`) now output ``--version`` information to ``stdout`` instead of ``stderr`` (for @@ -2395,8 +2395,8 @@ storage). (:issue:`17094`.) * Parameter names in ``__annotations__`` dicts are now mangled properly, - similarly to ``__kwdefaults__``. (Contributed by Yury Selivanov in - :issue:`20625`). + similarly to ``__kwdefaults__``. (Contributed by Yury Selivanov in + :issue:`20625`.) * :attr:`hashlib.hash.name` now always returns the identifier in lower case. Previously some builtin hashes had uppercase names, but now that it is a diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -138,22 +138,22 @@ ---- * The :func:`code.InteractiveInterpreter.showtraceback` method now prints - the full chained traceback, just like the interactive interpreter - (contributed by Claudiu.Popa in :issue:`17442`). + the full chained traceback, just like the interactive interpreter. + (Contributed by Claudiu.Popa in :issue:`17442`.) compileall ---------- * :func:`compileall.compile_dir` and :mod:`compileall`'s command-line interface can now do parallel bytecode compilation. - (Contributed by Claudiu Popa in :issue:`16104`). + (Contributed by Claudiu Popa in :issue:`16104`.) doctest ------- * :func:`doctest.DocTestSuite` returns an empty :class:`unittest.TestSuite` if - *module* contains no docstrings instead of raising :exc:`ValueError` - (contributed by Glenn Jones in :issue:`15916`). + *module* contains no docstrings instead of raising :exc:`ValueError`. + (Contributed by Glenn Jones in :issue:`15916`.) glob ---- @@ -168,20 +168,20 @@ * :class:`IMAP4` now supports the context management protocol. When used in a :keyword:`with` statement, the IMAP4 ``LOGOUT`` command will be called automatically at the end of the block. (Contributed by Tarek Ziad? and - Serhiy Storchaka in :issue:`4972`). + Serhiy Storchaka in :issue:`4972`.) imghdr ------ * :func:`~imghdr.what` now recognizes the `OpenEXR `_ - format (contributed by Martin vignali and Cladui Popa in :issue:`20295`). + format. (Contributed by Martin vignali and Cladui Popa in :issue:`20295`.) importlib --------- * :class:`importlib.util.LazyLoader` allows for the lazy loading of modules in - applications where startup time is paramount (contributed by Brett Cannon in - :issue:`17621`). + applications where startup time is paramount. + (Contributed by Brett Cannon in :issue:`17621`.) * :func:`importlib.abc.InspectLoader.source_to_code` is now a static method to make it easier to work with source code in a string. @@ -196,26 +196,26 @@ ------- * :class:`inspect.Signature` and :class:`inspect.Parameter` are now - picklable and hashable (contributed by Yury Selivanov in :issue:`20726` - and :issue:`20334`). + picklable and hashable. (Contributed by Yury Selivanov in :issue:`20726` + and :issue:`20334`.) * New class method :meth:`inspect.Signature.from_callable`, which makes - subclassing of :class:`~inspect.Signature` easier (contributed - by Yury Selivanov and Eric Snow in :issue:`17373`). + subclassing of :class:`~inspect.Signature` easier. (Contributed + by Yury Selivanov and Eric Snow in :issue:`17373`.) 
ipaddress --------- * :class:`ipaddress.IPv4Network` and :class:`ipaddress.IPv6Network` now accept an ``(address, netmask)`` tuple argument, so as to easily construct - network objects from existing addresses (contributed by Peter Moody - and Antoine Pitrou in :issue:`16531`). + network objects from existing addresses. (Contributed by Peter Moody + and Antoine Pitrou in :issue:`16531`.) os -- * :class:`os.stat_result` now has a :attr:`~os.stat_result.st_file_attributes` - attribute on Windows (contributed by Ben Hoyt in :issue:`21719`). + attribute on Windows. (Contributed by Ben Hoyt in :issue:`21719`.) re -- @@ -239,8 +239,8 @@ * Different constants of :mod:`signal` module are now enumeration values using the :mod:`enum` module. This allows meaningful names to be printed during - debugging, instead of integer ?magic numbers?. (contributed by Giampaolo - Rodola' in :issue:`21076`) + debugging, instead of integer ?magic numbers?. (Contributed by Giampaolo + Rodola' in :issue:`21076`.) smtpd ----- @@ -264,15 +264,15 @@ ------- * A new :meth:`~smtplib.SMTP.auth` method provides a convenient way to - implement custom authentication mechanisms (contributed by Milan Oberkirch in - :issue:`15014`). + implement custom authentication mechanisms. + (Contributed by Milan Oberkirch in :issue:`15014`.) sndhdr ------ * :func:`~sndhdr.what` and :func:`~sndhdr.whathdr` now return - :func:`~collections.namedtuple` \s (contributed by Claudiu Popa in - :issue:`18615`). + :func:`~collections.namedtuple`. + (Contributed by Claudiu Popa in :issue:`18615`.) socket ------ @@ -281,7 +281,7 @@ by using high-performance :func:`os.sendfile` function on UNIX resulting in uploads being from 2x to 3x faster than when using plain :meth:`socket.socket.send`. - (contributed by Giampaolo Rodola' in :issue:`17552`) + (Contributed by Giampaolo Rodola' in :issue:`17552`.) time ---- @@ -298,8 +298,8 @@ xmlrpc ------ -* :class:`xmlrpc.client.ServerProxy` is now a :term:`context manager` - (contributed by Claudiu Popa in :issue:`20627`). +* :class:`xmlrpc.client.ServerProxy` is now a :term:`context manager`. + (Contributed by Claudiu Popa in :issue:`20627`.) Optimizations @@ -380,7 +380,8 @@ and the ``__version__`` string was not updated in the last few releases. * The internal ``Netrc`` class in the :mod:`ftplib` module was deprecated in - 3.4, and has now been removed. (Contributed by Matt Chaput in :issue:`6623`.) + 3.4, and has now been removed. + (Contributed by Matt Chaput in :issue:`6623`.) Porting to Python 3.5 ===================== @@ -408,15 +409,15 @@ * The deprecated "strict" mode and argument of :class:`~html.parser.HTMLParser`, :meth:`HTMLParser.error`, and the :exc:`HTMLParserError` exception have been - removed (contributed by Ezio Melotti in :issue:`15114`). + removed. (Contributed by Ezio Melotti in :issue:`15114`.) The *convert_charrefs* argument of :class:`~html.parser.HTMLParser` is - now ``True`` by default (contributed by Berker Peksag in :issue:`21047`). + now ``True`` by default. (Contributed by Berker Peksag in :issue:`21047`.) * Although it is not formally part of the API, it is worth noting for porting purposes (ie: fixing tests) that error messages that were previously of the form "'sometype' does not support the buffer protocol" are now of the form "a - bytes-like object is required, not 'sometype'" (contributed by Ezio Melotti - in :issue:`16518`). + bytes-like object is required, not 'sometype'". (Contributed by Ezio Melotti + in :issue:`16518`.) 
Changes in the C API -------------------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:29:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 17:29:27 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyMzg4?= =?utf-8?q?=3A_Unified_the_style_of_=22Contributed_by=22_sentences_in_What?= =?utf-8?q?=27s_New=2E?= Message-ID: <20141102172926.111408.27166@psf.io> https://hg.python.org/cpython/rev/e3825486da53 changeset: 93351:e3825486da53 branch: 3.4 parent: 93346:b5e9bc4352e1 user: Serhiy Storchaka date: Sun Nov 02 19:18:52 2014 +0200 summary: Issue #22388: Unified the style of "Contributed by" sentences in What's New. files: Doc/whatsnew/3.3.rst | 102 ++++++++++++++-------------- Doc/whatsnew/3.4.rst | 112 +++++++++++++++--------------- 2 files changed, 107 insertions(+), 107 deletions(-) diff --git a/Doc/whatsnew/3.3.rst b/Doc/whatsnew/3.3.rst --- a/Doc/whatsnew/3.3.rst +++ b/Doc/whatsnew/3.3.rst @@ -171,7 +171,7 @@ * Multi-dimensional comparisons are supported for any array type. * One-dimensional memoryviews of hashable (read-only) types with formats B, - b or c are now hashable. (Contributed by Antoine Pitrou in :issue:`13411`) + b or c are now hashable. (Contributed by Antoine Pitrou in :issue:`13411`.) * Arbitrary slicing of any 1-D arrays type is supported. For example, it is now possible to reverse a memoryview in O(1) by using a negative step. @@ -196,7 +196,7 @@ * For further changes see `Build and C API Changes`_ and `Porting C code`_. -(Contributed by Stefan Krah in :issue:`10181`) +(Contributed by Stefan Krah in :issue:`10181`.) .. seealso:: @@ -307,8 +307,8 @@ Python version when a more recent version is installed). In addition to the launcher, the Windows installer now includes an -option to add the newly installed Python to the system PATH (contributed -by Brian Curtin in :issue:`3561`). +option to add the newly installed Python to the system PATH. (Contributed +by Brian Curtin in :issue:`3561`.) .. seealso:: @@ -781,7 +781,7 @@ Both :func:`unicodedata.lookup()` and ``'\N{...}'`` now resolve name aliases, and :func:`unicodedata.lookup()` resolves named sequences too. - (Contributed by Ezio Melotti in :issue:`12753`) + (Contributed by Ezio Melotti in :issue:`12753`.) * Unicode database updated to UCD version 6.1.0 @@ -793,7 +793,7 @@ methods of :class:`bytes` and :class:`bytearray` objects now accept an integer between 0 and 255 as their first argument. - (Contributed by Petri Lehtinen in :issue:`12170`) + (Contributed by Petri Lehtinen in :issue:`12170`.) * The ``rjust()``, ``ljust()``, and ``center()`` methods of :class:`bytes` and :class:`bytearray` now accept a :class:`bytearray` for the ``fill`` @@ -854,7 +854,7 @@ * The sequence documentation has been substantially rewritten to better explain the binary/text sequence distinction and to provide specific documentation sections for the individual builtin sequence types - (:issue:`4966`) + (:issue:`4966`). New Modules @@ -891,7 +891,7 @@ objects representing IPv4 and IPv6 addresses, networks and interfaces (i.e. an IP address associated with a specific IP subnet). -(Contributed by Google and Peter Moody in :pep:`3144`) +(Contributed by Google and Peter Moody in :pep:`3144`.) lzma ---- @@ -900,7 +900,7 @@ using the LZMA algorithm, including support for the ``.xz`` and ``.lzma`` file formats. 
-(Contributed by Nadeem Vawda and Per ?yvind Karlsen in :issue:`6715`) +(Contributed by Nadeem Vawda and Per ?yvind Karlsen in :issue:`6715`.) Improved Modules @@ -921,7 +921,7 @@ * :class:`abc.abstractstaticmethod` has been deprecated, use :class:`staticmethod` with :func:`abc.abstractmethod` instead. -(Contributed by Darren Dale in :issue:`11610`) +(Contributed by Darren Dale in :issue:`11610`.) :meth:`abc.ABCMeta.register` now returns the registered subclass, which means it can now be used as a class decorator (:issue:`10868`). @@ -933,7 +933,7 @@ The :mod:`array` module supports the :c:type:`long long` type using ``q`` and ``Q`` type codes. -(Contributed by Oren Tirosh and Hirokazu Yamamoto in :issue:`1172711`) +(Contributed by Oren Tirosh and Hirokazu Yamamoto in :issue:`1172711`.) base64 @@ -964,14 +964,14 @@ * :class:`bz2.BZ2File` can now read from and write to arbitrary file-like objects, by means of its constructor's *fileobj* argument. - (Contributed by Nadeem Vawda in :issue:`5863`) + (Contributed by Nadeem Vawda in :issue:`5863`.) * :class:`bz2.BZ2File` and :func:`bz2.decompress` can now decompress multi-stream inputs (such as those produced by the :program:`pbzip2` tool). :class:`bz2.BZ2File` can now also be used to create this type of file, using the ``'a'`` (append) mode. - (Contributed by Nir Aides in :issue:`1625`) + (Contributed by Nir Aides in :issue:`1625`.) * :class:`bz2.BZ2File` now implements all of the :class:`io.BufferedIOBase` API, except for the :meth:`detach` and :meth:`truncate` methods. @@ -1018,7 +1018,7 @@ Addition of a new :class:`~collections.ChainMap` class to allow treating a number of mappings as a single unit. (Written by Raymond Hettinger for -:issue:`11089`, made public in :issue:`11297`) +:issue:`11089`, made public in :issue:`11297`.) The abstract base classes have been moved in a new :mod:`collections.abc` module, to better differentiate between the abstract and the concrete @@ -1069,7 +1069,7 @@ push a wide character so the next :meth:`~curses.window.get_wch` will return it -(Contributed by I?igo Serna in :issue:`6755`) +(Contributed by I?igo Serna in :issue:`6755`.) datetime -------- @@ -1376,11 +1376,11 @@ :func:`~ftplib.FTP_TLS.ccc` function to revert control channel back to plaintext. This can be useful to take advantage of firewalls that know how to handle NAT with non-secure FTP without opening fixed ports. (Contributed - by Giampaolo Rodol? in :issue:`12139`) + by Giampaolo Rodol? in :issue:`12139`.) * Added :meth:`ftplib.FTP.mlsd` method which provides a parsable directory listing format and deprecates :meth:`ftplib.FTP.nlst` and - :meth:`ftplib.FTP.dir`. (Contributed by Giampaolo Rodol? in :issue:`11072`) + :meth:`ftplib.FTP.dir`. (Contributed by Giampaolo Rodol? in :issue:`11072`.) functools @@ -1404,7 +1404,7 @@ A new :func:`~hmac.compare_digest` function has been added to prevent side channel attacks on digests through timing analysis. (Contributed by Nick -Coghlan and Christian Heimes in :issue:`15061`) +Coghlan and Christian Heimes in :issue:`15061`.) http @@ -1436,13 +1436,13 @@ (Contributed by Ezio Melotti in :issue:`15114`, and :issue:`14538`, :issue:`13993`, :issue:`13960`, :issue:`13358`, :issue:`1745761`, :issue:`755670`, :issue:`13357`, :issue:`12629`, :issue:`1200313`, -:issue:`670664`, :issue:`13273`, :issue:`12888`, :issue:`7311`) +:issue:`670664`, :issue:`13273`, :issue:`12888`, :issue:`7311`.) 
A new :data:`~html.entities.html5` dictionary that maps HTML5 named character references to the equivalent Unicode character(s) (e.g. ``html5['gt;'] == '>'``) has been added to the :mod:`html.entities` module. The dictionary is now also used by :class:`~html.parser.HTMLParser`. (Contributed by Ezio -Melotti in :issue:`11113` and :issue:`15156`) +Melotti in :issue:`11113` and :issue:`15156`.) imaplib @@ -1451,7 +1451,7 @@ The :class:`~imaplib.IMAP4_SSL` constructor now accepts an SSLContext parameter to control parameters of the secure channel. -(Contributed by Sijin Joseph in :issue:`8808`) +(Contributed by Sijin Joseph in :issue:`8808`.) inspect @@ -1462,14 +1462,14 @@ where those names were resolved, making it easier to verify correct internal state when testing code that relies on stateful closures. -(Contributed by Meador Inge and Nick Coghlan in :issue:`13062`) +(Contributed by Meador Inge and Nick Coghlan in :issue:`13062`.) A new :func:`~inspect.getgeneratorlocals` function has been added. This function reports the current binding of local variables in the generator's stack frame, making it easier to verify correct internal state when testing generators. -(Contributed by Meador Inge in :issue:`15153`) +(Contributed by Meador Inge in :issue:`15153`.) io -- @@ -1478,7 +1478,7 @@ exclusively create a new file, and raise a :exc:`FileExistsError` if the file already exists. It is based on the C11 'x' mode to fopen(). -(Contributed by David Townshend in :issue:`12760`) +(Contributed by David Townshend in :issue:`12760`.) The constructor of the :class:`~io.TextIOWrapper` class has a new *write_through* optional argument. If *write_through* is ``True``, calls to @@ -1513,7 +1513,7 @@ The :mod:`math` module has a new function, :func:`~math.log2`, which returns the base-2 logarithm of *x*. -(Written by Mark Dickinson in :issue:`11888`). +(Written by Mark Dickinson in :issue:`11888`.) mmap @@ -1567,7 +1567,7 @@ ('211 1755 1 1755 gmane.comp.python.committers', 1755, 1, 1755, 'gmane.comp.python.committers') >>> -(Contributed by Giampaolo Rodol? in :issue:`9795`) +(Contributed by Giampaolo Rodol? in :issue:`9795`.) os @@ -1744,24 +1744,24 @@ set to False makes the method execute the scheduled events due to expire soonest (if any) and then return immediately. This is useful in case you want to use the :class:`~sched.scheduler` in - non-blocking applications. (Contributed by Giampaolo Rodol? in :issue:`13449`) + non-blocking applications. (Contributed by Giampaolo Rodol? in :issue:`13449`.) * :class:`~sched.scheduler` class can now be safely used in multi-threaded environments. (Contributed by Josiah Carlson and Giampaolo Rodol? in - :issue:`8684`) + :issue:`8684`.) * *timefunc* and *delayfunct* parameters of :class:`~sched.scheduler` class constructor are now optional and defaults to :func:`time.time` and :func:`time.sleep` respectively. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) * :meth:`~sched.scheduler.enter` and :meth:`~sched.scheduler.enterabs` *argument* parameter is now optional. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) * :meth:`~sched.scheduler.enter` and :meth:`~sched.scheduler.enterabs` now accept a *kwargs* parameter. (Contributed by Chris Clark in - :issue:`13245`) + :issue:`13245`.) select @@ -1787,10 +1787,10 @@ * New functions: * :func:`~shutil.disk_usage`: provides total, used and free disk space - statistics. (Contributed by Giampaolo Rodol? in :issue:`12442`) + statistics. (Contributed by Giampaolo Rodol? in :issue:`12442`.) 
* :func:`~shutil.chown`: allows one to change user and/or group of the given path also specifying the user/group names and not only their numeric - ids. (Contributed by Sandro Tosi in :issue:`12191`) + ids. (Contributed by Sandro Tosi in :issue:`12191`.) * :func:`shutil.get_terminal_size`: returns the size of the terminal window to which the interpreter is attached. (Contributed by Zbigniew J?drzejewski-Szmek in :issue:`13609`.) @@ -1813,7 +1813,7 @@ * :func:`~shutil.rmtree` is now resistant to symlink attacks on platforms which support the new ``dir_fd`` parameter in :func:`os.open` and - :func:`os.unlink`. (Contributed by Martin von L?wis and Hynek Schlawack + :func:`os.unlink`. (Contributed by Martin von L?wis and Hynek Schlawack in :issue:`4489`.) @@ -1867,7 +1867,7 @@ The :class:`~smtplib.SMTP_SSL` constructor and the :meth:`~smtplib.SMTP.starttls` method now accept an SSLContext parameter to control parameters of the secure -channel. (Contributed by Kasun Herath in :issue:`8809`) +channel. (Contributed by Kasun Herath in :issue:`8809`.) socket @@ -1887,7 +1887,7 @@ (http://en.wikipedia.org/wiki/Socketcan), on Linux (http://lwn.net/Articles/253425). - (Contributed by Matthias Fuchs, updated by Tiago Gon?alves in :issue:`10141`) + (Contributed by Matthias Fuchs, updated by Tiago Gon?alves in :issue:`10141`.) * The :class:`~socket.socket` class now supports the PF_RDS protocol family (http://en.wikipedia.org/wiki/Reliable_Datagram_Sockets and @@ -1929,37 +1929,37 @@ pseudo-random bytes. * :func:`~ssl.RAND_pseudo_bytes`: generate pseudo-random bytes. - (Contributed by Victor Stinner in :issue:`12049`) + (Contributed by Victor Stinner in :issue:`12049`.) * The :mod:`ssl` module now exposes a finer-grained exception hierarchy in order to make it easier to inspect the various kinds of errors. - (Contributed by Antoine Pitrou in :issue:`11183`) + (Contributed by Antoine Pitrou in :issue:`11183`.) * :meth:`~ssl.SSLContext.load_cert_chain` now accepts a *password* argument to be used if the private key is encrypted. - (Contributed by Adam Simpkins in :issue:`12803`) + (Contributed by Adam Simpkins in :issue:`12803`.) * Diffie-Hellman key exchange, both regular and Elliptic Curve-based, is now supported through the :meth:`~ssl.SSLContext.load_dh_params` and :meth:`~ssl.SSLContext.set_ecdh_curve` methods. - (Contributed by Antoine Pitrou in :issue:`13626` and :issue:`13627`) + (Contributed by Antoine Pitrou in :issue:`13626` and :issue:`13627`.) * SSL sockets have a new :meth:`~ssl.SSLSocket.get_channel_binding` method allowing the implementation of certain authentication mechanisms such as - SCRAM-SHA-1-PLUS. (Contributed by Jacek Konieczny in :issue:`12551`) + SCRAM-SHA-1-PLUS. (Contributed by Jacek Konieczny in :issue:`12551`.) * You can query the SSL compression algorithm used by an SSL socket, thanks to its new :meth:`~ssl.SSLSocket.compression` method. The new attribute :attr:`~ssl.OP_NO_COMPRESSION` can be used to disable compression. - (Contributed by Antoine Pitrou in :issue:`13634`) + (Contributed by Antoine Pitrou in :issue:`13634`.) * Support has been added for the Next Procotol Negotiation extension using the :meth:`ssl.SSLContext.set_npn_protocols` method. - (Contributed by Colin Marc in :issue:`14204`) + (Contributed by Colin Marc in :issue:`14204`.) * SSL errors can now be introspected more easily thanks to :attr:`~ssl.SSLError.library` and :attr:`~ssl.SSLError.reason` attributes. 
- (Contributed by Antoine Pitrou in :issue:`14837`) + (Contributed by Antoine Pitrou in :issue:`14837`.) * The :func:`~ssl.get_server_certificate` function now supports IPv6. (Contributed by Charles-Fran?ois Natali in :issue:`11811`.) @@ -1976,7 +1976,7 @@ :func:`stat.filemode`. It can be used to convert a file's mode to a string of the form '-rwxrwxrwx'. -(Contributed by Giampaolo Rodol? in :issue:`14807`) +(Contributed by Giampaolo Rodol? in :issue:`14807`.) struct @@ -2035,8 +2035,8 @@ :class:`threading.Condition`, :class:`threading.Semaphore`, :class:`threading.BoundedSemaphore`, :class:`threading.Event`, and :class:`threading.Timer`, all of which used to be factory functions returning a -class instance, are now classes and may be subclassed. (Contributed by ?ric -Araujo in :issue:`10968`). +class instance, are now classes and may be subclassed. (Contributed by ?ric +Araujo in :issue:`10968`.) The :class:`threading.Thread` constructor now accepts a ``daemon`` keyword argument to override the default behavior of inheriting the ``deamon`` flag @@ -2066,7 +2066,7 @@ * :func:`~time.clock_getres`, :func:`~time.clock_gettime` and :func:`~time.clock_settime` functions with ``CLOCK_xxx`` constants. - (Contributed by Victor Stinner in :issue:`10278`) + (Contributed by Victor Stinner in :issue:`10278`.) To improve cross platform consistency, :func:`~time.sleep` now raises a :exc:`ValueError` when passed a negative sleep value. Previously this was an @@ -2090,7 +2090,7 @@ :meth:`.assertRaises`, :meth:`.assertRaisesRegex`, :meth:`.assertWarns`, and :meth:`.assertWarnsRegex` now accept a keyword argument *msg* when used as context managers. (Contributed by Ezio Melotti and Winston Ewert in -:issue:`10775`) +:issue:`10775`.) :meth:`unittest.TestCase.run` now returns the :class:`~unittest.TestResult` object. @@ -2117,7 +2117,7 @@ and the generic launchers :program:`xdg-open`, from the FreeDesktop.org project, and :program:`gvfs-open`, which is the default URI handler for GNOME 3. (The former contributed by Arnaud Calmettes in :issue:`13620`, the latter -by Matthias Klose in :issue:`14493`) +by Matthias Klose in :issue:`14493`.) xml.etree.ElementTree @@ -2160,7 +2160,7 @@ * UTF-8 is now 2x to 4x faster. UTF-16 encoding is now up to 10x faster. - (contributed by Serhiy Storchaka, :issue:`14624`, :issue:`14738` and + (Contributed by Serhiy Storchaka, :issue:`14624`, :issue:`14738` and :issue:`15026`.) diff --git a/Doc/whatsnew/3.4.rst b/Doc/whatsnew/3.4.rst --- a/Doc/whatsnew/3.4.rst +++ b/Doc/whatsnew/3.4.rst @@ -52,7 +52,7 @@ * It's helpful to add the bug/patch number as a comment: The :ref:`~socket.transmogrify()` function was added to the - :mod:`socket` module. (Contributed by P.Y. Developer in :issue:`12345`.) + :mod:`socket` module. (Contributed by P.Y. Developer in :issue:`12345`.) This saves the maintainer the effort of going through the Mercurial log when researching a change. @@ -372,7 +372,7 @@ in :ref:`binary-transforms` and :ref:`text-transforms`. (Contributed by Nick Coghlan in :issue:`7475`, :issue:`17827`, -:issue:`17828` and :issue:`19619`) +:issue:`17828` and :issue:`19619`.) .. _whatsnew-pep-451: @@ -414,14 +414,14 @@ * Module ``__file__`` attributes (and related values) should now always contain absolute paths by default, with the sole exception of ``__main__.__file__`` when a script has been executed directly using - a relative path (Contributed by Brett Cannon in :issue:`18416`). + a relative path. (Contributed by Brett Cannon in :issue:`18416`.) 
* All the UTF-\* codecs (except UTF-7) now reject surrogates during both encoding and decoding unless the ``surrogatepass`` error handler is used, with the exception of the UTF-16 decoder (which accepts valid surrogate pairs) and the UTF-16 encoder (which produces them while encoding non-BMP characters). - Contributed by Victor Stinner, Kang-Hao (Kenny) Lu and Serhiy Storchaka in - :issue:`12892`. + (Contributed by Victor Stinner, Kang-Hao (Kenny) Lu and Serhiy Storchaka in + :issue:`12892`.) * New German EBCDIC :ref:`codec ` ``cp273``. (Contributed by Michael Bierenfeld and Andrew Kuchling in :issue:`1097797`.) @@ -633,8 +633,8 @@ in :issue:`12866`.) New :func:`~audioop.byteswap` function converts big-endian samples to -little-endian and vice versa (Contributed by Serhiy Storchaka in -:issue:`19641`). +little-endian and vice versa. (Contributed by Serhiy Storchaka in +:issue:`19641`.) All :mod:`audioop` functions now accept any :term:`bytes-like object`. Strings are not accepted: they didn't work before, now they raise an error right away. @@ -681,8 +681,8 @@ The new :class:`contextlib.suppress` context manager helps to clarify the intent of code that deliberately suppresses exceptions from a single -statement. (Contributed by Raymond Hettinger in :issue:`15806` and -Zero Piraeus in :issue:`19266`) +statement. (Contributed by Raymond Hettinger in :issue:`15806` and +Zero Piraeus in :issue:`19266`.) The new :func:`contextlib.redirect_stdout` context manager makes it easier for utility scripts to handle inflexible APIs that write their output to @@ -693,7 +693,7 @@ from a function that was written to implement a command line interface. It is recommended only for utility scripts because it affects the global state of :data:`sys.stdout`. (Contributed by Raymond Hettinger -in :issue:`15805`) +in :issue:`15805`.) The :mod:`contextlib` documentation has also been updated to include a :ref:`discussion ` of the @@ -765,7 +765,7 @@ to ``distb(tb)``). (Contributed by Nick Coghlan, Ryan Kelly and Thomas Kluyver in :issue:`11816` -and Claudiu Popa in :issue:`17916`) +and Claudiu Popa in :issue:`17916`.) New function :func:`~dis.stack_effect` computes the effect on the Python stack of a given opcode and argument, information that is not otherwise available. @@ -855,7 +855,7 @@ for normal callables. The new descriptor also makes it easier to get arbitrary callables (including :func:`~functools.partial` instances) to behave like normal instance methods when included in a class definition. -(Contributed by Alon Horev and Nick Coghlan in :issue:`4331`) +(Contributed by Alon Horev and Nick Coghlan in :issue:`4331`.) .. _whatsnew-singledispatch: @@ -903,7 +903,7 @@ A new :func:`hashlib.pbkdf2_hmac` function provides the `PKCS#5 password-based key derivation function 2 `_. (Contributed by Christian -Heimes in :issue:`18582`) +Heimes in :issue:`18582`.) The :attr:`~hashlib.hash.name` attribute of :mod:`hashlib` hash objects is now a formally supported interface. It has always existed in CPython's @@ -939,17 +939,17 @@ New function :func:`~html.unescape` function converts HTML5 character references to the corresponding Unicode characters. (Contributed by Ezio Melotti in -:issue:`2927`) +:issue:`2927`.) :class:`~html.parser.HTMLParser` accepts a new keyword argument *convert_charrefs* that, when ``True``, automatically converts all character references. 
For backward-compatibility, its value defaults to ``False``, but it will change to ``True`` in a future version of Python, so you are invited to set it explicitly and update your code to use this new feature. (Contributed -by Ezio Melotti in :issue:`13633`) +by Ezio Melotti in :issue:`13633`.) The *strict* argument of :class:`~html.parser.HTMLParser` is now deprecated. -(Contributed by Ezio Melotti in :issue:`15114`) +(Contributed by Ezio Melotti in :issue:`15114`.) http @@ -1015,19 +1015,19 @@ The :mod:`inspect` module now offers a basic :ref:`command line interface ` to quickly display source code and other -information for modules, classes and functions. (Contributed by Claudiu Popa -and Nick Coghlan in :issue:`18626`) +information for modules, classes and functions. (Contributed by Claudiu Popa +and Nick Coghlan in :issue:`18626`.) :func:`~inspect.unwrap` makes it easy to unravel wrapper function chains created by :func:`functools.wraps` (and any other API that sets the -``__wrapped__`` attribute on a wrapper function). (Contributed by -Daniel Urban, Aaron Iles and Nick Coghlan in :issue:`13266`) +``__wrapped__`` attribute on a wrapper function). (Contributed by +Daniel Urban, Aaron Iles and Nick Coghlan in :issue:`13266`.) As part of the implementation of the new :mod:`enum` module, the :mod:`inspect` module now has substantially better support for custom ``__dir__`` methods and dynamic class attributes provided through -metaclasses (Contributed by Ethan Furman in :issue:`18929` and -:issue:`19030`) +metaclasses. (Contributed by Ethan Furman in :issue:`18929` and +:issue:`19030`.) :func:`~inspect.getfullargspec` and :func:`~inspect.getargspec` now use the :func:`~inspect.signature` API. This allows them to @@ -1038,11 +1038,11 @@ attributes, and report the already bound first argument for bound methods, so it is still necessary to update your code to use :func:`~inspect.signature` directly if those features are desired. -(Contributed by Yury Selivanov in :issue:`17481`) +(Contributed by Yury Selivanov in :issue:`17481`.) :func:`~inspect.signature` now supports duck types of CPython functions, -which adds support for functions compiled with Cython. (Contributed -by Stefan Behnel and Yury Selivanov in :issue:`17159`) +which adds support for functions compiled with Cython. (Contributed +by Stefan Behnel and Yury Selivanov in :issue:`17159`.) ipaddress @@ -1082,7 +1082,7 @@ Logging configuration data received from a socket via the :func:`logging.config.listen` function can now be validated before being processed by supplying a verification function as the argument to the new -*verify* keyword argument. (Contributed by Vinay Sajip in :issue:`15452`.) +*verify* keyword argument. (Contributed by Vinay Sajip in :issue:`15452`.) .. _whatsnew-marshal-3: @@ -1120,7 +1120,7 @@ :func:`~multiprocessing.get_all_start_methods` reports all start methods available on the platform, :func:`~multiprocessing.get_start_method` reports the current start method, and :func:`~multiprocessing.set_start_method` sets -the start method. (Contributed by Richard Oudkerk in :issue:`8713`). +the start method. (Contributed by Richard Oudkerk in :issue:`8713`.) :mod:`multiprocessing` also now has the concept of a ``context``, which determines how child processes are created. New function @@ -1141,7 +1141,7 @@ when using the ``spawn`` or ``forkserver`` start methods. 
This resolves some edge cases where combining multiprocessing, the ``-m`` command line switch, and explicit relative imports could cause obscure failures in child -processes. (Contributed by Nick Coghlan in :issue:`19946`) +processes. (Contributed by Nick Coghlan in :issue:`19946`.) operator @@ -1176,7 +1176,7 @@ Windows). (Contributed by Brian Curtin in :issue:`11939`.) :func:`os.path.ismount` now recognizes volumes mounted below a drive -root on Windows. (Contributed by Tim Golden in :issue:`9035`.) +root on Windows. (Contributed by Tim Golden in :issue:`9035`.) :func:`os.open` supports two new flags on platforms that provide them, :data:`~os.O_PATH` (un-opened file descriptor), and :data:`~os.O_TMPFILE` @@ -1230,7 +1230,7 @@ functions. (The older API is now deprecated.) In addition to the already supported XML plist format (:data:`~plistlib.FMT_XML`), it also now supports the binary plist format (:data:`~plistlib.FMT_BINARY`). (Contributed by Ronald -Oussoren and others in :issue:`14455`). +Oussoren and others in :issue:`14455`.) poplib @@ -1254,7 +1254,7 @@ (Contributed by Serhiy Storchaka in :issue:`19132`.) Long strings are now wrapped using Python's normal line continuation -syntax. (Contributed by Antoine Pitrou in :issue:`17150`). +syntax. (Contributed by Antoine Pitrou in :issue:`17150`.) pty @@ -1270,13 +1270,13 @@ The :mod:`pydoc` module is now based directly on the :func:`inspect.signature` introspection API, allowing it to provide signature information for a wider variety of callable objects. This change also means that ``__wrapped__`` -attributes are now taken into account when displaying help information -(Contributed by Larry Hastings in :issue:`19674`) +attributes are now taken into account when displaying help information. +(Contributed by Larry Hastings in :issue:`19674`.) The :mod:`pydoc` module no longer displays the ``self`` parameter for already bound methods. Instead, it aims to always display the exact current -signature of the supplied callable (Contributed by Larry Hastings in -:issue:`20710`) +signature of the supplied callable. (Contributed by Larry Hastings in +:issue:`20710`.) In addition to the changes that have been made to :mod:`pydoc` directly, its handling of custom ``__dir__`` methods and various descriptor @@ -1372,7 +1372,7 @@ :exc:`~smtplib.SMTPException` is now a subclass of :exc:`OSError`, which allows both socket level errors and SMTP protocol level errors to be caught in one try/except statement by code that only cares whether or not an error occurred. -(Contributed by Ned Jackson Lovely in :issue:`2118`). +(Contributed by Ned Jackson Lovely in :issue:`2118`.) socket @@ -1412,7 +1412,7 @@ :data:`~ssl.PROTOCOL_TLSv1_1` and :data:`~ssl.PROTOCOL_TLSv1_2` (TLSv1.1 and TLSv1.2 support) have been added; support for these protocols is only available if Python is linked with OpenSSL 1.0.1 or later. (Contributed by Michele Orr? and -Antoine Pitrou in :issue:`16692`) +Antoine Pitrou in :issue:`16692`.) .. _whatsnew34-sslcontext: @@ -1596,7 +1596,7 @@ A new :func:`traceback.clear_frames` function takes a traceback object and clears the local variables in all of the frames it references, reducing the amount of memory consumed. (Contributed by Andrew Kuchling in -:issue:`1565525`). +:issue:`1565525`.) types @@ -1619,7 +1619,7 @@ The http method that will be used by a :class:`~urllib.request.Request` class can now be specified by setting a :class:`~urllib.request.Request.method` -class attribute on the subclass. 
(Contributed by Jason R Coombs in +class attribute on the subclass. (Contributed by Jason R Coombs in :issue:`18978`.) :class:`~urllib.request.Request` objects are now reusable: if the @@ -1701,14 +1701,14 @@ :issue:`17015`.) :func:`~mock.mock_open` objects now have ``readline`` and ``readlines`` -methods. (Contributed by Toshio Kuratomi in :issue:`17467`.) +methods. (Contributed by Toshio Kuratomi in :issue:`17467`.) venv ---- :mod:`venv` now includes activation scripts for the ``csh`` and ``fish`` -shells (Contributed by Andrew Svetlov in :issue:`15417`.) +shells. (Contributed by Andrew Svetlov in :issue:`15417`.) :class:`~venv.EnvBuilder` and the :func:`~venv.create` convenience function take a new keyword argument *with_pip*, which defaults to ``False``, that @@ -1739,12 +1739,12 @@ ------- New :class:`~weakref.WeakMethod` class simulates weak references to bound -methods. (Contributed by Antoine Pitrou in :issue:`14631`.) +methods. (Contributed by Antoine Pitrou in :issue:`14631`.) New :class:`~weakref.finalize` class makes it possible to register a callback to be invoked when an object is garbage collected, without needing to -carefully manage the lifecycle of the weak reference itself. (Contributed by -Richard Oudkerk in :issue:`15528`) +carefully manage the lifecycle of the weak reference itself. (Contributed by +Richard Oudkerk in :issue:`15528`.) The callback, if any, associated with a :class:`~weakref.ref` is now exposed via the :attr:`~weakref.ref.__callback__` attribute. (Contributed @@ -1879,16 +1879,16 @@ * The new :c:func:`PyType_GetSlot` function has been added to the stable ABI, allowing retrieval of function pointers from named type slots when using - the limited API. (Contributed by Martin von L?wis in :issue:`17162`) + the limited API. (Contributed by Martin von L?wis in :issue:`17162`.) * The new :c:func:`Py_SetStandardStreamEncoding` pre-initialization API allows applications embedding the CPython interpreter to reliably force - a particular encoding and error handler for the standard streams - (Contributed by Bastien Montagne and Nick Coghlan in :issue:`16129`) + a particular encoding and error handler for the standard streams. + (Contributed by Bastien Montagne and Nick Coghlan in :issue:`16129`.) * Most Python C APIs that don't mutate string arguments are now correctly - marked as accepting ``const char *`` rather than ``char *`` (Contributed - by Serhiy Storchaka in :issue:`1772673`). + marked as accepting ``const char *`` rather than ``char *``. (Contributed + by Serhiy Storchaka in :issue:`1772673`.) * A new shell version of ``python-config`` can be used even when a python interpreter is not available (for example, in cross compilation scenarios). @@ -1958,7 +1958,7 @@ * The ``-R`` option to the :ref:`python regression test suite ` now also checks for memory allocation leaks, using :func:`sys.getallocatedblocks()`. (Contributed by Antoine Pitrou in - :issue:`13390`). + :issue:`13390`.) * ``python -m`` now works with namespace packages. @@ -2021,14 +2021,14 @@ longer imported by default. The marshal module has been improved to load compiled Python code faster. (Contributed by Antoine Pitrou, Christian Heimes and Victor Stinner in :issue:`19219`, :issue:`19218`, :issue:`19209`, - :issue:`19205` and :issue:`9548`) + :issue:`19205` and :issue:`9548`.) * :class:`bz2.BZ2File` is now as fast or faster than the Python2 version for most cases. :class:`lzma.LZMAFile` has also been optimized. (Contributed by Serhiy Storchaka and Nadeem Vawda in :issue:`16034`.) 
* :func:`random.getrandbits` is 20%-40% faster for small integers (the most - common use case). (Contributed by Serhiy Storchaka in :issue:`16674`). + common use case). (Contributed by Serhiy Storchaka in :issue:`16674`.) * By taking advantage of the new storage format for strings, pickling of strings is now significantly faster. (Contributed by Victor Stinner and @@ -2048,7 +2048,7 @@ * :func:`os.urandom` now uses a lazily-opened persistent file descriptor so as to avoid using many file descriptors when run in parallel from - multiple threads. (Contributed by Antoine Pitrou in :issue:`18756`.) + multiple threads. (Contributed by Antoine Pitrou in :issue:`18756`.) .. _deprecated-3.4: @@ -2246,7 +2246,7 @@ * The [X refs, Y blocks] output of a debug (``--with-pydebug``) build of the CPython interpreter is now off by default. It can be re-enabled using the - ``-X showrefcount`` option. (Contributed by Ezio Melotti in :issue:`17323`.) + ``-X showrefcount`` option. (Contributed by Ezio Melotti in :issue:`17323`.) * The python command and most stdlib scripts (as well as :mod:`argparse`) now output ``--version`` information to ``stdout`` instead of ``stderr`` (for @@ -2395,8 +2395,8 @@ storage). (:issue:`17094`.) * Parameter names in ``__annotations__`` dicts are now mangled properly, - similarly to ``__kwdefaults__``. (Contributed by Yury Selivanov in - :issue:`20625`). + similarly to ``__kwdefaults__``. (Contributed by Yury Selivanov in + :issue:`20625`.) * :attr:`hashlib.hash.name` now always returns the identifier in lower case. Previously some builtin hashes had uppercase names, but now that it is a -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:34:14 2014 From: python-checkins at python.org (r.david.murray) Date: Sun, 02 Nov 2014 17:34:14 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Fix_English_ph?= =?utf-8?q?rasing=2E?= Message-ID: <20141102173359.120726.12716@psf.io> https://hg.python.org/cpython/rev/1cafcc11e719 changeset: 93356:1cafcc11e719 branch: 3.4 parent: 93353:a5dd8e89d4da user: R David Murray date: Sun Nov 02 12:31:47 2014 -0500 summary: Fix English phrasing. files: Doc/library/asyncio-protocol.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/asyncio-protocol.rst b/Doc/library/asyncio-protocol.rst --- a/Doc/library/asyncio-protocol.rst +++ b/Doc/library/asyncio-protocol.rst @@ -439,7 +439,7 @@ ------------------------ Coroutines can be scheduled in a protocol method using :func:`async`, but there -is not guarantee on the execution order. Protocols are not aware of coroutines +is no guarantee made about the execution order. Protocols are not aware of coroutines created in protocol methods and so will not wait for them. To have a reliable execution order, use :ref:`stream objects ` in a -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:34:14 2014 From: python-checkins at python.org (r.david.murray) Date: Sun, 02 Nov 2014 17:34:14 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_asyncio_doc_English_phrasing_fix=2E?= Message-ID: <20141102173359.35246.5785@psf.io> https://hg.python.org/cpython/rev/b2a57fe50712 changeset: 93358:b2a57fe50712 parent: 93355:769a217764f2 parent: 93357:4924b0ce72c0 user: R David Murray date: Sun Nov 02 12:33:37 2014 -0500 summary: Merge asyncio doc English phrasing fix. 
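The doc change in this patch clarifies that coroutines scheduled from protocol methods with :func:`async` run in no guaranteed order; the reliable alternative it points to is stream objects driven from a coroutine with ``yield from``. A minimal sketch of that pattern, assuming a simple echo server (the handler and port below are illustrative, not part of the patch)::

    import asyncio

    @asyncio.coroutine
    def handle_echo(reader, writer):
        # Stream objects used from a coroutine give a well-defined order:
        data = yield from reader.read(100)
        writer.write(data)
        yield from writer.drain()   # wait until the data is actually flushed
        writer.close()

    loop = asyncio.get_event_loop()
    server = loop.run_until_complete(
        asyncio.start_server(handle_echo, '127.0.0.1', 8888, loop=loop))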
files: Doc/library/asyncio-protocol.rst | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Doc/library/asyncio-protocol.rst b/Doc/library/asyncio-protocol.rst --- a/Doc/library/asyncio-protocol.rst +++ b/Doc/library/asyncio-protocol.rst @@ -439,8 +439,8 @@ ------------------------ Coroutines can be scheduled in a protocol method using :func:`async`, but there -is not guarantee on the execution order. Protocols are not aware of coroutines -created in protocol methods and so will not wait for them. +is no guarantee made about the execution order. Protocols are not aware of +coroutines created in protocol methods and so will not wait for them. To have a reliable execution order, use :ref:`stream objects ` in a coroutine with ``yield from``. For example, the :meth:`StreamWriter.drain` -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:34:14 2014 From: python-checkins at python.org (r.david.murray) Date: Sun, 02 Nov 2014 17:34:14 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Reflow_paragra?= =?utf-8?b?cGgu?= Message-ID: <20141102173359.35274.93079@psf.io> https://hg.python.org/cpython/rev/4924b0ce72c0 changeset: 93357:4924b0ce72c0 branch: 3.4 user: R David Murray date: Sun Nov 02 12:32:26 2014 -0500 summary: Reflow paragraph. files: Doc/library/asyncio-protocol.rst | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Doc/library/asyncio-protocol.rst b/Doc/library/asyncio-protocol.rst --- a/Doc/library/asyncio-protocol.rst +++ b/Doc/library/asyncio-protocol.rst @@ -439,8 +439,8 @@ ------------------------ Coroutines can be scheduled in a protocol method using :func:`async`, but there -is no guarantee made about the execution order. Protocols are not aware of coroutines -created in protocol methods and so will not wait for them. +is no guarantee made about the execution order. Protocols are not aware of +coroutines created in protocol methods and so will not wait for them. To have a reliable execution order, use :ref:`stream objects ` in a coroutine with ``yield from``. 
For example, the :meth:`StreamWriter.drain` -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:42:53 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 02 Nov 2014 17:42:53 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_default_-=3E_default?= =?utf-8?q?=29=3A_Merge_heads?= Message-ID: <20141102174253.120720.70057@psf.io> https://hg.python.org/cpython/rev/7e89c24245ea changeset: 93362:7e89c24245ea parent: 93361:f0b334ae95c9 parent: 93359:016bc54999a2 user: Antoine Pitrou date: Sun Nov 02 18:42:41 2014 +0100 summary: Merge heads files: Lib/test/test_urllib.py | 6 +++++- 1 files changed, 5 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_urllib.py b/Lib/test/test_urllib.py --- a/Lib/test/test_urllib.py +++ b/Lib/test/test_urllib.py @@ -10,7 +10,10 @@ from unittest.mock import patch from test import support import os -import ssl +try: + import ssl +except ImportError: + ssl = None import sys import tempfile from nturl2path import url2pathname, pathname2url @@ -380,6 +383,7 @@ with support.check_warnings(('',DeprecationWarning)): urllib.request.URLopener() + @unittest.skipUnless(ssl, "ssl module required") def test_cafile_and_context(self): context = ssl.create_default_context() with self.assertRaises(ValueError): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:42:53 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 02 Nov 2014 17:42:53 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Fix_test=5Furllib_without_?= =?utf-8?q?the_ssl_module?= Message-ID: <20141102174252.35262.90121@psf.io> https://hg.python.org/cpython/rev/016bc54999a2 changeset: 93359:016bc54999a2 parent: 93347:64a54f0c87d7 user: Antoine Pitrou date: Sun Nov 02 17:23:14 2014 +0100 summary: Fix test_urllib without the ssl module files: Lib/test/test_urllib.py | 6 +++++- 1 files changed, 5 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_urllib.py b/Lib/test/test_urllib.py --- a/Lib/test/test_urllib.py +++ b/Lib/test/test_urllib.py @@ -10,7 +10,10 @@ from unittest.mock import patch from test import support import os -import ssl +try: + import ssl +except ImportError: + ssl = None import sys import tempfile from nturl2path import url2pathname, pathname2url @@ -380,6 +383,7 @@ with support.check_warnings(('',DeprecationWarning)): urllib.request.URLopener() + @unittest.skipUnless(ssl, "ssl module required") def test_cafile_and_context(self): context = ssl.create_default_context() with self.assertRaises(ValueError): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:42:53 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 02 Nov 2014 17:42:53 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyMzM1?= =?utf-8?q?=3A_Fix_crash_when_trying_to_enlarge_a_bytearray_to_0x7fffffff_?= =?utf-8?q?bytes?= Message-ID: <20141102174252.35272.29008@psf.io> https://hg.python.org/cpython/rev/1590c594550e changeset: 93360:1590c594550e branch: 3.4 parent: 93357:4924b0ce72c0 user: Antoine Pitrou date: Sun Nov 02 18:40:09 2014 +0100 summary: Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff bytes on a 32-bit platform. 
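The patch below switches the size computations in ``PyByteArray_Resize`` to unsigned arithmetic and raises :exc:`MemoryError` once the padded allocation would exceed ``PY_SSIZE_T_MAX``, instead of letting the overflow corrupt the allocation size. A minimal sketch of what the new regression test exercises, assuming a build with enough address space to even attempt the allocation::

    import sys

    size = sys.maxsize        # PY_SSIZE_T_MAX; 0x7fffffff on a 32-bit build
    try:
        # Should either succeed or fail cleanly (e.g. on debug builds with
        # extra malloc() overhead), but must never crash the interpreter.
        bytearray(size - 4)
    except (OverflowError, MemoryError):
        pass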
files: Lib/test/test_bytes.py | 13 +++++++++++++ Misc/NEWS | 3 +++ Objects/bytearrayobject.c | 23 +++++++++++++++-------- Objects/obmalloc.c | 8 ++++---- 4 files changed, 35 insertions(+), 12 deletions(-) diff --git a/Lib/test/test_bytes.py b/Lib/test/test_bytes.py --- a/Lib/test/test_bytes.py +++ b/Lib/test/test_bytes.py @@ -13,9 +13,11 @@ import pickle import tempfile import unittest + import test.support import test.string_tests import test.buffer_tests +from test.support import bigaddrspacetest, MAX_Py_ssize_t if sys.flags.bytes_warning: @@ -111,6 +113,17 @@ self.assertRaises(ValueError, self.type2test, [sys.maxsize+1]) self.assertRaises(ValueError, self.type2test, [10**100]) + @bigaddrspacetest + def test_constructor_overflow(self): + size = MAX_Py_ssize_t + self.assertRaises((OverflowError, MemoryError), self.type2test, size) + try: + # Should either pass or raise an error (e.g. on debug builds with + # additional malloc() overhead), but shouldn't crash. + bytearray(size - 4) + except (OverflowError, MemoryError): + pass + def test_compare(self): b1 = self.type2test([1, 2, 3]) b2 = self.type2test([1, 2, 3]) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -11,6 +11,9 @@ Core and Builtins ----------------- +- Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff + bytes on a 32-bit platform. + - Issue #22653: Fix an assertion failure in debug mode when doing a reentrant dict insertion in debug mode. diff --git a/Objects/bytearrayobject.c b/Objects/bytearrayobject.c --- a/Objects/bytearrayobject.c +++ b/Objects/bytearrayobject.c @@ -175,20 +175,22 @@ } int -PyByteArray_Resize(PyObject *self, Py_ssize_t size) +PyByteArray_Resize(PyObject *self, Py_ssize_t requested_size) { void *sval; PyByteArrayObject *obj = ((PyByteArrayObject *)self); - Py_ssize_t alloc = obj->ob_alloc; - Py_ssize_t logical_offset = obj->ob_start - obj->ob_bytes; + /* All computations are done unsigned to avoid integer overflows + (see issue #22335). 
*/ + size_t alloc = (size_t) obj->ob_alloc; + size_t logical_offset = (size_t) (obj->ob_start - obj->ob_bytes); + size_t size = (size_t) requested_size; assert(self != NULL); assert(PyByteArray_Check(self)); - assert(size >= 0); - assert(logical_offset >= 0); assert(logical_offset <= alloc); - - if (size == Py_SIZE(self)) { + assert(requested_size >= 0); + + if (requested_size == Py_SIZE(self)) { return 0; } if (!_canresize(obj)) { @@ -220,6 +222,10 @@ alloc = size + 1; } } + if (alloc > PY_SSIZE_T_MAX) { + PyErr_NoMemory(); + return -1; + } if (logical_offset > 0) { sval = PyObject_Malloc(alloc); @@ -227,7 +233,8 @@ PyErr_NoMemory(); return -1; } - memcpy(sval, PyByteArray_AS_STRING(self), Py_MIN(size, Py_SIZE(self))); + memcpy(sval, PyByteArray_AS_STRING(self), + Py_MIN(requested_size, Py_SIZE(self))); PyObject_Free(obj->ob_bytes); } else { diff --git a/Objects/obmalloc.c b/Objects/obmalloc.c --- a/Objects/obmalloc.c +++ b/Objects/obmalloc.c @@ -1754,8 +1754,8 @@ bumpserialno(); total = nbytes + 4*SST; - if (total < nbytes) - /* overflow: can't represent total as a size_t */ + if (nbytes > PY_SSIZE_T_MAX - 4*SST) + /* overflow: can't represent total as a Py_ssize_t */ return NULL; p = (uchar *)api->alloc.malloc(api->alloc.ctx, total); @@ -1817,8 +1817,8 @@ bumpserialno(); original_nbytes = read_size_t(q - 2*SST); total = nbytes + 4*SST; - if (total < nbytes) - /* overflow: can't represent total as a size_t */ + if (nbytes > PY_SSIZE_T_MAX - 4*SST) + /* overflow: can't represent total as a Py_ssize_t */ return NULL; /* Resize and add decorations. We may get a new pointer here, in which -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 18:42:53 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 02 Nov 2014 17:42:53 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322335=3A_Fix_crash_when_trying_to_enlarge_a_byt?= =?utf-8?q?earray_to_0x7fffffff_bytes?= Message-ID: <20141102174252.111422.12155@psf.io> https://hg.python.org/cpython/rev/f0b334ae95c9 changeset: 93361:f0b334ae95c9 parent: 93358:b2a57fe50712 parent: 93360:1590c594550e user: Antoine Pitrou date: Sun Nov 02 18:41:56 2014 +0100 summary: Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff bytes on a 32-bit platform. files: Lib/test/test_bytes.py | 13 +++++++++++++ Misc/NEWS | 3 +++ Objects/bytearrayobject.c | 23 +++++++++++++++-------- Objects/obmalloc.c | 8 ++++---- 4 files changed, 35 insertions(+), 12 deletions(-) diff --git a/Lib/test/test_bytes.py b/Lib/test/test_bytes.py --- a/Lib/test/test_bytes.py +++ b/Lib/test/test_bytes.py @@ -13,9 +13,11 @@ import pickle import tempfile import unittest + import test.support import test.string_tests import test.buffer_tests +from test.support import bigaddrspacetest, MAX_Py_ssize_t if sys.flags.bytes_warning: @@ -111,6 +113,17 @@ self.assertRaises(ValueError, self.type2test, [sys.maxsize+1]) self.assertRaises(ValueError, self.type2test, [10**100]) + @bigaddrspacetest + def test_constructor_overflow(self): + size = MAX_Py_ssize_t + self.assertRaises((OverflowError, MemoryError), self.type2test, size) + try: + # Should either pass or raise an error (e.g. on debug builds with + # additional malloc() overhead), but shouldn't crash. 
+ bytearray(size - 4) + except (OverflowError, MemoryError): + pass + def test_compare(self): b1 = self.type2test([1, 2, 3]) b2 = self.type2test([1, 2, 3]) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,6 +10,9 @@ Core and Builtins ----------------- +- Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff + bytes on a 32-bit platform. + - Issue #22653: Fix an assertion failure in debug mode when doing a reentrant dict insertion in debug mode. diff --git a/Objects/bytearrayobject.c b/Objects/bytearrayobject.c --- a/Objects/bytearrayobject.c +++ b/Objects/bytearrayobject.c @@ -180,20 +180,22 @@ } int -PyByteArray_Resize(PyObject *self, Py_ssize_t size) +PyByteArray_Resize(PyObject *self, Py_ssize_t requested_size) { void *sval; PyByteArrayObject *obj = ((PyByteArrayObject *)self); - Py_ssize_t alloc = obj->ob_alloc; - Py_ssize_t logical_offset = obj->ob_start - obj->ob_bytes; + /* All computations are done unsigned to avoid integer overflows + (see issue #22335). */ + size_t alloc = (size_t) obj->ob_alloc; + size_t logical_offset = (size_t) (obj->ob_start - obj->ob_bytes); + size_t size = (size_t) requested_size; assert(self != NULL); assert(PyByteArray_Check(self)); - assert(size >= 0); - assert(logical_offset >= 0); assert(logical_offset <= alloc); - - if (size == Py_SIZE(self)) { + assert(requested_size >= 0); + + if (requested_size == Py_SIZE(self)) { return 0; } if (!_canresize(obj)) { @@ -225,6 +227,10 @@ alloc = size + 1; } } + if (alloc > PY_SSIZE_T_MAX) { + PyErr_NoMemory(); + return -1; + } if (logical_offset > 0) { sval = PyObject_Malloc(alloc); @@ -232,7 +238,8 @@ PyErr_NoMemory(); return -1; } - memcpy(sval, PyByteArray_AS_STRING(self), Py_MIN(size, Py_SIZE(self))); + memcpy(sval, PyByteArray_AS_STRING(self), + Py_MIN(requested_size, Py_SIZE(self))); PyObject_Free(obj->ob_bytes); } else { diff --git a/Objects/obmalloc.c b/Objects/obmalloc.c --- a/Objects/obmalloc.c +++ b/Objects/obmalloc.c @@ -1828,8 +1828,8 @@ bumpserialno(); total = nbytes + 4*SST; - if (total < nbytes) - /* overflow: can't represent total as a size_t */ + if (nbytes > PY_SSIZE_T_MAX - 4*SST) + /* overflow: can't represent total as a Py_ssize_t */ return NULL; if (use_calloc) @@ -1909,8 +1909,8 @@ bumpserialno(); original_nbytes = read_size_t(q - 2*SST); total = nbytes + 4*SST; - if (total < nbytes) - /* overflow: can't represent total as a size_t */ + if (nbytes > PY_SSIZE_T_MAX - 4*SST) + /* overflow: can't represent total as a Py_ssize_t */ return NULL; /* Resize and add decorations. We may get a new pointer here, in which -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 19:19:24 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 02 Nov 2014 18:19:24 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141102181920.109262.53974@psf.io> https://hg.python.org/cpython/rev/21b4356ffc06 changeset: 93365:21b4356ffc06 parent: 93362:7e89c24245ea parent: 93364:c51d85cf57f2 user: Benjamin Peterson date: Sun Nov 02 13:19:15 2014 -0500 summary: merge 3.4 files: Doc/library/urllib.request.rst | 5 +++-- 1 files changed, 3 insertions(+), 2 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -48,8 +48,8 @@ only works for HTTP, HTTPS and FTP connections. 
If *context* is specified, it must be a :class:`ssl.SSLContext` instance - describing the various SSL options. See - :class:`~http.client.HTTPSConnection` for more details. + describing the various SSL options. See :class:`~http.client.HTTPSConnection` + for more details. The optional *cafile* and *capath* parameters specify a set of trusted CA certificates for HTTPS requests. *cafile* should point to a single @@ -118,6 +118,7 @@ .. versionchanged:: 3.5 *context* was added. + .. function:: install_opener(opener) Install an :class:`OpenerDirector` instance as the default global opener. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 19:19:24 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 02 Nov 2014 18:19:24 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_wrap?= Message-ID: <20141102181920.35270.70983@psf.io> https://hg.python.org/cpython/rev/c51d85cf57f2 changeset: 93364:c51d85cf57f2 branch: 3.4 user: Benjamin Peterson date: Sun Nov 02 13:17:56 2014 -0500 summary: wrap files: Doc/library/urllib.request.rst | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -48,8 +48,8 @@ only works for HTTP, HTTPS and FTP connections. If *context* is specified, it must be a :class:`ssl.SSLContext` instance - describing the various SSL options. See - :class:`~http.client.HTTPSConnection` for more details. + describing the various SSL options. See :class:`~http.client.HTTPSConnection` + for more details. The optional *cafile* and *capath* parameters specify a set of trusted CA certificates for HTTPS requests. *cafile* should point to a single -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 19:19:24 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 02 Nov 2014 18:19:24 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_backport_conte?= =?utf-8?q?xt_argument_of_urlopen_=28=2322366=29_for_pep_476?= Message-ID: <20141102181920.35260.9219@psf.io> https://hg.python.org/cpython/rev/13f46fc1a002 changeset: 93363:13f46fc1a002 branch: 3.4 parent: 93360:1590c594550e user: Senthil Kumaran date: Fri Sep 19 15:23:30 2014 +0800 summary: backport context argument of urlopen (#22366) for pep 476 files: Doc/library/urllib.request.rst | 9 ++++++++- Lib/test/test_urllib.py | 8 ++++++++ Lib/urllib/request.py | 10 +++++++++- Misc/NEWS | 4 ++++ 4 files changed, 29 insertions(+), 2 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -16,7 +16,7 @@ The :mod:`urllib.request` module defines the following functions: -.. function:: urlopen(url, data=None[, timeout], *, cafile=None, capath=None, cadefault=False) +.. function:: urlopen(url, data=None[, timeout], *, cafile=None, capath=None, cadefault=False, context=None) Open the URL *url*, which can be either a string or a :class:`Request` object. @@ -47,6 +47,10 @@ the global default timeout setting will be used). This actually only works for HTTP, HTTPS and FTP connections. + If *context* is specified, it must be a :class:`ssl.SSLContext` instance + describing the various SSL options. See + :class:`~http.client.HTTPSConnection` for more details. 
+ The optional *cafile* and *capath* parameters specify a set of trusted CA certificates for HTTPS requests. *cafile* should point to a single file containing a bundle of CA certificates, whereas *capath* should @@ -111,6 +115,9 @@ .. versionchanged:: 3.3 *cadefault* was added. + .. versionchanged:: 3.4.3 + *context* was added. + .. function:: install_opener(opener) Install an :class:`OpenerDirector` instance as the default global opener. diff --git a/Lib/test/test_urllib.py b/Lib/test/test_urllib.py --- a/Lib/test/test_urllib.py +++ b/Lib/test/test_urllib.py @@ -10,6 +10,7 @@ from unittest.mock import patch from test import support import os +import ssl import sys import tempfile from nturl2path import url2pathname, pathname2url @@ -379,6 +380,13 @@ with support.check_warnings(('',DeprecationWarning)): urllib.request.URLopener() + def test_cafile_and_context(self): + context = ssl.create_default_context() + with self.assertRaises(ValueError): + urllib.request.urlopen( + "https://localhost", cafile="/nonexistent/path", context=context + ) + class urlopen_DataTests(unittest.TestCase): """Test urlopen() opening a data URL.""" diff --git a/Lib/urllib/request.py b/Lib/urllib/request.py --- a/Lib/urllib/request.py +++ b/Lib/urllib/request.py @@ -136,9 +136,14 @@ _opener = None def urlopen(url, data=None, timeout=socket._GLOBAL_DEFAULT_TIMEOUT, - *, cafile=None, capath=None, cadefault=False): + *, cafile=None, capath=None, cadefault=False, context=None): global _opener if cafile or capath or cadefault: + if context is not None: + raise ValueError( + "You can't pass both context and any of cafile, capath, and " + "cadefault" + ) if not _have_ssl: raise ValueError('SSL support not available') context = ssl._create_stdlib_context(cert_reqs=ssl.CERT_REQUIRED, @@ -146,6 +151,9 @@ capath=capath) https_handler = HTTPSHandler(context=context, check_hostname=True) opener = build_opener(https_handler) + elif context: + https_handler = HTTPSHandler(context=context) + opener = build_opener(https_handler) elif _opener is None: _opener = opener = build_opener() else: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,10 @@ Library ------- +- Issue #22366: urllib.request.urlopen will accept a context object + (SSLContext) as an argument which will then used be for HTTPS connection. + Patch by Alex Gaynor. + - Issue #22776: Brought excluded code into the scope of a try block in SysLogHandler.emit(). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 21:22:45 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 20:22:45 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322775=3A_Fixed_unpickling_of_http=2Ecookies=2ES?= =?utf-8?q?impleCookie_with_protocol_2?= Message-ID: <20141102202244.101668.84743@psf.io> https://hg.python.org/cpython/rev/caa8f9248ab8 changeset: 93367:caa8f9248ab8 parent: 93365:21b4356ffc06 parent: 93366:7be6ef737aaf user: Serhiy Storchaka date: Sun Nov 02 22:19:56 2014 +0200 summary: Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 and above. Patch by Tim Graham. 
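The fix below makes ``__setitem__`` store an already-constructed :class:`Morsel` as-is instead of re-encoding it, which is what pickling at protocol 2 and above relies on when it restores the dictionary items. A short round-trip in the spirit of the new test::

    import pickle
    from http.cookies import SimpleCookie

    c = SimpleCookie()
    c.load('Customer="WILE_E_COYOTE"; Path=/acme; Version=1')

    for proto in range(pickle.HIGHEST_PROTOCOL + 1):
        c2 = pickle.loads(pickle.dumps(c, protocol=proto))
        assert c2.output() == c.output()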
files: Lib/http/cookies.py | 8 ++++++-- Lib/test/pickletester.py | 2 +- Lib/test/test_http_cookies.py | 15 ++++++++++++++- Misc/ACKS | 1 + Misc/NEWS | 3 +++ 5 files changed, 25 insertions(+), 4 deletions(-) diff --git a/Lib/http/cookies.py b/Lib/http/cookies.py --- a/Lib/http/cookies.py +++ b/Lib/http/cookies.py @@ -486,8 +486,12 @@ def __setitem__(self, key, value): """Dictionary style assignment.""" - rval, cval = self.value_encode(value) - self.__set(key, rval, cval) + if isinstance(value, Morsel): + # allow assignment of constructed Morsels (e.g. for pickling) + dict.__setitem__(self, key, value) + else: + rval, cval = self.value_encode(value) + self.__set(key, rval, cval) def output(self, attrs=None, header="Set-Cookie:", sep="\015\012"): """Return a string suitable for HTTP.""" diff --git a/Lib/test/pickletester.py b/Lib/test/pickletester.py --- a/Lib/test/pickletester.py +++ b/Lib/test/pickletester.py @@ -1284,7 +1284,7 @@ loaded = self.loads(DATA5) self.assertEqual(type(loaded), SimpleCookie) self.assertEqual(list(loaded.keys()), ["key"]) - self.assertEqual(loaded["key"].value, "Set-Cookie: key=value") + self.assertEqual(loaded["key"].value, "value") for (exc, data) in DATA7.items(): loaded = self.loads(data) diff --git a/Lib/test/test_http_cookies.py b/Lib/test/test_http_cookies.py --- a/Lib/test/test_http_cookies.py +++ b/Lib/test/test_http_cookies.py @@ -3,7 +3,7 @@ from test.support import run_unittest, run_doctest, check_warnings import unittest from http import cookies - +import pickle import warnings class CookieTests(unittest.TestCase): @@ -187,6 +187,19 @@ self.assertEqual(dict(C), {}) self.assertEqual(C.output(), '') + def test_pickle(self): + rawdata = 'Customer="WILE_E_COYOTE"; Path=/acme; Version=1' + expected_output = 'Set-Cookie: %s' % rawdata + + C = cookies.SimpleCookie() + C.load(rawdata) + self.assertEqual(C.output(), expected_output) + + for proto in range(pickle.HIGHEST_PROTOCOL + 1): + with self.subTest(proto=proto): + C1 = pickle.loads(pickle.dumps(C, protocol=proto)) + self.assertEqual(C1.output(), expected_output) + class MorselTests(unittest.TestCase): """Tests for the Morsel object.""" diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -496,6 +496,7 @@ Shelley Gooch David Goodger Hans de Graaff +Tim Graham Kim Gr?sman Nathaniel Gray Eddy De Greef diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 + and above. Patch by Tim Graham. + - Issue #22776: Brought excluded code into the scope of a try block in SysLogHandler.emit(). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 21:22:44 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 20:22:44 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNzc1?= =?utf-8?q?=3A_Fixed_unpickling_of_http=2Ecookies=2ESimpleCookie_with_prot?= =?utf-8?q?ocol_2?= Message-ID: <20141102202244.111412.63530@psf.io> https://hg.python.org/cpython/rev/7be6ef737aaf changeset: 93366:7be6ef737aaf branch: 3.4 parent: 93364:c51d85cf57f2 user: Serhiy Storchaka date: Sun Nov 02 22:18:25 2014 +0200 summary: Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 and above. Patch by Tim Graham. 
files: Lib/http/cookies.py | 8 ++++++-- Lib/test/pickletester.py | 2 +- Lib/test/test_http_cookies.py | 15 ++++++++++++++- Misc/ACKS | 1 + Misc/NEWS | 3 +++ 5 files changed, 25 insertions(+), 4 deletions(-) diff --git a/Lib/http/cookies.py b/Lib/http/cookies.py --- a/Lib/http/cookies.py +++ b/Lib/http/cookies.py @@ -486,8 +486,12 @@ def __setitem__(self, key, value): """Dictionary style assignment.""" - rval, cval = self.value_encode(value) - self.__set(key, rval, cval) + if isinstance(value, Morsel): + # allow assignment of constructed Morsels (e.g. for pickling) + dict.__setitem__(self, key, value) + else: + rval, cval = self.value_encode(value) + self.__set(key, rval, cval) def output(self, attrs=None, header="Set-Cookie:", sep="\015\012"): """Return a string suitable for HTTP.""" diff --git a/Lib/test/pickletester.py b/Lib/test/pickletester.py --- a/Lib/test/pickletester.py +++ b/Lib/test/pickletester.py @@ -1284,7 +1284,7 @@ loaded = self.loads(DATA5) self.assertEqual(type(loaded), SimpleCookie) self.assertEqual(list(loaded.keys()), ["key"]) - self.assertEqual(loaded["key"].value, "Set-Cookie: key=value") + self.assertEqual(loaded["key"].value, "value") for (exc, data) in DATA7.items(): loaded = self.loads(data) diff --git a/Lib/test/test_http_cookies.py b/Lib/test/test_http_cookies.py --- a/Lib/test/test_http_cookies.py +++ b/Lib/test/test_http_cookies.py @@ -3,7 +3,7 @@ from test.support import run_unittest, run_doctest, check_warnings import unittest from http import cookies - +import pickle import warnings class CookieTests(unittest.TestCase): @@ -187,6 +187,19 @@ self.assertEqual(dict(C), {}) self.assertEqual(C.output(), '') + def test_pickle(self): + rawdata = 'Customer="WILE_E_COYOTE"; Path=/acme; Version=1' + expected_output = 'Set-Cookie: %s' % rawdata + + C = cookies.SimpleCookie() + C.load(rawdata) + self.assertEqual(C.output(), expected_output) + + for proto in range(pickle.HIGHEST_PROTOCOL + 1): + with self.subTest(proto=proto): + C1 = pickle.loads(pickle.dumps(C, protocol=proto)) + self.assertEqual(C1.output(), expected_output) + class MorselTests(unittest.TestCase): """Tests for the Morsel object.""" diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -492,6 +492,7 @@ Shelley Gooch David Goodger Hans de Graaff +Tim Graham Nathaniel Gray Eddy De Greef Grant Griffin diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 + and above. Patch by Tim Graham. + - Issue #22366: urllib.request.urlopen will accept a context object (SSLContext) as an argument which will then used be for HTTPS connection. Patch by Alex Gaynor. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 2 21:37:48 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 02 Nov 2014 20:37:48 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNzc1?= =?utf-8?q?=3A_Fixed_unpickling_of_Cookie=2ESimpleCookie_with_protocol_2?= =?utf-8?q?=2E?= Message-ID: <20141102203747.120710.6007@psf.io> https://hg.python.org/cpython/rev/515331e0ca0c changeset: 93368:515331e0ca0c branch: 2.7 parent: 93349:16dfefe67c1f user: Serhiy Storchaka date: Sun Nov 02 22:35:47 2014 +0200 summary: Issue #22775: Fixed unpickling of Cookie.SimpleCookie with protocol 2. Patch by Tim Graham. 
files: Lib/Cookie.py | 8 ++++++-- Lib/test/test_cookie.py | 13 +++++++++++++ Misc/ACKS | 1 + Misc/NEWS | 3 +++ 4 files changed, 23 insertions(+), 2 deletions(-) diff --git a/Lib/Cookie.py b/Lib/Cookie.py --- a/Lib/Cookie.py +++ b/Lib/Cookie.py @@ -591,8 +591,12 @@ def __setitem__(self, key, value): """Dictionary style assignment.""" - rval, cval = self.value_encode(value) - self.__set(key, rval, cval) + if isinstance(value, Morsel): + # allow assignment of constructed Morsels (e.g. for pickling) + dict.__setitem__(self, key, value) + else: + rval, cval = self.value_encode(value) + self.__set(key, rval, cval) # end __setitem__ def output(self, attrs=None, header="Set-Cookie:", sep="\015\012"): diff --git a/Lib/test/test_cookie.py b/Lib/test/test_cookie.py --- a/Lib/test/test_cookie.py +++ b/Lib/test/test_cookie.py @@ -3,6 +3,7 @@ from test.test_support import run_unittest, run_doctest, check_warnings import unittest import Cookie +import pickle class CookieTests(unittest.TestCase): @@ -141,6 +142,18 @@ self.assertEqual(dict(C), {}) self.assertEqual(C.output(), '') + def test_pickle(self): + rawdata = 'Customer="WILE_E_COYOTE"; Path=/acme; Version=1' + expected_output = 'Set-Cookie: %s' % rawdata + + C = Cookie.SimpleCookie() + C.load(rawdata) + self.assertEqual(C.output(), expected_output) + + for proto in range(pickle.HIGHEST_PROTOCOL + 1): + C1 = pickle.loads(pickle.dumps(C, protocol=proto)) + self.assertEqual(C1.output(), expected_output) + def test_main(): run_unittest(CookieTests) diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -484,6 +484,7 @@ Shelley Gooch David Goodger Hans de Graaff +Tim Graham Nathaniel Gray Eddy De Greef Grant Griffin diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #22775: Fixed unpickling of Cookie.SimpleCookie with protocol 2. + Patch by Tim Graham. + - Issue #22776: Brought excluded code into the scope of a try block in SysLogHandler.emit(). -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Mon Nov 3 10:05:19 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Mon, 03 Nov 2014 10:05:19 +0100 Subject: [Python-checkins] Daily reference leaks (caa8f9248ab8): sum=3 Message-ID: results for caa8f9248ab8 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogM9fFaa', '-x'] From python-checkins at python.org Mon Nov 3 11:28:26 2014 From: python-checkins at python.org (georg.brandl) Date: Mon, 03 Nov 2014 10:28:26 +0000 Subject: [Python-checkins] =?utf-8?q?devguide=3A_Add_instruction_how_to_ac?= =?utf-8?q?tivate_python-gdb=2Epy?= Message-ID: <20141103102822.101690.49823@psf.io> https://hg.python.org/devguide/rev/4bf21e0cb078 changeset: 723:4bf21e0cb078 user: Georg Brandl date: Mon Nov 03 11:28:19 2014 +0100 summary: Add instruction how to activate python-gdb.py files: gdb.rst | 7 +++++++ 1 files changed, 7 insertions(+), 0 deletions(-) diff --git a/gdb.rst b/gdb.rst --- a/gdb.rst +++ b/gdb.rst @@ -23,6 +23,13 @@ root directory of your checkout. Read the module docstring for details on how to use the file to enhance gdb for easier debugging of a CPython process. +To activate support, you must add the directory containing ``python-gdb.py`` +to GDB's "auto-load-safe-path". 
Put this in your ``~/.gdbinit`` file:: + + add-auto-load-safe-path /path/to/checkout + +You can also add multiple paths, separated by ``:``. + This is what a backtrace looks like (truncated) when this extension is enabled:: -- Repository URL: https://hg.python.org/devguide From python-checkins at python.org Mon Nov 3 20:37:00 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 19:37:00 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI0MTcp?= Message-ID: <20141103193658.120736.55619@psf.io> https://hg.python.org/cpython/rev/731375f83406 changeset: 93370:731375f83406 parent: 93367:caa8f9248ab8 parent: 93369:2afe5413d7af user: Benjamin Peterson date: Mon Nov 03 14:36:48 2014 -0500 summary: merge 3.4 (#22417) files: Doc/library/http.client.rst | 12 ++-- Doc/library/urllib.request.rst | 5 - Doc/library/xmlrpc.client.rst | 7 +- Doc/whatsnew/3.4.rst | 29 ++++++++++ Lib/http/client.py | 2 +- Lib/ssl.py | 10 ++- Lib/test/test_httplib.py | 49 +++++++++++++--- Lib/test/test_logging.py | 55 ++++++------------ Lib/test/test_ssl.py | 7 +- Lib/test/test_urllib2_localnet.py | 6 +- Misc/NEWS | 2 + 11 files changed, 115 insertions(+), 69 deletions(-) diff --git a/Doc/library/http.client.rst b/Doc/library/http.client.rst --- a/Doc/library/http.client.rst +++ b/Doc/library/http.client.rst @@ -71,12 +71,6 @@ :func:`ssl.create_default_context` select the system's trusted CA certificates for you. - The recommended way to connect to HTTPS hosts on the Internet is as - follows:: - - context = ssl.create_default_context() - h = client.HTTPSConnection('www.python.org', 443, context=context) - Please read :ref:`ssl-security` for more information on best practices. .. note:: @@ -97,6 +91,12 @@ The *strict* parameter was removed. HTTP 0.9-style "Simple Responses" are no longer supported. + .. versionchanged:: 3.4.3 + This class now performs all the necessary certificate and hostname checks + by default. To revert to the previous, unverified, behavior + :func:`ssl._create_unverified_context` can be passed to the *context* + parameter. + .. class:: HTTPResponse(sock, debuglevel=0, method=None, url=None) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -62,11 +62,6 @@ *cafile* and *capath* parameters are omitted. This will only work on some non-Windows platforms. - .. warning:: - If neither *cafile* nor *capath* is specified, and *cadefault* is ``False``, - an HTTPS request will not do any verification of the server's - certificate. - For http and https urls, this function returns a :class:`http.client.HTTPResponse` object which has the following :ref:`httpresponse-objects` methods. diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -27,11 +27,10 @@ constructed data. If you need to parse untrusted or unauthenticated data see :ref:`xml-vulnerabilities`. -.. warning:: +.. versionchanged:: 3.4.3 - In the case of https URIs, :mod:`xmlrpc.client` does not do any verification - of the server's certificate. - + For https URIs, :mod:`xmlrpc.client` now performs all the necessary + certificate and hostname checks by default .. 
class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ diff --git a/Doc/whatsnew/3.4.rst b/Doc/whatsnew/3.4.rst --- a/Doc/whatsnew/3.4.rst +++ b/Doc/whatsnew/3.4.rst @@ -2504,3 +2504,32 @@ * The ``f_tstate`` (thread state) field of the :c:type:`PyFrameObject` structure has been removed to fix a bug: see :issue:`14432` for the rationale. + +Changed in 3.4.3 +================ + +.. _pep-476: + +PEP 476: Enabling certificate verification by default for stdlib http clients +----------------------------------------------------------------------------- + +:mod:`http.client` and modules which use it, such as :mod:`urllib.request` and +:mod:`xmlrpc.client`, will now verify that the server presents a certificate +which is signed by a CA in the platform trust store and whose hostname matches +the hostname being requested by default, significantly improving security for +many applications. + +For applications which require the old previous behavior, they can pass an +alternate context:: + + import urllib.request + import ssl + + # This disables all verification + context = ssl._create_unverified_context() + + # This allows using a specific certificate for the host, which doesn't need + # to be in the trust store + context = ssl.create_default_context(cafile="/path/to/file.crt") + + urllib.request.urlopen("https://invalid-cert", context=context) diff --git a/Lib/http/client.py b/Lib/http/client.py --- a/Lib/http/client.py +++ b/Lib/http/client.py @@ -1267,7 +1267,7 @@ self.key_file = key_file self.cert_file = cert_file if context is None: - context = ssl._create_stdlib_context() + context = ssl._create_default_https_context() will_verify = context.verify_mode != ssl.CERT_NONE if check_hostname is None: check_hostname = will_verify diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -436,8 +436,7 @@ context.load_default_certs(purpose) return context - -def _create_stdlib_context(protocol=PROTOCOL_SSLv23, *, cert_reqs=None, +def _create_unverified_context(protocol=PROTOCOL_SSLv23, *, cert_reqs=None, check_hostname=False, purpose=Purpose.SERVER_AUTH, certfile=None, keyfile=None, cafile=None, capath=None, cadata=None): @@ -478,6 +477,13 @@ return context +# Used by http.client if no context is explicitly passed. +_create_default_https_context = create_default_context + + +# Backwards compatibility alias, even though it's not a public name. 
+_create_stdlib_context = _create_unverified_context + class SSLObject: """This class implements an interface on top of a low-level SSL object as diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -1012,13 +1012,36 @@ self.assertIn('Apache', server_string) def test_networked(self): - # Default settings: no cert verification is done + # Default settings: requires a valid cert from a trusted CA + import ssl support.requires('network') - with support.transient_internet('svn.python.org'): - h = client.HTTPSConnection('svn.python.org', 443) + with support.transient_internet('self-signed.pythontest.net'): + h = client.HTTPSConnection('self-signed.pythontest.net', 443) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_networked_noverification(self): + # Switch off cert verification + import ssl + support.requires('network') + with support.transient_internet('self-signed.pythontest.net'): + context = ssl._create_unverified_context() + h = client.HTTPSConnection('self-signed.pythontest.net', 443, + context=context) h.request('GET', '/') resp = h.getresponse() - self._check_svn_python_org(resp) + self.assertIn('nginx', resp.getheader('server')) + + def test_networked_trusted_by_default_cert(self): + # Default settings: requires a valid cert from a trusted CA + support.requires('network') + with support.transient_internet('www.python.org'): + h = client.HTTPSConnection('www.python.org', 443) + h.request('GET', '/') + resp = h.getresponse() + content_type = resp.getheader('content-type') + self.assertIn('text/html', content_type) def test_networked_good_cert(self): # We feed a CA cert that validates the server's cert @@ -1037,13 +1060,23 @@ # We feed a "CA" cert that is unrelated to the server's cert import ssl support.requires('network') - with support.transient_internet('svn.python.org'): + with support.transient_internet('self-signed.pythontest.net'): context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.verify_mode = ssl.CERT_REQUIRED context.load_verify_locations(CERT_localhost) - h = client.HTTPSConnection('svn.python.org', 443, context=context) - with self.assertRaises(ssl.SSLError): + h = client.HTTPSConnection('self-signed.pythontest.net', 443, context=context) + with self.assertRaises(ssl.SSLError) as exc_info: h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_local_unknown_cert(self): + # The custom cert isn't known to the default trust bundle + import ssl + server = self.make_server(CERT_localhost) + h = client.HTTPSConnection('localhost', server.port) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') def test_local_good_hostname(self): # The (valid) cert validates the HTTP hostname @@ -1056,7 +1089,6 @@ h.request('GET', '/nonexistent') resp = h.getresponse() self.assertEqual(resp.status, 404) - del server def test_local_bad_hostname(self): # The (valid) cert doesn't validate the HTTP hostname @@ -1079,7 +1111,6 @@ h.request('GET', '/nonexistent') resp = h.getresponse() self.assertEqual(resp.status, 404) - del server @unittest.skipIf(not hasattr(client, 'HTTPSConnection'), 'http.client.HTTPSConnection not available') diff --git a/Lib/test/test_logging.py b/Lib/test/test_logging.py --- a/Lib/test/test_logging.py +++ b/Lib/test/test_logging.py 
@@ -1627,36 +1627,6 @@ class HTTPHandlerTest(BaseTest): """Test for HTTPHandler.""" - PEMFILE = """-----BEGIN RSA PRIVATE KEY----- -MIICXQIBAAKBgQDGT4xS5r91rbLJQK2nUDenBhBG6qFk+bVOjuAGC/LSHlAoBnvG -zQG3agOG+e7c5z2XT8m2ktORLqG3E4mYmbxgyhDrzP6ei2Anc+pszmnxPoK3Puh5 -aXV+XKt0bU0C1m2+ACmGGJ0t3P408art82nOxBw8ZHgIg9Dtp6xIUCyOqwIDAQAB -AoGBAJFTnFboaKh5eUrIzjmNrKsG44jEyy+vWvHN/FgSC4l103HxhmWiuL5Lv3f7 -0tMp1tX7D6xvHwIG9VWvyKb/Cq9rJsDibmDVIOslnOWeQhG+XwJyitR0pq/KlJIB -5LjORcBw795oKWOAi6RcOb1ON59tysEFYhAGQO9k6VL621gRAkEA/Gb+YXULLpbs -piXN3q4zcHzeaVANo69tUZ6TjaQqMeTxE4tOYM0G0ZoSeHEdaP59AOZGKXXNGSQy -2z/MddcYGQJBAMkjLSYIpOLJY11ja8OwwswFG2hEzHe0cS9bzo++R/jc1bHA5R0Y -i6vA5iPi+wopPFvpytdBol7UuEBe5xZrxWMCQQCWxELRHiP2yWpEeLJ3gGDzoXMN -PydWjhRju7Bx3AzkTtf+D6lawz1+eGTuEss5i0JKBkMEwvwnN2s1ce+EuF4JAkBb -E96h1lAzkVW5OAfYOPY8RCPA90ZO/hoyg7PpSxR0ECuDrgERR8gXIeYUYfejBkEa -rab4CfRoVJKKM28Yq/xZAkBvuq670JRCwOgfUTdww7WpdOQBYPkzQccsKNCslQW8 -/DyW6y06oQusSENUvynT6dr3LJxt/NgZPhZX2+k1eYDV ------END RSA PRIVATE KEY----- ------BEGIN CERTIFICATE----- -MIICGzCCAYSgAwIBAgIJAIq84a2Q/OvlMA0GCSqGSIb3DQEBBQUAMBQxEjAQBgNV -BAMTCWxvY2FsaG9zdDAeFw0xMTA1MjExMDIzMzNaFw03NTAzMjEwMzU1MTdaMBQx -EjAQBgNVBAMTCWxvY2FsaG9zdDCBnzANBgkqhkiG9w0BAQEFAAOBjQAwgYkCgYEA -xk+MUua/da2yyUCtp1A3pwYQRuqhZPm1To7gBgvy0h5QKAZ7xs0Bt2oDhvnu3Oc9 -l0/JtpLTkS6htxOJmJm8YMoQ68z+notgJ3PqbM5p8T6Ctz7oeWl1flyrdG1NAtZt -vgAphhidLdz+NPGq7fNpzsQcPGR4CIPQ7aesSFAsjqsCAwEAAaN1MHMwHQYDVR0O -BBYEFLWaUPO6N7efGiuoS9i3DVYcUwn0MEQGA1UdIwQ9MDuAFLWaUPO6N7efGiuo -S9i3DVYcUwn0oRikFjAUMRIwEAYDVQQDEwlsb2NhbGhvc3SCCQCKvOGtkPzr5TAM -BgNVHRMEBTADAQH/MA0GCSqGSIb3DQEBBQUAA4GBAMK5whPjLNQK1Ivvk88oqJqq -4f889OwikGP0eUhOBhbFlsZs+jq5YZC2UzHz+evzKBlgAP1u4lP/cB85CnjvWqM+ -1c/lywFHQ6HOdDeQ1L72tSYMrNOG4XNmLn0h7rx6GoTU7dcFRfseahBCq8mv0IDt -IRbTpvlHWPjsSvHz0ZOH ------END CERTIFICATE-----""" - def setUp(self): """Set up an HTTP server to receive log messages, and a HTTPHandler pointing to that server's address and port.""" @@ -1686,15 +1656,26 @@ if secure: try: import ssl - fd, fn = tempfile.mkstemp() - os.close(fd) - with open(fn, 'w') as f: - f.write(self.PEMFILE) - sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) - sslctx.load_cert_chain(fn) - os.unlink(fn) except ImportError: sslctx = None + else: + here = os.path.dirname(__file__) + localhost_cert = os.path.join(here, "keycert.pem") + sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) + sslctx.load_cert_chain(localhost_cert) + # Unfortunately, HTTPHandler doesn't allow us to change the + # SSLContext used by HTTPSConnection, so we have to + # monkeypatch. This can be cleaned up if issue 22788 is + # fixed. 
+ old = ssl._create_default_https_context + def restore_handler(): + ssl._create_default_https_context = old + self.addCleanup(restore_handler) + def hack_create_ctx(): + ctx = old() + ctx.load_verify_locations(localhost_cert) + return ctx + ssl._create_default_https_context = hack_create_ctx else: sslctx = None self.server = server = TestHTTPServer(addr, self.handle_request, diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -2582,9 +2582,10 @@ d1 = f.read() d2 = '' # now fetch the same data from the HTTPS server - url = 'https://%s:%d/%s' % ( - HOST, server.port, os.path.split(CERTFILE)[1]) - f = urllib.request.urlopen(url) + url = 'https://localhost:%d/%s' % ( + server.port, os.path.split(CERTFILE)[1]) + context = ssl.create_default_context(cafile=CERTFILE) + f = urllib.request.urlopen(url, context=context) try: dlen = f.info().get("content-length") if dlen and (int(dlen) > 0): diff --git a/Lib/test/test_urllib2_localnet.py b/Lib/test/test_urllib2_localnet.py --- a/Lib/test/test_urllib2_localnet.py +++ b/Lib/test/test_urllib2_localnet.py @@ -545,7 +545,8 @@ def test_https(self): handler = self.start_https_server() - data = self.urlopen("https://localhost:%s/bizarre" % handler.port) + context = ssl.create_default_context(cafile=CERT_localhost) + data = self.urlopen("https://localhost:%s/bizarre" % handler.port, context=context) self.assertEqual(data, b"we care a bit") def test_https_with_cafile(self): @@ -584,7 +585,8 @@ context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.set_servername_callback(cb_sni) handler = self.start_https_server(context=context, certfile=CERT_localhost) - self.urlopen("https://localhost:%s" % handler.port) + context = ssl.create_default_context(cafile=CERT_localhost) + self.urlopen("https://localhost:%s" % handler.port, context=context) self.assertEqual(sni_name, "localhost") def test_sending_headers(self): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,8 @@ Library ------- +- Issue #22417: Verify certificates by default in httplib (PEP 476). + - Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 and above. Patch by Tim Graham. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 20:37:08 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 19:37:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogUEVQIDQ3NjogZW5h?= =?utf-8?q?ble_HTTPS_certificate_verification_by_default_=28=2322417=29?= Message-ID: <20141103193654.35246.40303@psf.io> https://hg.python.org/cpython/rev/2afe5413d7af changeset: 93369:2afe5413d7af branch: 3.4 parent: 93366:7be6ef737aaf user: Benjamin Peterson date: Mon Nov 03 14:29:33 2014 -0500 summary: PEP 476: enable HTTPS certificate verification by default (#22417) Patch by Alex Gaynor with some modifications by me. 
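To make the effect of the change concrete, here is a small sketch of what client code now sees by default (it mirrors the new test_httplib tests, needs network access, and is an illustration rather than part of the patch):

    import ssl
    from http.client import HTTPSConnection

    conn = HTTPSConnection('self-signed.pythontest.net', 443)
    try:
        conn.request('GET', '/')
    except ssl.SSLError as exc:
        # The handshake now fails for an untrusted certificate instead of
        # silently skipping verification.
        print(exc.reason)  # 'CERTIFICATE_VERIFY_FAILED'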
files: Doc/library/http.client.rst | 12 ++-- Doc/library/urllib.request.rst | 5 - Doc/library/xmlrpc.client.rst | 7 +- Doc/whatsnew/3.4.rst | 29 ++++++++++ Lib/http/client.py | 2 +- Lib/ssl.py | 11 +++- Lib/test/test_httplib.py | 49 +++++++++++++--- Lib/test/test_logging.py | 55 ++++++------------ Lib/test/test_ssl.py | 7 +- Lib/test/test_urllib2_localnet.py | 6 +- Misc/NEWS | 2 + 11 files changed, 116 insertions(+), 69 deletions(-) diff --git a/Doc/library/http.client.rst b/Doc/library/http.client.rst --- a/Doc/library/http.client.rst +++ b/Doc/library/http.client.rst @@ -71,12 +71,6 @@ :func:`ssl.create_default_context` select the system's trusted CA certificates for you. - The recommended way to connect to HTTPS hosts on the Internet is as - follows:: - - context = ssl.create_default_context() - h = client.HTTPSConnection('www.python.org', 443, context=context) - Please read :ref:`ssl-security` for more information on best practices. .. note:: @@ -97,6 +91,12 @@ The *strict* parameter was removed. HTTP 0.9-style "Simple Responses" are no longer supported. + .. versionchanged:: 3.4.3 + This class now performs all the necessary certificate and hostname checks + by default. To revert to the previous, unverified, behavior + :func:`ssl._create_unverified_context` can be passed to the *context* + parameter. + .. class:: HTTPResponse(sock, debuglevel=0, method=None, url=None) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -62,11 +62,6 @@ *cafile* and *capath* parameters are omitted. This will only work on some non-Windows platforms. - .. warning:: - If neither *cafile* nor *capath* is specified, and *cadefault* is ``False``, - an HTTPS request will not do any verification of the server's - certificate. - For http and https urls, this function returns a :class:`http.client.HTTPResponse` object which has the following :ref:`httpresponse-objects` methods. diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -27,11 +27,10 @@ constructed data. If you need to parse untrusted or unauthenticated data see :ref:`xml-vulnerabilities`. -.. warning:: +.. versionchanged:: 3.4.3 - In the case of https URIs, :mod:`xmlrpc.client` does not do any verification - of the server's certificate. - + For https URIs, :mod:`xmlrpc.client` now performs all the necessary + certificate and hostname checks by default .. class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ diff --git a/Doc/whatsnew/3.4.rst b/Doc/whatsnew/3.4.rst --- a/Doc/whatsnew/3.4.rst +++ b/Doc/whatsnew/3.4.rst @@ -2504,3 +2504,32 @@ * The ``f_tstate`` (thread state) field of the :c:type:`PyFrameObject` structure has been removed to fix a bug: see :issue:`14432` for the rationale. + +Changed in 3.4.3 +================ + +.. _pep-476: + +PEP 476: Enabling certificate verification by default for stdlib http clients +----------------------------------------------------------------------------- + +:mod:`http.client` and modules which use it, such as :mod:`urllib.request` and +:mod:`xmlrpc.client`, will now verify that the server presents a certificate +which is signed by a CA in the platform trust store and whose hostname matches +the hostname being requested by default, significantly improving security for +many applications. 
+ +For applications which require the old previous behavior, they can pass an +alternate context:: + + import urllib.request + import ssl + + # This disables all verification + context = ssl._create_unverified_context() + + # This allows using a specific certificate for the host, which doesn't need + # to be in the trust store + context = ssl.create_default_context(cafile="/path/to/file.crt") + + urllib.request.urlopen("https://invalid-cert", context=context) diff --git a/Lib/http/client.py b/Lib/http/client.py --- a/Lib/http/client.py +++ b/Lib/http/client.py @@ -1203,7 +1203,7 @@ self.key_file = key_file self.cert_file = cert_file if context is None: - context = ssl._create_stdlib_context() + context = ssl._create_default_https_context() will_verify = context.verify_mode != ssl.CERT_NONE if check_hostname is None: check_hostname = will_verify diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -441,8 +441,7 @@ context.load_default_certs(purpose) return context - -def _create_stdlib_context(protocol=PROTOCOL_SSLv23, *, cert_reqs=None, +def _create_unverified_context(protocol=PROTOCOL_SSLv23, *, cert_reqs=None, check_hostname=False, purpose=Purpose.SERVER_AUTH, certfile=None, keyfile=None, cafile=None, capath=None, cadata=None): @@ -480,6 +479,14 @@ return context +# Used by http.client if no context is explicitly passed. +_create_default_https_context = create_default_context + + +# Backwards compatibility alias, even though it's not a public name. +_create_stdlib_context = _create_unverified_context + + class SSLSocket(socket): """This class implements a subtype of socket.socket that wraps the underlying OS socket in an SSL context when necessary, and diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -778,13 +778,36 @@ self.assertIn('Apache', server_string) def test_networked(self): - # Default settings: no cert verification is done + # Default settings: requires a valid cert from a trusted CA + import ssl support.requires('network') - with support.transient_internet('svn.python.org'): - h = client.HTTPSConnection('svn.python.org', 443) + with support.transient_internet('self-signed.pythontest.net'): + h = client.HTTPSConnection('self-signed.pythontest.net', 443) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_networked_noverification(self): + # Switch off cert verification + import ssl + support.requires('network') + with support.transient_internet('self-signed.pythontest.net'): + context = ssl._create_unverified_context() + h = client.HTTPSConnection('self-signed.pythontest.net', 443, + context=context) h.request('GET', '/') resp = h.getresponse() - self._check_svn_python_org(resp) + self.assertIn('nginx', resp.getheader('server')) + + def test_networked_trusted_by_default_cert(self): + # Default settings: requires a valid cert from a trusted CA + support.requires('network') + with support.transient_internet('www.python.org'): + h = client.HTTPSConnection('www.python.org', 443) + h.request('GET', '/') + resp = h.getresponse() + content_type = resp.getheader('content-type') + self.assertIn('text/html', content_type) def test_networked_good_cert(self): # We feed a CA cert that validates the server's cert @@ -803,13 +826,23 @@ # We feed a "CA" cert that is unrelated to the server's cert import ssl support.requires('network') - with 
support.transient_internet('svn.python.org'): + with support.transient_internet('self-signed.pythontest.net'): context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.verify_mode = ssl.CERT_REQUIRED context.load_verify_locations(CERT_localhost) - h = client.HTTPSConnection('svn.python.org', 443, context=context) - with self.assertRaises(ssl.SSLError): + h = client.HTTPSConnection('self-signed.pythontest.net', 443, context=context) + with self.assertRaises(ssl.SSLError) as exc_info: h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_local_unknown_cert(self): + # The custom cert isn't known to the default trust bundle + import ssl + server = self.make_server(CERT_localhost) + h = client.HTTPSConnection('localhost', server.port) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') def test_local_good_hostname(self): # The (valid) cert validates the HTTP hostname @@ -822,7 +855,6 @@ h.request('GET', '/nonexistent') resp = h.getresponse() self.assertEqual(resp.status, 404) - del server def test_local_bad_hostname(self): # The (valid) cert doesn't validate the HTTP hostname @@ -845,7 +877,6 @@ h.request('GET', '/nonexistent') resp = h.getresponse() self.assertEqual(resp.status, 404) - del server @unittest.skipIf(not hasattr(client, 'HTTPSConnection'), 'http.client.HTTPSConnection not available') diff --git a/Lib/test/test_logging.py b/Lib/test/test_logging.py --- a/Lib/test/test_logging.py +++ b/Lib/test/test_logging.py @@ -1631,36 +1631,6 @@ class HTTPHandlerTest(BaseTest): """Test for HTTPHandler.""" - PEMFILE = """-----BEGIN RSA PRIVATE KEY----- -MIICXQIBAAKBgQDGT4xS5r91rbLJQK2nUDenBhBG6qFk+bVOjuAGC/LSHlAoBnvG -zQG3agOG+e7c5z2XT8m2ktORLqG3E4mYmbxgyhDrzP6ei2Anc+pszmnxPoK3Puh5 -aXV+XKt0bU0C1m2+ACmGGJ0t3P408art82nOxBw8ZHgIg9Dtp6xIUCyOqwIDAQAB -AoGBAJFTnFboaKh5eUrIzjmNrKsG44jEyy+vWvHN/FgSC4l103HxhmWiuL5Lv3f7 -0tMp1tX7D6xvHwIG9VWvyKb/Cq9rJsDibmDVIOslnOWeQhG+XwJyitR0pq/KlJIB -5LjORcBw795oKWOAi6RcOb1ON59tysEFYhAGQO9k6VL621gRAkEA/Gb+YXULLpbs -piXN3q4zcHzeaVANo69tUZ6TjaQqMeTxE4tOYM0G0ZoSeHEdaP59AOZGKXXNGSQy -2z/MddcYGQJBAMkjLSYIpOLJY11ja8OwwswFG2hEzHe0cS9bzo++R/jc1bHA5R0Y -i6vA5iPi+wopPFvpytdBol7UuEBe5xZrxWMCQQCWxELRHiP2yWpEeLJ3gGDzoXMN -PydWjhRju7Bx3AzkTtf+D6lawz1+eGTuEss5i0JKBkMEwvwnN2s1ce+EuF4JAkBb -E96h1lAzkVW5OAfYOPY8RCPA90ZO/hoyg7PpSxR0ECuDrgERR8gXIeYUYfejBkEa -rab4CfRoVJKKM28Yq/xZAkBvuq670JRCwOgfUTdww7WpdOQBYPkzQccsKNCslQW8 -/DyW6y06oQusSENUvynT6dr3LJxt/NgZPhZX2+k1eYDV ------END RSA PRIVATE KEY----- ------BEGIN CERTIFICATE----- -MIICGzCCAYSgAwIBAgIJAIq84a2Q/OvlMA0GCSqGSIb3DQEBBQUAMBQxEjAQBgNV -BAMTCWxvY2FsaG9zdDAeFw0xMTA1MjExMDIzMzNaFw03NTAzMjEwMzU1MTdaMBQx -EjAQBgNVBAMTCWxvY2FsaG9zdDCBnzANBgkqhkiG9w0BAQEFAAOBjQAwgYkCgYEA -xk+MUua/da2yyUCtp1A3pwYQRuqhZPm1To7gBgvy0h5QKAZ7xs0Bt2oDhvnu3Oc9 -l0/JtpLTkS6htxOJmJm8YMoQ68z+notgJ3PqbM5p8T6Ctz7oeWl1flyrdG1NAtZt -vgAphhidLdz+NPGq7fNpzsQcPGR4CIPQ7aesSFAsjqsCAwEAAaN1MHMwHQYDVR0O -BBYEFLWaUPO6N7efGiuoS9i3DVYcUwn0MEQGA1UdIwQ9MDuAFLWaUPO6N7efGiuo -S9i3DVYcUwn0oRikFjAUMRIwEAYDVQQDEwlsb2NhbGhvc3SCCQCKvOGtkPzr5TAM -BgNVHRMEBTADAQH/MA0GCSqGSIb3DQEBBQUAA4GBAMK5whPjLNQK1Ivvk88oqJqq -4f889OwikGP0eUhOBhbFlsZs+jq5YZC2UzHz+evzKBlgAP1u4lP/cB85CnjvWqM+ -1c/lywFHQ6HOdDeQ1L72tSYMrNOG4XNmLn0h7rx6GoTU7dcFRfseahBCq8mv0IDt -IRbTpvlHWPjsSvHz0ZOH ------END CERTIFICATE-----""" - def setUp(self): """Set up an HTTP server to receive log messages, and a HTTPHandler pointing to that server's address and port.""" @@ -1690,15 +1660,26 
@@ if secure: try: import ssl - fd, fn = tempfile.mkstemp() - os.close(fd) - with open(fn, 'w') as f: - f.write(self.PEMFILE) - sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) - sslctx.load_cert_chain(fn) - os.unlink(fn) except ImportError: sslctx = None + else: + here = os.path.dirname(__file__) + localhost_cert = os.path.join(here, "keycert.pem") + sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) + sslctx.load_cert_chain(localhost_cert) + # Unfortunately, HTTPHandler doesn't allow us to change the + # SSLContext used by HTTPSConnection, so we have to + # monkeypatch. This can be cleaned up if issue 22788 is + # fixed. + old = ssl._create_default_https_context + def restore_handler(): + ssl._create_default_https_context = old + self.addCleanup(restore_handler) + def hack_create_ctx(): + ctx = old() + ctx.load_verify_locations(localhost_cert) + return ctx + ssl._create_default_https_context = hack_create_ctx else: sslctx = None self.server = server = TestHTTPServer(addr, self.handle_request, diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -2337,9 +2337,10 @@ d1 = f.read() d2 = '' # now fetch the same data from the HTTPS server - url = 'https://%s:%d/%s' % ( - HOST, server.port, os.path.split(CERTFILE)[1]) - f = urllib.request.urlopen(url) + url = 'https://localhost:%d/%s' % ( + server.port, os.path.split(CERTFILE)[1]) + context = ssl.create_default_context(cafile=CERTFILE) + f = urllib.request.urlopen(url, context=context) try: dlen = f.info().get("content-length") if dlen and (int(dlen) > 0): diff --git a/Lib/test/test_urllib2_localnet.py b/Lib/test/test_urllib2_localnet.py --- a/Lib/test/test_urllib2_localnet.py +++ b/Lib/test/test_urllib2_localnet.py @@ -545,7 +545,8 @@ def test_https(self): handler = self.start_https_server() - data = self.urlopen("https://localhost:%s/bizarre" % handler.port) + context = ssl.create_default_context(cafile=CERT_localhost) + data = self.urlopen("https://localhost:%s/bizarre" % handler.port, context=context) self.assertEqual(data, b"we care a bit") def test_https_with_cafile(self): @@ -584,7 +585,8 @@ context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.set_servername_callback(cb_sni) handler = self.start_https_server(context=context, certfile=CERT_localhost) - self.urlopen("https://localhost:%s" % handler.port) + context = ssl.create_default_context(cafile=CERT_localhost) + self.urlopen("https://localhost:%s" % handler.port, context=context) self.assertEqual(sni_name, "localhost") def test_sending_headers(self): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22417: Verify certificates by default in httplib (PEP 476). + - Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 and above. Patch by Tim Graham. 
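As the test changes above suggest, code that talks to a server whose certificate is not in the platform trust store can keep working by trusting that certificate explicitly rather than disabling verification; a hedged sketch, where the certificate path and URL are placeholders and not taken from the patch:

    import ssl
    import urllib.request

    # Trust one specific certificate without turning verification off.
    context = ssl.create_default_context(cafile="/path/to/server.crt")
    resp = urllib.request.urlopen("https://localhost:8443/", context=context)
    print(resp.status)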
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 21:13:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 20:13:36 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMy4yIC0+IDMuMyk6?= =?utf-8?q?_merge_3=2E2?= Message-ID: <20141103201258.35250.40427@psf.io> https://hg.python.org/cpython/rev/b5d92b52d494 changeset: 93372:b5d92b52d494 branch: 3.3 parent: 93137:a34be8915cf6 parent: 93371:c16e047965a2 user: Benjamin Peterson date: Mon Nov 03 15:11:53 2014 -0500 summary: merge 3.2 files: Lib/test/test_socket.py | 7 ++++--- 1 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -1188,9 +1188,10 @@ if e.errno == socket.EAI_NODATA: self.skipTest('internet access required for this test') # these should all be successful - socket.gethostbyname('?????????.python.org') - socket.gethostbyname_ex('?????????.python.org') - socket.getaddrinfo('?????????.python.org',0,socket.AF_UNSPEC,socket.SOCK_STREAM) + domain = '?????????.pythontest.net' + socket.gethostbyname(domain) + socket.gethostbyname_ex(domain) + socket.getaddrinfo(domain,0,socket.AF_UNSPEC,socket.SOCK_STREAM) # this may not work if the forward lookup choses the IPv6 address, as that doesn't # have a reverse entry yet # socket.gethostbyaddr('?????????.python.org') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 21:13:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 20:13:36 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMy4zIC0+IDMuNCk6?= =?utf-8?q?_merge_3=2E3?= Message-ID: <20141103201259.120728.39962@psf.io> https://hg.python.org/cpython/rev/a716afa8e23f changeset: 93373:a716afa8e23f branch: 3.4 parent: 93369:2afe5413d7af parent: 93372:b5d92b52d494 user: Benjamin Peterson date: Mon Nov 03 15:12:06 2014 -0500 summary: merge 3.3 files: Lib/test/test_socket.py | 7 ++++--- 1 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -1291,9 +1291,10 @@ if e.errno == socket.EAI_NODATA: self.skipTest('internet access required for this test') # these should all be successful - socket.gethostbyname('?????????.python.org') - socket.gethostbyname_ex('?????????.python.org') - socket.getaddrinfo('?????????.python.org',0,socket.AF_UNSPEC,socket.SOCK_STREAM) + domain = '?????????.pythontest.net' + socket.gethostbyname(domain) + socket.gethostbyname_ex(domain) + socket.getaddrinfo(domain,0,socket.AF_UNSPEC,socket.SOCK_STREAM) # this may not work if the forward lookup choses the IPv6 address, as that doesn't # have a reverse entry yet # socket.gethostbyaddr('?????????.python.org') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 21:13:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 20:13:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141103201259.35262.1257@psf.io> https://hg.python.org/cpython/rev/bd3e9dcbd9ab changeset: 93374:bd3e9dcbd9ab parent: 93370:731375f83406 parent: 93373:a716afa8e23f user: Benjamin Peterson date: Mon Nov 03 15:12:52 2014 -0500 summary: merge 3.4 files: Lib/test/test_socket.py | 7 ++++--- 1 files changed, 4 insertions(+), 3 deletions(-) diff --git 
a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -1293,9 +1293,10 @@ if e.errno == socket.EAI_NODATA: self.skipTest('internet access required for this test') # these should all be successful - socket.gethostbyname('?????????.python.org') - socket.gethostbyname_ex('?????????.python.org') - socket.getaddrinfo('?????????.python.org',0,socket.AF_UNSPEC,socket.SOCK_STREAM) + domain = '?????????.pythontest.net' + socket.gethostbyname(domain) + socket.gethostbyname_ex(domain) + socket.getaddrinfo(domain,0,socket.AF_UNSPEC,socket.SOCK_STREAM) # this may not work if the forward lookup choses the IPv6 address, as that doesn't # have a reverse entry yet # socket.gethostbyaddr('?????????.python.org') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 21:13:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 20:13:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E2=29=3A_move_idna_test?= =?utf-8?q?_domain_to_pythontest=2Enet?= Message-ID: <20141103201257.101692.78642@psf.io> https://hg.python.org/cpython/rev/c16e047965a2 changeset: 93371:c16e047965a2 branch: 3.2 parent: 92975:eac54f7a8018 user: Benjamin Peterson date: Mon Nov 03 15:10:47 2014 -0500 summary: move idna test domain to pythontest.net files: Lib/test/test_socket.py | 7 ++++--- 1 files changed, 4 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -775,9 +775,10 @@ def test_idna(self): support.requires('network') # these should all be successful - socket.gethostbyname('?????????.python.org') - socket.gethostbyname_ex('?????????.python.org') - socket.getaddrinfo('?????????.python.org',0,socket.AF_UNSPEC,socket.SOCK_STREAM) + domain = '?????????.pythontest.net' + socket.gethostbyname(domain) + socket.gethostbyname_ex(domain) + socket.getaddrinfo(domain,0,socket.AF_UNSPEC,socket.SOCK_STREAM) # this may not work if the forward lookup choses the IPv6 address, as that doesn't # have a reverse entry yet # socket.gethostbyaddr('?????????.python.org') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 3 23:04:09 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 03 Nov 2014 22:04:09 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_context_has_been_backporte?= =?utf-8?q?d_so_fix_versionchanged?= Message-ID: <20141103220404.120724.36937@psf.io> https://hg.python.org/cpython/rev/aeb1f941663f changeset: 93375:aeb1f941663f user: Benjamin Peterson date: Mon Nov 03 17:04:01 2014 -0500 summary: context has been backported so fix versionchanged files: Doc/library/urllib.request.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -110,7 +110,7 @@ .. versionchanged:: 3.3 *cadefault* was added. - .. versionchanged:: 3.5 + .. versionchanged:: 3.4.3 *context* was added. 
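For completeness, the escape hatch described in the whatsnew entry of the PEP 476 change, as a standalone sketch; it deliberately skips verification (via the private helper shown in the whatsnew text), so it is only appropriate when verification genuinely cannot be used, and the host is the one used by the new tests:

    import ssl
    import urllib.request

    # Restore the old, unverified behaviour for a single request.
    context = ssl._create_unverified_context()
    urllib.request.urlopen("https://self-signed.pythontest.net/", context=context)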
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 03:12:17 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 04 Nov 2014 02:12:17 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_test_that_keyf?= =?utf-8?q?ile_can_be_None?= Message-ID: <20141104021216.108377.16235@psf.io> https://hg.python.org/cpython/rev/f9a72b3eca7c changeset: 93378:f9a72b3eca7c branch: 2.7 parent: 93368:515331e0ca0c user: Benjamin Peterson date: Mon Nov 03 21:05:01 2014 -0500 summary: test that keyfile can be None files: Lib/test/test_ssl.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -766,7 +766,7 @@ def test_load_cert_chain(self): ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) # Combined key and cert in a single file - ctx.load_cert_chain(CERTFILE) + ctx.load_cert_chain(CERTFILE, keyfile=None) ctx.load_cert_chain(CERTFILE, keyfile=CERTFILE) self.assertRaises(TypeError, ctx.load_cert_chain, keyfile=CERTFILE) with self.assertRaises(IOError) as cm: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 03:12:17 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 04 Nov 2014 02:12:17 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_test_that_keyf?= =?utf-8?q?ile_can_be_None?= Message-ID: <20141104021216.108085.58940@psf.io> https://hg.python.org/cpython/rev/b9d9e7762783 changeset: 93376:b9d9e7762783 branch: 3.4 parent: 93373:a716afa8e23f user: Benjamin Peterson date: Mon Nov 03 21:05:01 2014 -0500 summary: test that keyfile can be None files: Lib/test/test_ssl.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -727,7 +727,7 @@ def test_load_cert_chain(self): ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) # Combined key and cert in a single file - ctx.load_cert_chain(CERTFILE) + ctx.load_cert_chain(CERTFILE, keyfile=None) ctx.load_cert_chain(CERTFILE, keyfile=CERTFILE) self.assertRaises(TypeError, ctx.load_cert_chain, keyfile=CERTFILE) with self.assertRaises(OSError) as cm: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 03:12:17 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 04 Nov 2014 02:12:17 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141104021216.85190.90487@psf.io> https://hg.python.org/cpython/rev/205810ca5069 changeset: 93377:205810ca5069 parent: 93375:aeb1f941663f parent: 93376:b9d9e7762783 user: Benjamin Peterson date: Mon Nov 03 21:06:07 2014 -0500 summary: merge 3.4 files: Lib/test/test_ssl.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -811,7 +811,7 @@ def test_load_cert_chain(self): ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) # Combined key and cert in a single file - ctx.load_cert_chain(CERTFILE) + ctx.load_cert_chain(CERTFILE, keyfile=None) ctx.load_cert_chain(CERTFILE, keyfile=CERTFILE) self.assertRaises(TypeError, ctx.load_cert_chain, keyfile=CERTFILE) with self.assertRaises(OSError) as cm: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 03:12:17 2014 From: python-checkins at python.org 
(benjamin.peterson) Date: Tue, 04 Nov 2014 02:12:17 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_allow_keyfile_?= =?utf-8?q?argument_to_be_None_=28closes_=2322787=29?= Message-ID: <20141104021217.108365.12999@psf.io> https://hg.python.org/cpython/rev/e54d0b197c82 changeset: 93379:e54d0b197c82 branch: 2.7 user: Benjamin Peterson date: Mon Nov 03 21:12:05 2014 -0500 summary: allow keyfile argument to be None (closes #22787) files: Misc/NEWS | 3 +++ Modules/_ssl.c | 30 +++++++++++++++++++++++------- 2 files changed, 26 insertions(+), 7 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #22787: Allow the keyfile argument of SSLContext.load_cert_chain to be + None. + - Issue #22775: Fixed unpickling of Cookie.SimpleCookie with protocol 2. Patch by Tim Graham. diff --git a/Modules/_ssl.c b/Modules/_ssl.c --- a/Modules/_ssl.c +++ b/Modules/_ssl.c @@ -2447,8 +2447,8 @@ load_cert_chain(PySSLContext *self, PyObject *args, PyObject *kwds) { char *kwlist[] = {"certfile", "keyfile", "password", NULL}; - PyObject *password = NULL; - char *certfile_bytes = NULL, *keyfile_bytes = NULL; + PyObject *keyfile = NULL, *keyfile_bytes = NULL, *password = NULL; + char *certfile_bytes = NULL; pem_password_cb *orig_passwd_cb = self->ctx->default_passwd_callback; void *orig_passwd_userdata = self->ctx->default_passwd_callback_userdata; _PySSLPasswordInfo pw_info = { NULL, NULL, NULL, 0, 0 }; @@ -2457,11 +2457,27 @@ errno = 0; ERR_clear_error(); if (!PyArg_ParseTupleAndKeywords(args, kwds, - "et|etO:load_cert_chain", kwlist, + "et|OO:load_cert_chain", kwlist, Py_FileSystemDefaultEncoding, &certfile_bytes, - Py_FileSystemDefaultEncoding, &keyfile_bytes, - &password)) + &keyfile, &password)) return NULL; + + if (keyfile && keyfile != Py_None) { + if (PyString_Check(keyfile)) { + Py_INCREF(keyfile); + keyfile_bytes = keyfile; + } else { + PyObject *u = PyUnicode_FromObject(keyfile); + if (!u) + goto error; + keyfile_bytes = PyUnicode_AsEncodedString( + u, Py_FileSystemDefaultEncoding, NULL); + Py_DECREF(u); + if (!keyfile_bytes) + goto error; + } + } + if (password && password != Py_None) { if (PyCallable_Check(password)) { pw_info.callable = password; @@ -2491,7 +2507,7 @@ } PySSL_BEGIN_ALLOW_THREADS_S(pw_info.thread_state); r = SSL_CTX_use_PrivateKey_file(self->ctx, - keyfile_bytes ? keyfile_bytes : certfile_bytes, + keyfile_bytes ? 
PyBytes_AS_STRING(keyfile_bytes) : certfile_bytes, SSL_FILETYPE_PEM); PySSL_END_ALLOW_THREADS_S(pw_info.thread_state); if (r != 1) { @@ -2523,8 +2539,8 @@ error: SSL_CTX_set_default_passwd_cb(self->ctx, orig_passwd_cb); SSL_CTX_set_default_passwd_cb_userdata(self->ctx, orig_passwd_userdata); + Py_XDECREF(keyfile_bytes); PyMem_Free(pw_info.password); - PyMem_Free(keyfile_bytes); PyMem_Free(certfile_bytes); return NULL; } -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Tue Nov 4 09:37:53 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Tue, 04 Nov 2014 09:37:53 +0100 Subject: [Python-checkins] Daily reference leaks (205810ca5069): sum=3 Message-ID: results for 205810ca5069 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog0pEFkg', '-x'] From python-checkins at python.org Tue Nov 4 14:53:32 2014 From: python-checkins at python.org (antoine.pitrou) Date: Tue, 04 Nov 2014 13:53:32 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322773=3A_fix_failing_test_with_old_readline_ver?= =?utf-8?q?sions_due_to_issue_=2319884=2E?= Message-ID: <20141104135308.703.68639@psf.io> https://hg.python.org/cpython/rev/be374b8c40c8 changeset: 93381:be374b8c40c8 parent: 93377:205810ca5069 parent: 93380:c4b5a5d44254 user: Antoine Pitrou date: Tue Nov 04 14:53:01 2014 +0100 summary: Issue #22773: fix failing test with old readline versions due to issue #19884. files: Lib/test/test_readline.py | 4 ++++ Modules/readline.c | 4 ++++ 2 files changed, 8 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -44,6 +44,10 @@ class TestReadline(unittest.TestCase): + + @unittest.skipIf(readline._READLINE_VERSION < 0x0600 + and "libedit" not in readline.__doc__, + "not supported in this library version") def test_init(self): # Issue #19884: Ensure that the ANSI sequence "\033[1034h" is not # written into stdout when the readline module is imported and stdout diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -1285,5 +1285,9 @@ mod_state = (readlinestate *) PyModule_GetState(m); PyOS_ReadlineFunctionPointer = call_readline; setup_readline(mod_state); + + PyModule_AddIntConstant(m, "_READLINE_VERSION", RL_READLINE_VERSION); + PyModule_AddIntConstant(m, "_READLINE_RUNTIME_VERSION", rl_readline_version); + return m; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 14:53:32 2014 From: python-checkins at python.org (antoine.pitrou) Date: Tue, 04 Nov 2014 13:53:32 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNzcz?= =?utf-8?q?=3A_fix_failing_test_with_old_readline_versions_due_to_issue_?= =?utf-8?q?=2319884=2E?= Message-ID: <20141104135308.85190.63752@psf.io> https://hg.python.org/cpython/rev/c4b5a5d44254 changeset: 93380:c4b5a5d44254 branch: 3.4 parent: 93376:b9d9e7762783 user: Antoine Pitrou date: Tue Nov 04 14:52:10 2014 +0100 summary: Issue #22773: fix failing test with old readline versions due to issue #19884. 
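The fix works by exporting the readline version numbers to Python so the test can skip itself on old libraries. A small sketch of how the new (private, underscore-prefixed) constants read, assuming the usual 0xMMmm packing used by readline (e.g. 0x0600 for version 6.0):

    import readline

    compiled = readline._READLINE_VERSION           # version built against
    runtime = readline._READLINE_RUNTIME_VERSION    # version loaded at run time
    print(hex(compiled), hex(runtime))
    print("libedit" in readline.__doc__)            # True under the libedit shim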
files: Lib/test/test_readline.py | 4 ++++ Modules/readline.c | 4 ++++ 2 files changed, 8 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -44,6 +44,10 @@ class TestReadline(unittest.TestCase): + + @unittest.skipIf(readline._READLINE_VERSION < 0x0600 + and "libedit" not in readline.__doc__, + "not supported in this library version") def test_init(self): # Issue #19884: Ensure that the ANSI sequence "\033[1034h" is not # written into stdout when the readline module is imported and stdout diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -1285,5 +1285,9 @@ mod_state = (readlinestate *) PyModule_GetState(m); PyOS_ReadlineFunctionPointer = call_readline; setup_readline(mod_state); + + PyModule_AddIntConstant(m, "_READLINE_VERSION", RL_READLINE_VERSION); + PyModule_AddIntConstant(m, "_READLINE_RUNTIME_VERSION", rl_readline_version); + return m; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 14:55:00 2014 From: python-checkins at python.org (antoine.pitrou) Date: Tue, 04 Nov 2014 13:55:00 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNzcz?= =?utf-8?q?=3A_fix_failing_test_with_old_readline_versions_due_to_issue_?= =?utf-8?q?=2319884=2E?= Message-ID: <20141104135456.108393.94114@psf.io> https://hg.python.org/cpython/rev/eba6e68e818c changeset: 93382:eba6e68e818c branch: 2.7 parent: 93379:e54d0b197c82 user: Antoine Pitrou date: Tue Nov 04 14:52:10 2014 +0100 summary: Issue #22773: fix failing test with old readline versions due to issue #19884. files: Lib/test/test_readline.py | 4 ++++ Modules/readline.c | 3 +++ 2 files changed, 7 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -43,6 +43,10 @@ class TestReadline(unittest.TestCase): + + @unittest.skipIf(readline._READLINE_VERSION < 0x0600 + and "libedit" not in readline.__doc__, + "not supported in this library version") def test_init(self): # Issue #19884: Ensure that the ANSI sequence "\033[1034h" is not # written into stdout when the readline module is imported and stdout diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -1184,4 +1184,7 @@ PyOS_ReadlineFunctionPointer = call_readline; setup_readline(); + + PyModule_AddIntConstant(m, "_READLINE_VERSION", RL_READLINE_VERSION); + PyModule_AddIntConstant(m, "_READLINE_RUNTIME_VERSION", rl_readline_version); } -- Repository URL: https://hg.python.org/cpython From benjamin at python.org Tue Nov 4 14:58:29 2014 From: benjamin at python.org (Benjamin Peterson) Date: Tue, 04 Nov 2014 09:58:29 -0400 Subject: [Python-checkins] cpython (2.7): Issue #22773: fix failing test with old readline versions due to issue #19884. In-Reply-To: <20141104135456.108393.94114@psf.io> References: <20141104135456.108393.94114@psf.io> Message-ID: <1415109509.2950700.186901193.57C2BE56@webmail.messagingengine.com> On Tue, Nov 4, 2014, at 09:55, antoine.pitrou wrote: > https://hg.python.org/cpython/rev/eba6e68e818c > changeset: 93382:eba6e68e818c > branch: 2.7 > parent: 93379:e54d0b197c82 > user: Antoine Pitrou > date: Tue Nov 04 14:52:10 2014 +0100 > summary: > Issue #22773: fix failing test with old readline versions due to issue > #19884. 
> > files: > Lib/test/test_readline.py | 4 ++++ > Modules/readline.c | 3 +++ > 2 files changed, 7 insertions(+), 0 deletions(-) > > > diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py > --- a/Lib/test/test_readline.py > +++ b/Lib/test/test_readline.py > @@ -43,6 +43,10 @@ > > > class TestReadline(unittest.TestCase): > + > + @unittest.skipIf(readline._READLINE_VERSION < 0x0600 Shouldn't this use the runtime version? From python-checkins at python.org Tue Nov 4 15:09:42 2014 From: python-checkins at python.org (robert.collins) Date: Tue, 04 Nov 2014 14:09:42 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Close_=2322457=3A_Honour_l?= =?utf-8?q?oad=5Ftests_in_the_start=5Fdir_of_discovery=2E?= Message-ID: <20141104140917.719.34141@psf.io> https://hg.python.org/cpython/rev/ce0dd5e4b801 changeset: 93383:ce0dd5e4b801 parent: 93381:be374b8c40c8 user: Robert Collins date: Wed Nov 05 03:09:01 2014 +1300 summary: Close #22457: Honour load_tests in the start_dir of discovery. We were not honouring load_tests in a package/__init__.py when that was the start_dir parameter, though we do when it is a child package. The fix required a little care since it introduces the possibility of infinite recursion. files: Doc/library/unittest.rst | 6 +- Lib/unittest/__init__.py | 9 + Lib/unittest/loader.py | 160 ++++++++++----- Lib/unittest/test/test_discovery.py | 45 ++++ Lib/unittest/test/test_loader.py | 2 +- Misc/NEWS | 2 + 6 files changed, 166 insertions(+), 58 deletions(-) diff --git a/Doc/library/unittest.rst b/Doc/library/unittest.rst --- a/Doc/library/unittest.rst +++ b/Doc/library/unittest.rst @@ -1668,7 +1668,11 @@ If a package (a directory containing a file named :file:`__init__.py`) is found, the package will be checked for a ``load_tests`` function. If this - exists then it will be called with *loader*, *tests*, *pattern*. + exists then it will be called + ``package.load_tests(loader, tests, pattern)``. Test discovery takes care + to ensure that a package is only checked for tests once during an + invocation, even if the load_tests function itself calls + ``loader.discover``. If ``load_tests`` exists then discovery does *not* recurse into the package, ``load_tests`` is responsible for loading all tests in the diff --git a/Lib/unittest/__init__.py b/Lib/unittest/__init__.py --- a/Lib/unittest/__init__.py +++ b/Lib/unittest/__init__.py @@ -67,3 +67,12 @@ # deprecated _TextTestResult = TextTestResult + +# There are no tests here, so don't try to run anything discovered from +# introspecting the symbols (e.g. FunctionTestCase). Instead, all our +# tests come from within unittest.test. +def load_tests(loader, tests, pattern): + import os.path + # top level directory cached on loader instance + this_dir = os.path.dirname(__file__) + return loader.discover(start_dir=this_dir, pattern=pattern) diff --git a/Lib/unittest/loader.py b/Lib/unittest/loader.py --- a/Lib/unittest/loader.py +++ b/Lib/unittest/loader.py @@ -65,6 +65,9 @@ def __init__(self): super(TestLoader, self).__init__() self.errors = [] + # Tracks packages which we have called into via load_tests, to + # avoid infinite re-entrancy. + self._loading_packages = set() def loadTestsFromTestCase(self, testCaseClass): """Return a suite of all tests cases contained in testCaseClass""" @@ -229,9 +232,13 @@ If a test package name (directory with '__init__.py') matches the pattern then the package will be checked for a 'load_tests' function. If - this exists then it will be called with loader, tests, pattern. 
+ this exists then it will be called with (loader, tests, pattern) unless + the package has already had load_tests called from the same discovery + invocation, in which case the package module object is not scanned for + tests - this ensures that when a package uses discover to further + discover child tests that infinite recursion does not happen. - If load_tests exists then discovery does *not* recurse into the package, + If load_tests exists then discovery does *not* recurse into the package, load_tests is responsible for loading all tests in the package. The pattern is deliberately not stored as a loader attribute so that @@ -355,69 +362,110 @@ def _find_tests(self, start_dir, pattern, namespace=False): """Used by discovery. Yields test suites it loads.""" + # Handle the __init__ in this package + name = self._get_name_from_path(start_dir) + # name is '.' when start_dir == top_level_dir (and top_level_dir is by + # definition not a package). + if name != '.' and name not in self._loading_packages: + # name is in self._loading_packages while we have called into + # loadTestsFromModule with name. + tests, should_recurse = self._find_test_path( + start_dir, pattern, namespace) + if tests is not None: + yield tests + if not should_recurse: + # Either an error occured, or load_tests was used by the + # package. + return + # Handle the contents. paths = sorted(os.listdir(start_dir)) - for path in paths: full_path = os.path.join(start_dir, path) - if os.path.isfile(full_path): - if not VALID_MODULE_NAME.match(path): - # valid Python identifiers only - continue - if not self._match_path(path, full_path, pattern): - continue - # if the test file matches, load it + tests, should_recurse = self._find_test_path( + full_path, pattern, namespace) + if tests is not None: + yield tests + if should_recurse: + # we found a package that didn't use load_tests. name = self._get_name_from_path(full_path) + self._loading_packages.add(name) try: - module = self._get_module_from_name(name) - except case.SkipTest as e: - yield _make_skipped_test(name, e, self.suiteClass) - except: - error_case, error_message = \ - _make_failed_import_test(name, self.suiteClass) - self.errors.append(error_message) - yield error_case - else: - mod_file = os.path.abspath(getattr(module, '__file__', full_path)) - realpath = _jython_aware_splitext(os.path.realpath(mod_file)) - fullpath_noext = _jython_aware_splitext(os.path.realpath(full_path)) - if realpath.lower() != fullpath_noext.lower(): - module_dir = os.path.dirname(realpath) - mod_name = _jython_aware_splitext(os.path.basename(full_path)) - expected_dir = os.path.dirname(full_path) - msg = ("%r module incorrectly imported from %r. Expected %r. " - "Is this module globally installed?") - raise ImportError(msg % (mod_name, module_dir, expected_dir)) - yield self.loadTestsFromModule(module, pattern=pattern) - elif os.path.isdir(full_path): - if (not namespace and - not os.path.isfile(os.path.join(full_path, '__init__.py'))): - continue + yield from self._find_tests(full_path, pattern, namespace) + finally: + self._loading_packages.discard(name) - load_tests = None - tests = None - name = self._get_name_from_path(full_path) + def _find_test_path(self, full_path, pattern, namespace=False): + """Used by discovery. + + Loads tests from a single file, or a directories' __init__.py when + passed the directory. + + Returns a tuple (None_or_tests_from_file, should_recurse). 
+ """ + basename = os.path.basename(full_path) + if os.path.isfile(full_path): + if not VALID_MODULE_NAME.match(basename): + # valid Python identifiers only + return None, False + if not self._match_path(basename, full_path, pattern): + return None, False + # if the test file matches, load it + name = self._get_name_from_path(full_path) + try: + module = self._get_module_from_name(name) + except case.SkipTest as e: + return _make_skipped_test(name, e, self.suiteClass), False + except: + error_case, error_message = \ + _make_failed_import_test(name, self.suiteClass) + self.errors.append(error_message) + return error_case, False + else: + mod_file = os.path.abspath( + getattr(module, '__file__', full_path)) + realpath = _jython_aware_splitext( + os.path.realpath(mod_file)) + fullpath_noext = _jython_aware_splitext( + os.path.realpath(full_path)) + if realpath.lower() != fullpath_noext.lower(): + module_dir = os.path.dirname(realpath) + mod_name = _jython_aware_splitext( + os.path.basename(full_path)) + expected_dir = os.path.dirname(full_path) + msg = ("%r module incorrectly imported from %r. Expected " + "%r. Is this module globally installed?") + raise ImportError( + msg % (mod_name, module_dir, expected_dir)) + return self.loadTestsFromModule(module, pattern=pattern), False + elif os.path.isdir(full_path): + if (not namespace and + not os.path.isfile(os.path.join(full_path, '__init__.py'))): + return None, False + + load_tests = None + tests = None + name = self._get_name_from_path(full_path) + try: + package = self._get_module_from_name(name) + except case.SkipTest as e: + return _make_skipped_test(name, e, self.suiteClass), False + except: + error_case, error_message = \ + _make_failed_import_test(name, self.suiteClass) + self.errors.append(error_message) + return error_case, False + else: + load_tests = getattr(package, 'load_tests', None) + # Mark this package as being in load_tests (possibly ;)) + self._loading_packages.add(name) try: - package = self._get_module_from_name(name) - except case.SkipTest as e: - yield _make_skipped_test(name, e, self.suiteClass) - except: - error_case, error_message = \ - _make_failed_import_test(name, self.suiteClass) - self.errors.append(error_message) - yield error_case - else: - load_tests = getattr(package, 'load_tests', None) tests = self.loadTestsFromModule(package, pattern=pattern) - if tests is not None: - # tests loaded from package file - yield tests - if load_tests is not None: - # loadTestsFromModule(package) has load_tests for us. - continue - # recurse into the package - yield from self._find_tests(full_path, pattern, - namespace=namespace) + # loadTestsFromModule(package) has loaded tests for us. + return tests, False + return tests, True + finally: + self._loading_packages.discard(name) defaultTestLoader = TestLoader() diff --git a/Lib/unittest/test/test_discovery.py b/Lib/unittest/test/test_discovery.py --- a/Lib/unittest/test/test_discovery.py +++ b/Lib/unittest/test/test_discovery.py @@ -368,6 +368,51 @@ self.assertEqual(_find_tests_args, [(start_dir, 'pattern')]) self.assertIn(top_level_dir, sys.path) + def test_discover_start_dir_is_package_calls_package_load_tests(self): + # This test verifies that the package load_tests in a package is indeed + # invoked when the start_dir is a package (and not the top level). + # http://bugs.python.org/issue22457 + + # Test data: we expect the following: + # an isfile to verify the package, then importing and scanning + # as per _find_tests' normal behaviour. 
+ # We expect to see our load_tests hook called once. + vfs = {abspath('/toplevel'): ['startdir'], + abspath('/toplevel/startdir'): ['__init__.py']} + def list_dir(path): + return list(vfs[path]) + self.addCleanup(setattr, os, 'listdir', os.listdir) + os.listdir = list_dir + self.addCleanup(setattr, os.path, 'isfile', os.path.isfile) + os.path.isfile = lambda path: path.endswith('.py') + self.addCleanup(setattr, os.path, 'isdir', os.path.isdir) + os.path.isdir = lambda path: not path.endswith('.py') + self.addCleanup(sys.path.remove, abspath('/toplevel')) + + class Module(object): + paths = [] + load_tests_args = [] + + def __init__(self, path): + self.path = path + + def load_tests(self, loader, tests, pattern): + return ['load_tests called ' + self.path] + + def __eq__(self, other): + return self.path == other.path + + loader = unittest.TestLoader() + loader._get_module_from_name = lambda name: Module(name) + loader.suiteClass = lambda thing: thing + + suite = loader.discover('/toplevel/startdir', top_level_dir='/toplevel') + + # We should have loaded tests from the package __init__. + # (normally this would be nested TestSuites.) + self.assertEqual(suite, + [['load_tests called startdir']]) + def setup_import_issue_tests(self, fakefile): listdir = os.listdir os.listdir = lambda _: [fakefile] diff --git a/Lib/unittest/test/test_loader.py b/Lib/unittest/test/test_loader.py --- a/Lib/unittest/test/test_loader.py +++ b/Lib/unittest/test/test_loader.py @@ -841,7 +841,7 @@ loader = unittest.TestLoader() suite = loader.loadTestsFromNames( - ['unittest.loader.sdasfasfasdf', 'unittest']) + ['unittest.loader.sdasfasfasdf', 'unittest.test.dummy']) error, test = self.check_deferred_error(loader, list(suite)[0]) expected = "module 'unittest.loader' has no attribute 'sdasfasfasdf'" self.assertIn( diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -212,6 +212,8 @@ - Issue #22217: Implemented reprs of classes in the zipfile module. +- Issue #22457: Honour load_tests in the start_dir of discovery. + - Issue #18216: gettext now raises an error when a .mo file has an unsupported major version number. Patch by Aaron Hill. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 4 15:44:12 2014 From: python-checkins at python.org (robert.collins) Date: Tue, 04 Nov 2014 14:44:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Fix_regression_in_issue_22?= =?utf-8?q?457_fix=2E?= Message-ID: <20141104144402.727.47162@psf.io> https://hg.python.org/cpython/rev/2aac2d76035e changeset: 93384:2aac2d76035e user: Robert Collins date: Wed Nov 05 03:43:36 2014 +1300 summary: Fix regression in issue 22457 fix. When used in the real world it can under some situations trigger " assert not _relpath.startswith('..'), "Path must be within the project" AssertionError: Path must be within the project " Because _get_name_from_path was not expecting to be called with the top level directory. files: Lib/unittest/loader.py | 2 ++ 1 files changed, 2 insertions(+), 0 deletions(-) diff --git a/Lib/unittest/loader.py b/Lib/unittest/loader.py --- a/Lib/unittest/loader.py +++ b/Lib/unittest/loader.py @@ -343,6 +343,8 @@ return os.path.dirname(full_path) def _get_name_from_path(self, path): + if path == self._top_level_dir: + return '.' 
path = _jython_aware_splitext(os.path.normpath(path)) _relpath = os.path.relpath(path, self._top_level_dir) -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Wed Nov 5 09:37:34 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Wed, 05 Nov 2014 09:37:34 +0100 Subject: [Python-checkins] Daily reference leaks (2aac2d76035e): sum=58 Message-ID: results for 2aac2d76035e on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 test_multiprocessing_fork leaked [38, 0, 0] references, sum=38 test_multiprocessing_fork leaked [17, 0, 0] memory blocks, sum=17 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogP2dcoq', '-x'] From python-checkins at python.org Wed Nov 5 15:12:13 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 14:12:13 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2320597=3A_Remove_u?= =?utf-8?q?nused_definition_of_PATH=5FMAX_on_Windows=2C_MAXPATHLEN_is?= Message-ID: <20141105141204.108095.73110@psf.io> https://hg.python.org/cpython/rev/6aaa0aab1e93 changeset: 93386:6aaa0aab1e93 parent: 93384:2aac2d76035e user: Victor Stinner date: Wed Nov 05 15:11:34 2014 +0100 summary: Issue #20597: Remove unused definition of PATH_MAX on Windows, MAXPATHLEN is now preferred. Patch written by Jeffrey Armstrong. files: Modules/main.c | 1 - Python/pythonrun.c | 1 - 2 files changed, 0 insertions(+), 2 deletions(-) diff --git a/Modules/main.c b/Modules/main.c --- a/Modules/main.c +++ b/Modules/main.c @@ -9,7 +9,6 @@ #include #ifdef HAVE_FCNTL_H #include -#define PATH_MAX MAXPATHLEN #endif #endif diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -32,7 +32,6 @@ #ifdef MS_WINDOWS #undef BYTE #include "windows.h" -#define PATH_MAX MAXPATHLEN #endif #ifdef __gnu_hurd__ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 15:12:13 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 14:12:13 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE5NzUz?= =?utf-8?q?=3A_Fix_test=5Fgdb_on_SystemZ_buildbot=2C_ignore_warnings?= Message-ID: <20141105140725.108073.96591@psf.io> https://hg.python.org/cpython/rev/4c260cf1ba39 changeset: 93385:4c260cf1ba39 branch: 2.7 parent: 93382:eba6e68e818c user: Victor Stinner date: Wed Nov 05 15:07:18 2014 +0100 summary: Issue #19753: Fix test_gdb on SystemZ buildbot, ignore warnings files: Lib/test/test_gdb.py | 4 ++++ 1 files changed, 4 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_gdb.py b/Lib/test/test_gdb.py --- a/Lib/test/test_gdb.py +++ b/Lib/test/test_gdb.py @@ -163,6 +163,10 @@ 'linux-gate.so', 'Do you need "set solib-search-path" or ' '"set sysroot"?', + 'warning: Source file is more recent than executable.', + # Issue #19753: missing symbols on System Z + 'Missing separate debuginfo for ', + 'Try: zypper install -C ', ) for line in errlines: if not line.startswith(ignore_patterns): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 15:15:35 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 14:15:35 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2320597=2C_=2321274?= =?utf-8?q?=3A_Remove_unused_definition_of_PATH=5FMAX_on_GNU/Hurd=2C?= Message-ID: <20141105141451.108395.76675@psf.io> 
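The two unittest changesets above make discovery honour a load_tests hook when the start directory is itself a package (issue 22457) and fix the top-level-dir regression that followed. A minimal sketch of such a hook, assuming a hypothetical package named mypkg used as the discovery start_dir:

    # mypkg/__init__.py
    import os.path

    def load_tests(loader, standard_tests, pattern):
        # Discovery now calls this with (loader, tests, pattern) even when
        # mypkg itself is the start_dir.  Returning a suite makes the package
        # responsible for its own tests; the loader's _loading_packages
        # bookkeeping above keeps the nested discover() call from recursing
        # forever.
        this_dir = os.path.dirname(__file__)
        package_tests = loader.discover(start_dir=this_dir,
                                        pattern=pattern or 'test*.py')
        standard_tests.addTests(package_tests)
        return standard_tests

With the fix applied, an invocation such as "python -m unittest discover -s mypkg -t ." runs the hook instead of silently bypassing it.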
https://hg.python.org/cpython/rev/d6fb87972dee changeset: 93387:d6fb87972dee user: Victor Stinner date: Wed Nov 05 15:13:51 2014 +0100 summary: Issue #20597, #21274: Remove unused definition of PATH_MAX on GNU/Hurd, MAXPATHLEN is now preferred. files: Python/pythonrun.c | 4 ---- 1 files changed, 0 insertions(+), 4 deletions(-) diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -34,10 +34,6 @@ #include "windows.h" #endif -#ifdef __gnu_hurd__ -#define PATH_MAX MAXPATHLEN -#endif - _Py_IDENTIFIER(builtins); _Py_IDENTIFIER(excepthook); _Py_IDENTIFIER(flush); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 15:31:30 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 14:31:30 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbzogTW92?= =?utf-8?q?e_loop_attribute_to_=5FFlowControlMixin?= Message-ID: <20141105143124.113470.80565@psf.io> https://hg.python.org/cpython/rev/d05ba48cfc29 changeset: 93388:d05ba48cfc29 branch: 3.4 parent: 93380:c4b5a5d44254 user: Victor Stinner date: Wed Nov 05 15:27:41 2014 +0100 summary: asyncio: Move loop attribute to _FlowControlMixin Move the _loop attribute from the constructor of _SelectorTransport, _ProactorBasePipeTransport and _UnixWritePipeTransport classes to the constructor of the _FlowControlMixin class. Add also an assertion to explicit that the parent class must ensure that the loop is defined (not None) files: Lib/asyncio/proactor_events.py | 3 +-- Lib/asyncio/selector_events.py | 3 +-- Lib/asyncio/transports.py | 4 +++- Lib/asyncio/unix_events.py | 3 +-- Lib/test/test_asyncio/test_transports.py | 3 ++- 5 files changed, 8 insertions(+), 8 deletions(-) diff --git a/Lib/asyncio/proactor_events.py b/Lib/asyncio/proactor_events.py --- a/Lib/asyncio/proactor_events.py +++ b/Lib/asyncio/proactor_events.py @@ -21,9 +21,8 @@ def __init__(self, loop, sock, protocol, waiter=None, extra=None, server=None): - super().__init__(extra) + super().__init__(extra, loop) self._set_extra(sock) - self._loop = loop self._sock = sock self._protocol = protocol self._server = server diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -447,7 +447,7 @@ _buffer_factory = bytearray # Constructs initial value for self._buffer. def __init__(self, loop, sock, protocol, extra, server=None): - super().__init__(extra) + super().__init__(extra, loop) self._extra['socket'] = sock self._extra['sockname'] = sock.getsockname() if 'peername' not in self._extra: @@ -455,7 +455,6 @@ self._extra['peername'] = sock.getpeername() except socket.error: self._extra['peername'] = None - self._loop = loop self._sock = sock self._sock_fd = sock.fileno() self._protocol = protocol diff --git a/Lib/asyncio/transports.py b/Lib/asyncio/transports.py --- a/Lib/asyncio/transports.py +++ b/Lib/asyncio/transports.py @@ -238,8 +238,10 @@ resume_writing() may be called. 
""" - def __init__(self, extra=None): + def __init__(self, extra=None, loop=None): super().__init__(extra) + assert loop is not None + self._loop = loop self._protocol_paused = False self._set_write_buffer_limits() diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -369,9 +369,8 @@ transports.WriteTransport): def __init__(self, loop, pipe, protocol, waiter=None, extra=None): - super().__init__(extra) + super().__init__(extra, loop) self._extra['pipe'] = pipe - self._loop = loop self._pipe = pipe self._fileno = pipe.fileno() mode = os.fstat(self._fileno).st_mode diff --git a/Lib/test/test_asyncio/test_transports.py b/Lib/test/test_asyncio/test_transports.py --- a/Lib/test/test_asyncio/test_transports.py +++ b/Lib/test/test_asyncio/test_transports.py @@ -69,7 +69,8 @@ def get_write_buffer_size(self): return 512 - transport = MyTransport() + loop = mock.Mock() + transport = MyTransport(loop=loop) transport._protocol = mock.Mock() self.assertFalse(transport._protocol_paused) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 15:31:30 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 14:31:30 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_asyncio=3A_Move_loop_attribute_to_=5FF?= =?utf-8?q?lowControlMixin?= Message-ID: <20141105143125.108099.70234@psf.io> https://hg.python.org/cpython/rev/b9ee2082256d changeset: 93389:b9ee2082256d parent: 93387:d6fb87972dee parent: 93388:d05ba48cfc29 user: Victor Stinner date: Wed Nov 05 15:27:54 2014 +0100 summary: (Merge 3.4) asyncio: Move loop attribute to _FlowControlMixin Move the _loop attribute from the constructor of _SelectorTransport, _ProactorBasePipeTransport and _UnixWritePipeTransport classes to the constructor of the _FlowControlMixin class. Add also an assertion to explicit that the parent class must ensure that the loop is defined (not None) files: Lib/asyncio/proactor_events.py | 3 +-- Lib/asyncio/selector_events.py | 3 +-- Lib/asyncio/transports.py | 4 +++- Lib/asyncio/unix_events.py | 3 +-- Lib/test/test_asyncio/test_transports.py | 3 ++- 5 files changed, 8 insertions(+), 8 deletions(-) diff --git a/Lib/asyncio/proactor_events.py b/Lib/asyncio/proactor_events.py --- a/Lib/asyncio/proactor_events.py +++ b/Lib/asyncio/proactor_events.py @@ -21,9 +21,8 @@ def __init__(self, loop, sock, protocol, waiter=None, extra=None, server=None): - super().__init__(extra) + super().__init__(extra, loop) self._set_extra(sock) - self._loop = loop self._sock = sock self._protocol = protocol self._server = server diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -447,7 +447,7 @@ _buffer_factory = bytearray # Constructs initial value for self._buffer. 
def __init__(self, loop, sock, protocol, extra, server=None): - super().__init__(extra) + super().__init__(extra, loop) self._extra['socket'] = sock self._extra['sockname'] = sock.getsockname() if 'peername' not in self._extra: @@ -455,7 +455,6 @@ self._extra['peername'] = sock.getpeername() except socket.error: self._extra['peername'] = None - self._loop = loop self._sock = sock self._sock_fd = sock.fileno() self._protocol = protocol diff --git a/Lib/asyncio/transports.py b/Lib/asyncio/transports.py --- a/Lib/asyncio/transports.py +++ b/Lib/asyncio/transports.py @@ -238,8 +238,10 @@ resume_writing() may be called. """ - def __init__(self, extra=None): + def __init__(self, extra=None, loop=None): super().__init__(extra) + assert loop is not None + self._loop = loop self._protocol_paused = False self._set_write_buffer_limits() diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -369,9 +369,8 @@ transports.WriteTransport): def __init__(self, loop, pipe, protocol, waiter=None, extra=None): - super().__init__(extra) + super().__init__(extra, loop) self._extra['pipe'] = pipe - self._loop = loop self._pipe = pipe self._fileno = pipe.fileno() mode = os.fstat(self._fileno).st_mode diff --git a/Lib/test/test_asyncio/test_transports.py b/Lib/test/test_asyncio/test_transports.py --- a/Lib/test/test_asyncio/test_transports.py +++ b/Lib/test/test_asyncio/test_transports.py @@ -69,7 +69,8 @@ def get_write_buffer_size(self): return 512 - transport = MyTransport() + loop = mock.Mock() + transport = MyTransport(loop=loop) transport._protocol = mock.Mock() self.assertFalse(transport._protocol_paused) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 16:19:40 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 15:19:40 +0000 Subject: [Python-checkins] =?utf-8?q?pythontestdotnet=3A_add_self-signed_c?= =?utf-8?q?ert_and_key?= Message-ID: <20141105151933.108373.56056@psf.io> https://hg.python.org/pythontestdotnet/rev/075864c8191e changeset: 0:075864c8191e user: Benjamin Peterson date: Wed Nov 05 10:19:31 2014 -0500 summary: add self-signed cert and key files: tls/self-signed-cert.pem | 16 ++++++++++++++++ tls/self-signed-key.pem | 16 ++++++++++++++++ 2 files changed, 32 insertions(+), 0 deletions(-) diff --git a/tls/self-signed-cert.pem b/tls/self-signed-cert.pem new file mode 100644 --- /dev/null +++ b/tls/self-signed-cert.pem @@ -0,0 +1,16 @@ +-----BEGIN CERTIFICATE----- +MIIChzCCAfCgAwIBAgIJAKGU95wKR8pSMA0GCSqGSIb3DQEBBQUAMHAxCzAJBgNV +BAYTAlhZMRcwFQYDVQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9u +IFNvZnR3YXJlIEZvdW5kYXRpb24xIzAhBgNVBAMMGnNlbGYtc2lnbmVkLnB5dGhv +bnRlc3QubmV0MB4XDTE0MTEwMjE4MDkyOVoXDTI0MTAzMDE4MDkyOVowcDELMAkG +A1UEBhMCWFkxFzAVBgNVBAcMDkNhc3RsZSBBbnRocmF4MSMwIQYDVQQKDBpQeXRo +b24gU29mdHdhcmUgRm91bmRhdGlvbjEjMCEGA1UEAwwac2VsZi1zaWduZWQucHl0 +aG9udGVzdC5uZXQwgZ8wDQYJKoZIhvcNAQEBBQADgY0AMIGJAoGBANDXQXW9tjyZ +Xt0Iv2tLL1+jinr4wGg36ioLDLFkMf+2Y1GL0v0BnKYG4N1OKlAU15LXGeGer8vm +Sv/yIvmdrELvhAbbo3w4a9TMYQA4XkIVLdvu3mvNOAet+8PMJxn26dbDhG809ALv +EHY57lQsBS3G59RZyBPVqAqmImWNJnVzAgMBAAGjKTAnMCUGA1UdEQQeMByCGnNl +bGYtc2lnbmVkLnB5dGhvbnRlc3QubmV0MA0GCSqGSIb3DQEBBQUAA4GBAIOXmdtM +eG9qzP9TiXW/Gc/zI4cBfdCpC+Y4gOfC9bQUC7hefix4iO3+iZjgy3X/FaRxUUoV +HKiXcXIaWqTSUWp45cSh0MbwZXudp6JIAptzdAhvvCrPKeC9i9GvxsPD4LtDAL97 +vSaxQBezA7hdxZd90/EeyMgVZgAnTCnvAWX9 +-----END CERTIFICATE----- diff --git a/tls/self-signed-key.pem b/tls/self-signed-key.pem new file 
mode 100644 --- /dev/null +++ b/tls/self-signed-key.pem @@ -0,0 +1,16 @@ +-----BEGIN PRIVATE KEY----- +MIICdwIBADANBgkqhkiG9w0BAQEFAASCAmEwggJdAgEAAoGBANDXQXW9tjyZXt0I +v2tLL1+jinr4wGg36ioLDLFkMf+2Y1GL0v0BnKYG4N1OKlAU15LXGeGer8vmSv/y +IvmdrELvhAbbo3w4a9TMYQA4XkIVLdvu3mvNOAet+8PMJxn26dbDhG809ALvEHY5 +7lQsBS3G59RZyBPVqAqmImWNJnVzAgMBAAECgYEArO8iwJn5FxM1r7j3saRPtVWa +bZwgz+xFVs1RlG9Qy9w/QB6V93ZnPkCB4iBA/5FStcCzKNab4i9wOaNLfQIoysDZ +jOonRG6pbdFSIBnH4lw1UGi8SS34gFhvWuDW6QHya1enMu2eyOz0W756FUIy9uLx +V1//jNjeT7UcsFowgkkCQQD4ZlMnCWwygGKO3KXlHp0X44UL3HjIObBhaoBECkci +kxsbk8Iwarcq5BBKgwKtTaGvcnzlM9N5xTZ7v30nukANAkEA1zsSmB0P9k5pZsAs +xqRQggVdnjZ55zI6q6KrP69f9LJy8bEQ2Xz1MluAUwKsG26gsThzMPBdn2rWmjYf +9NirfwJAXhWr0zJfd/Vm30O11kW1LNIxl5+HZBdttkg3kw3tiav8bYKW3+3buPQv +M3nR7sBjyGdt5QavSAUpsM+D4SNLlQJAJ4flCWVFGkMantGrJ6zkUI01vapZx3n1 +RrLw6xiF8kaYUAXqh1epHV+q+RQjkkJGZ2Zr2dA8Edyon9hTFEB7dwJBAPRRChg8 +9fcihtNMiRwzGGr7rHtS1TpoA5hbIjPCbY8rHMkLdMnoxBa11E9PmXqyyyctrN+z +o54iWWshXKtbx24= +-----END PRIVATE KEY----- -- Repository URL: https://hg.python.org/pythontestdotnet From python-checkins at python.org Wed Nov 5 17:00:42 2014 From: python-checkins at python.org (victor.stinner) Date: Wed, 05 Nov 2014 16:00:42 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322793=2C_=2322637?= =?utf-8?q?=3A_Add_missing_=22import_os=22_in_uuid=2E=5Fifconfig=5Fgetnode?= =?utf-8?b?KCk=?= Message-ID: <20141105160036.108371.72610@psf.io> https://hg.python.org/cpython/rev/16d6c2443131 changeset: 93390:16d6c2443131 user: Victor Stinner date: Wed Nov 05 16:55:36 2014 +0100 summary: Issue #22793, #22637: Add missing "import os" in uuid._ifconfig_getnode() files: Lib/uuid.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -346,6 +346,7 @@ def _ifconfig_getnode(): """Get the hardware address on Unix by running ifconfig.""" + import os # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes. for args in ('', '-a', '-av'): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:09:19 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:09:19 +0000 Subject: [Python-checkins] =?utf-8?q?pythontestdotnet=3A_add_index_page?= Message-ID: <20141105160822.113480.79170@psf.io> https://hg.python.org/pythontestdotnet/rev/607a33b35ad4 changeset: 1:607a33b35ad4 user: Benjamin Peterson date: Wed Nov 05 11:08:16 2014 -0500 summary: add index page files: www/index.html | 10 ++++++++++ 1 files changed, 10 insertions(+), 0 deletions(-) diff --git a/www/index.html b/www/index.html new file mode 100644 --- /dev/null +++ b/www/index.html @@ -0,0 +1,10 @@ + + + + (C)Python test resources + + + This domain is hosted to host various services contacted by + the Python test suite. 
+ + -- Repository URL: https://hg.python.org/pythontestdotnet From python-checkins at python.org Wed Nov 5 17:12:37 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:12:37 +0000 Subject: [Python-checkins] =?utf-8?q?pythontestdotnet=3A_fix_wording?= Message-ID: <20141105161220.113462.77297@psf.io> https://hg.python.org/pythontestdotnet/rev/92f2abd2f88b changeset: 2:92f2abd2f88b user: Benjamin Peterson date: Wed Nov 05 11:12:18 2014 -0500 summary: fix wording files: www/index.html | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/www/index.html b/www/index.html --- a/www/index.html +++ b/www/index.html @@ -4,7 +4,7 @@ (C)Python test resources - This domain is hosted to host various services contacted by + This domain is used to host various services contacted by the Python test suite. -- Repository URL: https://hg.python.org/pythontestdotnet From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E2=29=3A_use_pythontest?= =?utf-8?q?=2Enet_for_url_fragment_test?= Message-ID: <20141105163108.108071.41985@psf.io> https://hg.python.org/cpython/rev/4fbf1a7c1e40 changeset: 93392:4fbf1a7c1e40 branch: 3.2 parent: 93371:c16e047965a2 user: Benjamin Peterson date: Wed Nov 05 11:27:14 2014 -0500 summary: use pythontest.net for url fragment test files: Lib/test/test_urllib2net.py | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -156,12 +156,12 @@ ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth]) def test_urlwithfrag(self): - urlwith_frag = "https://docs.python.org/2/glossary.html#glossary" + urlwith_frag = "http://www.pythontest.net/index.html#frag" with support.transient_internet(urlwith_frag): req = urllib.request.Request(urlwith_frag) res = urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/2/glossary.html#glossary") + "http://www.pythontest.net/index.html#frag") def test_custom_headers(self): url = "http://www.example.com" -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_remove_require?= =?utf-8?q?s=5Fssl_decorator?= Message-ID: <20141105163109.108099.11204@psf.io> https://hg.python.org/cpython/rev/2bad07298c5c changeset: 93395:2bad07298c5c branch: 3.4 user: Benjamin Peterson date: Wed Nov 05 11:30:21 2014 -0500 summary: remove requires_ssl decorator files: Lib/test/test_urllib2net.py | 1 - 1 files changed, 0 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -159,7 +159,6 @@ ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth]) - @requires_ssl def test_urlwithfrag(self): urlwith_frag = "http://www.pythontest.net/index.html#frag" with support.transient_internet(urlwith_frag): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= 
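The self-signed certificate and key committed to the pythontestdotnet repository above are intended to be pinned directly by test clients. A rough sketch of that usage, modelled on the test_httplib change that appears later in this digest; the local certificate path is an assumption:

    import http.client
    import ssl

    # assumed local copy of tls/self-signed-cert.pem
    CERTFILE = 'selfsigned_pythontestdotnet.pem'

    context = ssl.SSLContext(ssl.PROTOCOL_TLSv1)
    context.verify_mode = ssl.CERT_REQUIRED
    context.load_verify_locations(CERTFILE)   # trust exactly this certificate

    conn = http.client.HTTPSConnection('self-signed.pythontest.net', 443,
                                        context=context)
    conn.request('GET', '/')
    resp = conn.getresponse()
    print(resp.status, resp.getheader('server'))

Because verification is pinned to the server's own certificate, no CA bundle or third-party host is involved.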
=?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141105163109.108369.18083@psf.io> https://hg.python.org/cpython/rev/826566b1b219 changeset: 93396:826566b1b219 parent: 93390:16d6c2443131 parent: 93395:2bad07298c5c user: Benjamin Peterson date: Wed Nov 05 11:31:02 2014 -0500 summary: merge 3.4 files: Lib/test/test_urllib2net.py | 5 ++--- 1 files changed, 2 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -159,14 +159,13 @@ ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth]) - @requires_ssl def test_urlwithfrag(self): - urlwith_frag = "https://docs.python.org/2/glossary.html#glossary" + urlwith_frag = "http://www.pythontest.net/index.html#frag" with support.transient_internet(urlwith_frag): req = urllib.request.Request(urlwith_frag) res = urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/2/glossary.html#glossary") + "http://www.pythontest.net/index.html#frag") @requires_ssl def test_redirect_url_withfrag(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMy4zIC0+IDMuNCk6?= =?utf-8?q?_merge_3=2E3?= Message-ID: <20141105163109.113482.67959@psf.io> https://hg.python.org/cpython/rev/4045f28ccbec changeset: 93394:4045f28ccbec branch: 3.4 parent: 93388:d05ba48cfc29 parent: 93393:6c46859edfd7 user: Benjamin Peterson date: Wed Nov 05 11:30:00 2014 -0500 summary: merge 3.3 files: Lib/test/test_urllib2net.py | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -161,12 +161,12 @@ @requires_ssl def test_urlwithfrag(self): - urlwith_frag = "https://docs.python.org/2/glossary.html#glossary" + urlwith_frag = "http://www.pythontest.net/index.html#frag" with support.transient_internet(urlwith_frag): req = urllib.request.Request(urlwith_frag) res = urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/2/glossary.html#glossary") + "http://www.pythontest.net/index.html#frag") @requires_ssl def test_redirect_url_withfrag(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMy4yIC0+IDMuMyk6?= =?utf-8?q?_merge_3=2E2?= Message-ID: <20141105163108.85216.21957@psf.io> https://hg.python.org/cpython/rev/6c46859edfd7 changeset: 93393:6c46859edfd7 branch: 3.3 parent: 93372:b5d92b52d494 parent: 93392:4fbf1a7c1e40 user: Benjamin Peterson date: Wed Nov 05 11:29:39 2014 -0500 summary: merge 3.2 files: Lib/test/test_urllib2net.py | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -155,12 +155,12 @@ ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth]) def test_urlwithfrag(self): - urlwith_frag = "https://docs.python.org/2/glossary.html#glossary" + urlwith_frag = "http://www.pythontest.net/index.html#frag" with support.transient_internet(urlwith_frag): req = urllib.request.Request(urlwith_frag) res = 
urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/2/glossary.html#glossary") + "http://www.pythontest.net/index.html#frag") def test_custom_headers(self): url = "http://www.example.com" -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 17:31:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 16:31:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_use_pythontest?= =?utf-8?q?=2Enet_for_url_fragment_test?= Message-ID: <20141105163108.108087.44767@psf.io> https://hg.python.org/cpython/rev/603bd221527c changeset: 93391:603bd221527c branch: 2.7 parent: 93385:4c260cf1ba39 user: Benjamin Peterson date: Wed Nov 05 11:27:14 2014 -0500 summary: use pythontest.net for url fragment test files: Lib/test/test_urllib2net.py | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -155,12 +155,12 @@ ## self._test_urls(urls, self._extra_handlers()+[bauth, dauth]) def test_urlwithfrag(self): - urlwith_frag = "https://docs.python.org/2/glossary.html#glossary" + urlwith_frag = "http://www.pythontest.net/index.html#frag" with test_support.transient_internet(urlwith_frag): req = urllib2.Request(urlwith_frag) res = urllib2.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/2/glossary.html#glossary") + "http://www.pythontest.net/index.html#frag") def test_fileno(self): req = urllib2.Request("http://www.example.com") -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 18:59:57 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 17:59:57 +0000 Subject: [Python-checkins] =?utf-8?q?pythontestdotnet=3A_add_redirect_targ?= =?utf-8?q?et?= Message-ID: <20141105175950.108073.64464@psf.io> https://hg.python.org/pythontestdotnet/rev/5fdf30f78cf1 changeset: 3:5fdf30f78cf1 user: Benjamin Peterson date: Wed Nov 05 12:59:48 2014 -0500 summary: add redirect target files: www/elsewhere/index.html | 10 ++++++++++ 1 files changed, 10 insertions(+), 0 deletions(-) diff --git a/www/elsewhere/index.html b/www/elsewhere/index.html new file mode 100644 --- /dev/null +++ b/www/elsewhere/index.html @@ -0,0 +1,10 @@ + + + +Redirect target + + +This is a redirect target. 
+ + + -- Repository URL: https://hg.python.org/pythontestdotnet From python-checkins at python.org Wed Nov 5 19:10:35 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 18:10:35 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141105181020.108081.93656@psf.io> https://hg.python.org/cpython/rev/98ee59f61940 changeset: 93398:98ee59f61940 parent: 93396:826566b1b219 parent: 93397:ffa326335c4d user: Benjamin Peterson date: Wed Nov 05 13:10:16 2014 -0500 summary: merge 3.4 files: Lib/test/test_urllib2net.py | 12 ++---------- 1 files changed, 2 insertions(+), 10 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -8,13 +8,6 @@ import urllib.request import sys -try: - import ssl -except ImportError: - ssl = None - -requires_ssl = unittest.skipIf(ssl is None, "SSL not supported") - support.requires("network") TIMEOUT = 60 # seconds @@ -167,14 +160,13 @@ self.assertEqual(res.geturl(), "http://www.pythontest.net/index.html#frag") - @requires_ssl def test_redirect_url_withfrag(self): - redirect_url_with_frag = "http://bit.ly/1iSHToT" + redirect_url_with_frag = "http://www.pythontest.net/redir/with_frag/" with support.transient_internet(redirect_url_with_frag): req = urllib.request.Request(redirect_url_with_frag) res = urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/3.4/glossary.html#term-global-interpreter-lock") + "http://www.pythontest.net/elsewhere/#frag") def test_custom_headers(self): url = "http://www.example.com" -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 19:10:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 05 Nov 2014 18:10:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_use_pythontest?= =?utf-8?q?=2Enet_for_fragment_redirection_test?= Message-ID: <20141105181019.703.92636@psf.io> https://hg.python.org/cpython/rev/ffa326335c4d changeset: 93397:ffa326335c4d branch: 3.4 parent: 93395:2bad07298c5c user: Benjamin Peterson date: Wed Nov 05 13:10:08 2014 -0500 summary: use pythontest.net for fragment redirection test files: Lib/test/test_urllib2net.py | 12 ++---------- 1 files changed, 2 insertions(+), 10 deletions(-) diff --git a/Lib/test/test_urllib2net.py b/Lib/test/test_urllib2net.py --- a/Lib/test/test_urllib2net.py +++ b/Lib/test/test_urllib2net.py @@ -8,13 +8,6 @@ import urllib.request import sys -try: - import ssl -except ImportError: - ssl = None - -requires_ssl = unittest.skipIf(ssl is None, "SSL not supported") - support.requires("network") TIMEOUT = 60 # seconds @@ -167,14 +160,13 @@ self.assertEqual(res.geturl(), "http://www.pythontest.net/index.html#frag") - @requires_ssl def test_redirect_url_withfrag(self): - redirect_url_with_frag = "http://bit.ly/1iSHToT" + redirect_url_with_frag = "http://www.pythontest.net/redir/with_frag/" with support.transient_internet(redirect_url_with_frag): req = urllib.request.Request(redirect_url_with_frag) res = urllib.request.urlopen(req) self.assertEqual(res.geturl(), - "https://docs.python.org/3.4/glossary.html#term-global-interpreter-lock") + "http://www.pythontest.net/elsewhere/#frag") def test_custom_headers(self): url = "http://www.example.com" -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 20:22:45 2014 From: python-checkins at python.org (georg.brandl) 
Date: Wed, 05 Nov 2014 19:22:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogQ2xvc2VzICMyMjUy?= =?utf-8?q?5=3A_clarify_documentation_for_ast=2Eliteral=5Feval=28=29=2E?= Message-ID: <20141105192105.719.63871@psf.io> https://hg.python.org/cpython/rev/5c5909740026 changeset: 93399:5c5909740026 branch: 3.4 parent: 93397:ffa326335c4d user: Georg Brandl date: Wed Nov 05 20:20:28 2014 +0100 summary: Closes #22525: clarify documentation for ast.literal_eval(). files: Doc/library/ast.rst | 14 ++++++++------ 1 files changed, 8 insertions(+), 6 deletions(-) diff --git a/Doc/library/ast.rst b/Doc/library/ast.rst --- a/Doc/library/ast.rst +++ b/Doc/library/ast.rst @@ -115,13 +115,15 @@ .. function:: literal_eval(node_or_string) - Safely evaluate an expression node or a string containing a Python - expression. The string or node provided may only consist of the following - Python literal structures: strings, bytes, numbers, tuples, lists, dicts, - sets, booleans, and ``None``. + Safely evaluate an expression node or a string containing a Python literal or + container display. The string or node provided may only consist of the + following Python literal structures: strings, bytes, numbers, tuples, lists, + dicts, sets, booleans, and ``None``. - This can be used for safely evaluating strings containing Python expressions - from untrusted sources without the need to parse the values oneself. + This can be used for safely evaluating strings containing Python values from + untrusted sources without the need to parse the values oneself. It is not + capable of evaluating arbitrarily complex expressions, for example involving + operators or indexing. .. versionchanged:: 3.2 Now allows bytes and set literals. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 20:22:45 2014 From: python-checkins at python.org (georg.brandl) Date: Wed, 05 Nov 2014 19:22:45 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge_with_3=2E4?= Message-ID: <20141105192105.85200.29777@psf.io> https://hg.python.org/cpython/rev/ce07253e384f changeset: 93400:ce07253e384f parent: 93398:98ee59f61940 parent: 93399:5c5909740026 user: Georg Brandl date: Wed Nov 05 20:20:45 2014 +0100 summary: merge with 3.4 files: Doc/library/ast.rst | 14 ++++++++------ 1 files changed, 8 insertions(+), 6 deletions(-) diff --git a/Doc/library/ast.rst b/Doc/library/ast.rst --- a/Doc/library/ast.rst +++ b/Doc/library/ast.rst @@ -115,13 +115,15 @@ .. function:: literal_eval(node_or_string) - Safely evaluate an expression node or a string containing a Python - expression. The string or node provided may only consist of the following - Python literal structures: strings, bytes, numbers, tuples, lists, dicts, - sets, booleans, and ``None``. + Safely evaluate an expression node or a string containing a Python literal or + container display. The string or node provided may only consist of the + following Python literal structures: strings, bytes, numbers, tuples, lists, + dicts, sets, booleans, and ``None``. - This can be used for safely evaluating strings containing Python expressions - from untrusted sources without the need to parse the values oneself. + This can be used for safely evaluating strings containing Python values from + untrusted sources without the need to parse the values oneself. It is not + capable of evaluating arbitrarily complex expressions, for example involving + operators or indexing. .. 
versionchanged:: 3.2 Now allows bytes and set literals. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 20:24:15 2014 From: python-checkins at python.org (georg.brandl) Date: Wed, 05 Nov 2014 19:24:15 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogQ2xvc2VzICMyMjUy?= =?utf-8?q?5=3A_clarify_documentation_for_ast=2Eliteral=5Feval=28=29=2E?= Message-ID: <20141105192409.108379.34047@psf.io> https://hg.python.org/cpython/rev/3e8d3c4bc17e changeset: 93401:3e8d3c4bc17e branch: 2.7 parent: 93391:603bd221527c user: Georg Brandl date: Wed Nov 05 20:20:28 2014 +0100 summary: Closes #22525: clarify documentation for ast.literal_eval(). files: Doc/library/ast.rst | 12 +++++++----- 1 files changed, 7 insertions(+), 5 deletions(-) diff --git a/Doc/library/ast.rst b/Doc/library/ast.rst --- a/Doc/library/ast.rst +++ b/Doc/library/ast.rst @@ -132,12 +132,14 @@ .. function:: literal_eval(node_or_string) Safely evaluate an expression node or a Unicode or *Latin-1* encoded string - containing a Python expression. The string or node provided may only consist - of the following Python literal structures: strings, numbers, tuples, lists, - dicts, booleans, and ``None``. + containing a Python literal or container display. The string or node + provided may only consist of the following Python literal structures: + strings, numbers, tuples, lists, dicts, booleans, and ``None``. - This can be used for safely evaluating strings containing Python expressions - from untrusted sources without the need to parse the values oneself. + This can be used for safely evaluating strings containing Python values from + untrusted sources without the need to parse the values oneself. It is not + capable of evaluating arbitrarily complex expressions, for example involving + operators or indexing. .. function:: get_docstring(node, clean=True) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 20:49:36 2014 From: python-checkins at python.org (antoine.pitrou) Date: Wed, 05 Nov 2014 19:49:36 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogQ2xvc2VzICMyMjc4?= =?utf-8?q?4=3A_fix_test=5Fasyncio_when_the_ssl_module_isn=27t_available?= Message-ID: <20141105194914.113480.30880@psf.io> https://hg.python.org/cpython/rev/7e9e2b17ac6f changeset: 93402:7e9e2b17ac6f branch: 3.4 parent: 93399:5c5909740026 user: Antoine Pitrou date: Wed Nov 05 20:48:16 2014 +0100 summary: Closes #22784: fix test_asyncio when the ssl module isn't available files: Lib/test/test_asyncio/test_events.py | 17 ++++++++------- 1 files changed, 9 insertions(+), 8 deletions(-) diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -606,14 +606,15 @@ self.assertGreater(pr.nbytes, 0) tr.close() - def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, - cafile=None, capath=None, cadata=None): - """ - A ssl.create_default_context() replacement that doesn't enable - cert validation. - """ - self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) - return test_utils.dummy_ssl_context() + if ssl: + def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, + cafile=None, capath=None, cadata=None): + """ + A ssl.create_default_context() replacement that doesn't enable + cert validation. 
+ """ + self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) + return test_utils.dummy_ssl_context() def _test_create_ssl_connection(self, httpd, create_connection, check_sockname=True): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 20:49:36 2014 From: python-checkins at python.org (antoine.pitrou) Date: Wed, 05 Nov 2014 19:49:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Closes_=2322784=3A_fix_test=5Fasyncio_when_the_ssl_modul?= =?utf-8?q?e_isn=27t_available?= Message-ID: <20141105194914.108393.60951@psf.io> https://hg.python.org/cpython/rev/028c729714af changeset: 93403:028c729714af parent: 93400:ce07253e384f parent: 93402:7e9e2b17ac6f user: Antoine Pitrou date: Wed Nov 05 20:48:40 2014 +0100 summary: Closes #22784: fix test_asyncio when the ssl module isn't available files: Lib/test/test_asyncio/test_events.py | 17 ++++++++------- 1 files changed, 9 insertions(+), 8 deletions(-) diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -606,14 +606,15 @@ self.assertGreater(pr.nbytes, 0) tr.close() - def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, - cafile=None, capath=None, cadata=None): - """ - A ssl.create_default_context() replacement that doesn't enable - cert validation. - """ - self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) - return test_utils.dummy_ssl_context() + if ssl: + def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, + cafile=None, capath=None, cadata=None): + """ + A ssl.create_default_context() replacement that doesn't enable + cert validation. + """ + self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) + return test_utils.dummy_ssl_context() def _test_create_ssl_connection(self, httpd, create_connection, check_sockname=True): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 22:18:37 2014 From: python-checkins at python.org (georg.brandl) Date: Wed, 05 Nov 2014 21:18:37 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogdGVzdF9odHRwbGli?= =?utf-8?q?=3A_use_self-signed=2Epythontest=2Enet_for_verification_test_wi?= =?utf-8?q?th?= Message-ID: <20141105211833.108387.70219@psf.io> https://hg.python.org/cpython/rev/4985375db40f changeset: 93404:4985375db40f branch: 3.4 parent: 93402:7e9e2b17ac6f user: Georg Brandl date: Wed Nov 05 20:37:40 2014 +0100 summary: test_httplib: use self-signed.pythontest.net for verification test with non-root-CA cert files: Lib/test/selfsigned_pythontestdotnet.pem | 16 +++++++++ Lib/test/test_httplib.py | 20 ++++------- 2 files changed, 24 insertions(+), 12 deletions(-) diff --git a/Lib/test/selfsigned_pythontestdotnet.pem b/Lib/test/selfsigned_pythontestdotnet.pem new file mode 100644 --- /dev/null +++ b/Lib/test/selfsigned_pythontestdotnet.pem @@ -0,0 +1,16 @@ +-----BEGIN CERTIFICATE----- +MIIChzCCAfCgAwIBAgIJAKGU95wKR8pSMA0GCSqGSIb3DQEBBQUAMHAxCzAJBgNV +BAYTAlhZMRcwFQYDVQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9u +IFNvZnR3YXJlIEZvdW5kYXRpb24xIzAhBgNVBAMMGnNlbGYtc2lnbmVkLnB5dGhv +bnRlc3QubmV0MB4XDTE0MTEwMjE4MDkyOVoXDTI0MTAzMDE4MDkyOVowcDELMAkG +A1UEBhMCWFkxFzAVBgNVBAcMDkNhc3RsZSBBbnRocmF4MSMwIQYDVQQKDBpQeXRo +b24gU29mdHdhcmUgRm91bmRhdGlvbjEjMCEGA1UEAwwac2VsZi1zaWduZWQucHl0 +aG9udGVzdC5uZXQwgZ8wDQYJKoZIhvcNAQEBBQADgY0AMIGJAoGBANDXQXW9tjyZ +Xt0Iv2tLL1+jinr4wGg36ioLDLFkMf+2Y1GL0v0BnKYG4N1OKlAU15LXGeGer8vm 
+Sv/yIvmdrELvhAbbo3w4a9TMYQA4XkIVLdvu3mvNOAet+8PMJxn26dbDhG809ALv +EHY57lQsBS3G59RZyBPVqAqmImWNJnVzAgMBAAGjKTAnMCUGA1UdEQQeMByCGnNl +bGYtc2lnbmVkLnB5dGhvbnRlc3QubmV0MA0GCSqGSIb3DQEBBQUAA4GBAIOXmdtM +eG9qzP9TiXW/Gc/zI4cBfdCpC+Y4gOfC9bQUC7hefix4iO3+iZjgy3X/FaRxUUoV +HKiXcXIaWqTSUWp45cSh0MbwZXudp6JIAptzdAhvvCrPKeC9i9GvxsPD4LtDAL97 +vSaxQBezA7hdxZd90/EeyMgVZgAnTCnvAWX9 +-----END CERTIFICATE----- diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -15,8 +15,8 @@ CERT_localhost = os.path.join(here, 'keycert.pem') # Self-signed cert file for 'fakehostname' CERT_fakehostname = os.path.join(here, 'keycert2.pem') -# Root cert file (CA) for svn.python.org's cert -CACERT_svn_python_org = os.path.join(here, 'https_svn_python_org_root.pem') +# Self-signed cert file for self-signed.pythontest.net +CERT_selfsigned_pythontestdotnet = os.path.join(here, 'selfsigned_pythontestdotnet.pem') HOST = support.HOST @@ -772,11 +772,6 @@ h = client.HTTPSConnection(HOST, TimeoutTest.PORT, timeout=30) self.assertEqual(h.timeout, 30) - def _check_svn_python_org(self, resp): - # Just a simple check that everything went fine - server_string = resp.getheader('server') - self.assertIn('Apache', server_string) - def test_networked(self): # Default settings: requires a valid cert from a trusted CA import ssl @@ -810,17 +805,18 @@ self.assertIn('text/html', content_type) def test_networked_good_cert(self): - # We feed a CA cert that validates the server's cert + # We feed the server's cert as a validating cert import ssl support.requires('network') - with support.transient_internet('svn.python.org'): + with support.transient_internet('self-signed.pythontest.net'): context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.verify_mode = ssl.CERT_REQUIRED - context.load_verify_locations(CACERT_svn_python_org) - h = client.HTTPSConnection('svn.python.org', 443, context=context) + context.load_verify_locations(CERT_selfsigned_pythontestdotnet) + h = client.HTTPSConnection('self-signed.pythontest.net', 443, context=context) h.request('GET', '/') resp = h.getresponse() - self._check_svn_python_org(resp) + server_string = resp.getheader('server') + self.assertIn('nginx', server_string) def test_networked_bad_cert(self): # We feed a "CA" cert that is unrelated to the server's cert -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 5 22:18:39 2014 From: python-checkins at python.org (georg.brandl) Date: Wed, 05 Nov 2014 21:18:39 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge_with_3=2E4?= Message-ID: <20141105211834.113474.4902@psf.io> https://hg.python.org/cpython/rev/089573725c77 changeset: 93405:089573725c77 parent: 93403:028c729714af parent: 93404:4985375db40f user: Georg Brandl date: Wed Nov 05 22:17:29 2014 +0100 summary: merge with 3.4 files: Lib/test/selfsigned_pythontestdotnet.pem | 16 +++++++++ Lib/test/test_httplib.py | 20 ++++------- 2 files changed, 24 insertions(+), 12 deletions(-) diff --git a/Lib/test/selfsigned_pythontestdotnet.pem b/Lib/test/selfsigned_pythontestdotnet.pem new file mode 100644 --- /dev/null +++ b/Lib/test/selfsigned_pythontestdotnet.pem @@ -0,0 +1,16 @@ +-----BEGIN CERTIFICATE----- +MIIChzCCAfCgAwIBAgIJAKGU95wKR8pSMA0GCSqGSIb3DQEBBQUAMHAxCzAJBgNV +BAYTAlhZMRcwFQYDVQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9u +IFNvZnR3YXJlIEZvdW5kYXRpb24xIzAhBgNVBAMMGnNlbGYtc2lnbmVkLnB5dGhv 
+bnRlc3QubmV0MB4XDTE0MTEwMjE4MDkyOVoXDTI0MTAzMDE4MDkyOVowcDELMAkG +A1UEBhMCWFkxFzAVBgNVBAcMDkNhc3RsZSBBbnRocmF4MSMwIQYDVQQKDBpQeXRo +b24gU29mdHdhcmUgRm91bmRhdGlvbjEjMCEGA1UEAwwac2VsZi1zaWduZWQucHl0 +aG9udGVzdC5uZXQwgZ8wDQYJKoZIhvcNAQEBBQADgY0AMIGJAoGBANDXQXW9tjyZ +Xt0Iv2tLL1+jinr4wGg36ioLDLFkMf+2Y1GL0v0BnKYG4N1OKlAU15LXGeGer8vm +Sv/yIvmdrELvhAbbo3w4a9TMYQA4XkIVLdvu3mvNOAet+8PMJxn26dbDhG809ALv +EHY57lQsBS3G59RZyBPVqAqmImWNJnVzAgMBAAGjKTAnMCUGA1UdEQQeMByCGnNl +bGYtc2lnbmVkLnB5dGhvbnRlc3QubmV0MA0GCSqGSIb3DQEBBQUAA4GBAIOXmdtM +eG9qzP9TiXW/Gc/zI4cBfdCpC+Y4gOfC9bQUC7hefix4iO3+iZjgy3X/FaRxUUoV +HKiXcXIaWqTSUWp45cSh0MbwZXudp6JIAptzdAhvvCrPKeC9i9GvxsPD4LtDAL97 +vSaxQBezA7hdxZd90/EeyMgVZgAnTCnvAWX9 +-----END CERTIFICATE----- diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -15,8 +15,8 @@ CERT_localhost = os.path.join(here, 'keycert.pem') # Self-signed cert file for 'fakehostname' CERT_fakehostname = os.path.join(here, 'keycert2.pem') -# Root cert file (CA) for svn.python.org's cert -CACERT_svn_python_org = os.path.join(here, 'https_svn_python_org_root.pem') +# Self-signed cert file for self-signed.pythontest.net +CERT_selfsigned_pythontestdotnet = os.path.join(here, 'selfsigned_pythontestdotnet.pem') # constants for testing chunked encoding chunked_start = ( @@ -1006,11 +1006,6 @@ h = client.HTTPSConnection(HOST, TimeoutTest.PORT, timeout=30) self.assertEqual(h.timeout, 30) - def _check_svn_python_org(self, resp): - # Just a simple check that everything went fine - server_string = resp.getheader('server') - self.assertIn('Apache', server_string) - def test_networked(self): # Default settings: requires a valid cert from a trusted CA import ssl @@ -1044,17 +1039,18 @@ self.assertIn('text/html', content_type) def test_networked_good_cert(self): - # We feed a CA cert that validates the server's cert + # We feed the server's cert as a validating cert import ssl support.requires('network') - with support.transient_internet('svn.python.org'): + with support.transient_internet('self-signed.pythontest.net'): context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) context.verify_mode = ssl.CERT_REQUIRED - context.load_verify_locations(CACERT_svn_python_org) - h = client.HTTPSConnection('svn.python.org', 443, context=context) + context.load_verify_locations(CERT_selfsigned_pythontestdotnet) + h = client.HTTPSConnection('self-signed.pythontest.net', 443, context=context) h.request('GET', '/') resp = h.getresponse() - self._check_svn_python_org(resp) + server_string = resp.getheader('server') + self.assertIn('nginx', server_string) def test_networked_bad_cert(self): # We feed a "CA" cert that is unrelated to the server's cert -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 04:31:08 2014 From: python-checkins at python.org (steve.dower) Date: Thu, 06 Nov 2014 03:31:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIwMTYw?= =?utf-8?q?=3A_broken_ctypes_calling_convention_on_MSVC_/_64-bit_Windows_?= =?utf-8?q?=28large?= Message-ID: <20141106033103.85196.11331@psf.io> https://hg.python.org/cpython/rev/f75b0470168b changeset: 93406:f75b0470168b branch: 2.7 parent: 93401:3e8d3c4bc17e user: Steve Dower date: Wed Nov 05 19:16:05 2014 -0800 summary: Issue #20160: broken ctypes calling convention on MSVC / 64-bit Windows (large structs). 
Patch by mattip files: Lib/ctypes/test/test_win32.py | 26 +++++++- Modules/_ctypes/_ctypes_test.c | 43 ++++++++++++++ Modules/_ctypes/callproc.c | 6 +- Modules/_ctypes/libffi_msvc/ffi.c | 29 +++++++- Modules/_ctypes/libffi_msvc/prep_cif.c | 18 ++++- Modules/_ctypes/libffi_msvc/types.c | 2 +- 6 files changed, 106 insertions(+), 18 deletions(-) diff --git a/Lib/ctypes/test/test_win32.py b/Lib/ctypes/test/test_win32.py --- a/Lib/ctypes/test/test_win32.py +++ b/Lib/ctypes/test/test_win32.py @@ -90,9 +90,29 @@ dll = CDLL(_ctypes_test.__file__) - pt = POINT(10, 10) - rect = RECT(0, 0, 20, 20) - self.assertEqual(1, dll.PointInRect(byref(rect), pt)) + pt = POINT(15, 25) + left = c_long.in_dll(dll, 'left') + top = c_long.in_dll(dll, 'top') + right = c_long.in_dll(dll, 'right') + bottom = c_long.in_dll(dll, 'bottom') + rect = RECT(left, top, right, bottom) + PointInRect = dll.PointInRect + PointInRect.argtypes = [POINTER(RECT), POINT] + self.assertEqual(1, PointInRect(byref(rect), pt)) + + ReturnRect = dll.ReturnRect + ReturnRect.argtypes = [c_int, RECT, POINTER(RECT), POINT, RECT, + POINTER(RECT), POINT, RECT] + ReturnRect.restype = RECT + for i in range(4): + ret = ReturnRect(i, rect, pointer(rect), pt, rect, + byref(rect), pt, rect) + # the c function will check and modify ret if something is + # passed in improperly + self.assertEqual(ret.left, left.value) + self.assertEqual(ret.right, right.value) + self.assertEqual(ret.top, top.value) + self.assertEqual(ret.bottom, bottom.value) if __name__ == '__main__': unittest.main() diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -540,6 +540,49 @@ return 1; } +EXPORT(int left = 10); +EXPORT(int top = 20); +EXPORT(int right = 30); +EXPORT(int bottom = 40); + +EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, + RECT *er, POINT fp, RECT gr) +{ + /*Check input */ + if (ar.left + br->left + dr.left + er->left + gr.left != left * 5) + { + ar.left = 100; + return ar; + } + if (ar.right + br->right + dr.right + er->right + gr.right != right * 5) + { + ar.right = 100; + return ar; + } + if (cp.x != fp.x) + { + ar.left = -100; + } + if (cp.y != fp.y) + { + ar.left = -200; + } + switch(i) + { + case 0: + return ar; + break; + case 1: + return dr; + break; + case 2: + return gr; + break; + + } + return ar; +} + typedef struct { short x; short y; diff --git a/Modules/_ctypes/callproc.c b/Modules/_ctypes/callproc.c --- a/Modules/_ctypes/callproc.c +++ b/Modules/_ctypes/callproc.c @@ -1170,11 +1170,7 @@ } for (i = 0; i < argcount; ++i) { atypes[i] = args[i].ffi_type; - if (atypes[i]->type == FFI_TYPE_STRUCT -#ifdef _WIN64 - && atypes[i]->size <= sizeof(void *) -#endif - ) + if (atypes[i]->type == FFI_TYPE_STRUCT) avalues[i] = (void *)args[i].value.p; else avalues[i] = (void *)&args[i].value; diff --git a/Modules/_ctypes/libffi_msvc/ffi.c b/Modules/_ctypes/libffi_msvc/ffi.c --- a/Modules/_ctypes/libffi_msvc/ffi.c +++ b/Modules/_ctypes/libffi_msvc/ffi.c @@ -102,6 +102,15 @@ FFI_ASSERT(0); } } +#ifdef _WIN64 + else if (z > 8) + { + /* On Win64, if a single argument takes more than 8 bytes, + then it is always passed by reference. 
*/ + *(void **)argp = *p_argv; + z = 8; + } +#endif else { memcpy(argp, *p_argv, z); @@ -124,7 +133,6 @@ switch (cif->rtype->type) { case FFI_TYPE_VOID: - case FFI_TYPE_STRUCT: case FFI_TYPE_SINT64: case FFI_TYPE_FLOAT: case FFI_TYPE_DOUBLE: @@ -132,6 +140,18 @@ cif->flags = (unsigned) cif->rtype->type; break; + case FFI_TYPE_STRUCT: + /* MSVC returns small structures in registers. Put in cif->flags + the value FFI_TYPE_STRUCT only if the structure is big enough; + otherwise, put the 4- or 8-bytes integer type. */ + if (cif->rtype->size <= 4) + cif->flags = FFI_TYPE_INT; + else if (cif->rtype->size <= 8) + cif->flags = FFI_TYPE_SINT64; + else + cif->flags = FFI_TYPE_STRUCT; + break; + case FFI_TYPE_UINT64: #ifdef _WIN64 case FFI_TYPE_POINTER: @@ -201,8 +221,7 @@ #else case FFI_SYSV: /*@-usedef@*/ - /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ - return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes ? cif->bytes : 40, + return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes, cif->flags, ecif.rvalue, fn); /*@=usedef@*/ break; @@ -227,7 +246,7 @@ #else static void __fastcall #endif -ffi_closure_SYSV (ffi_closure *closure, int *argp) +ffi_closure_SYSV (ffi_closure *closure, char *argp) { // this is our return value storage long double res; @@ -237,7 +256,7 @@ void **arg_area; unsigned short rtype; void *resp = (void*)&res; - void *args = &argp[1]; + void *args = argp + sizeof(void*); cif = closure->cif; arg_area = (void**) alloca (cif->nargs * sizeof (void*)); diff --git a/Modules/_ctypes/libffi_msvc/prep_cif.c b/Modules/_ctypes/libffi_msvc/prep_cif.c --- a/Modules/_ctypes/libffi_msvc/prep_cif.c +++ b/Modules/_ctypes/libffi_msvc/prep_cif.c @@ -116,9 +116,9 @@ #if !defined M68K && !defined __x86_64__ && !defined S390 /* Make space for the return structure pointer */ if (cif->rtype->type == FFI_TYPE_STRUCT - /* MSVC returns small structures in registers. But we have a different - workaround: pretend int32 or int64 return type, and converting to - structure afterwards. 
*/ +#ifdef _WIN32 + && (cif->rtype->size > 8) /* MSVC returns small structs in registers */ +#endif #ifdef SPARC && (cif->abi != FFI_V9 || cif->rtype->size > 32) #endif @@ -143,7 +143,11 @@ && ((*ptr)->size > 16 || cif->abi != FFI_V9)) || ((*ptr)->type == FFI_TYPE_LONGDOUBLE && cif->abi != FFI_V9)) - bytes += sizeof(void*); + bytes += sizeof(void*); + else +#elif defined (_WIN64) + if ((*ptr)->type == FFI_TYPE_STRUCT && ((*ptr)->size > 8)) + bytes += sizeof(void*); else #endif { @@ -168,6 +172,12 @@ #endif } +#ifdef _WIN64 + /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ + if (bytes < 40) + bytes = 40; +#endif + cif->bytes = bytes; /* Perform machine dependent cif processing */ diff --git a/Modules/_ctypes/libffi_msvc/types.c b/Modules/_ctypes/libffi_msvc/types.c --- a/Modules/_ctypes/libffi_msvc/types.c +++ b/Modules/_ctypes/libffi_msvc/types.c @@ -43,7 +43,7 @@ FFI_INTEGRAL_TYPEDEF(float, 4, 4, FFI_TYPE_FLOAT); #if defined ALPHA || defined SPARC64 || defined X86_64 || defined S390X \ - || defined IA64 + || defined IA64 || defined _WIN64 FFI_INTEGRAL_TYPEDEF(pointer, 8, 8, FFI_TYPE_POINTER); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 04:31:26 2014 From: python-checkins at python.org (steve.dower) Date: Thu, 06 Nov 2014 03:31:26 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIwMTYw?= =?utf-8?q?=3A_broken_ctypes_calling_convention_on_MSVC_/_64-bit_Windows_?= =?utf-8?q?=28large?= Message-ID: <20141106033126.108373.87640@psf.io> https://hg.python.org/cpython/rev/cd36ba22602d changeset: 93407:cd36ba22602d branch: 3.4 parent: 93404:4985375db40f user: Steve Dower date: Tue Nov 04 21:21:22 2014 -0800 summary: Issue #20160: broken ctypes calling convention on MSVC / 64-bit Windows (large structs) Patch by mattip files: Lib/ctypes/test/test_win32.py | 26 +++++++- Modules/_ctypes/_ctypes_test.c | 43 ++++++++++++++ Modules/_ctypes/callproc.c | 3 - Modules/_ctypes/libffi_msvc/ffi.c | 29 +++++++- Modules/_ctypes/libffi_msvc/prep_cif.c | 16 ++++- Modules/_ctypes/libffi_msvc/types.c | 2 +- 6 files changed, 104 insertions(+), 15 deletions(-) diff --git a/Lib/ctypes/test/test_win32.py b/Lib/ctypes/test/test_win32.py --- a/Lib/ctypes/test/test_win32.py +++ b/Lib/ctypes/test/test_win32.py @@ -111,9 +111,29 @@ dll = CDLL(_ctypes_test.__file__) - pt = POINT(10, 10) - rect = RECT(0, 0, 20, 20) - self.assertEqual(1, dll.PointInRect(byref(rect), pt)) + pt = POINT(15, 25) + left = c_long.in_dll(dll, 'left') + top = c_long.in_dll(dll, 'top') + right = c_long.in_dll(dll, 'right') + bottom = c_long.in_dll(dll, 'bottom') + rect = RECT(left, top, right, bottom) + PointInRect = dll.PointInRect + PointInRect.argtypes = [POINTER(RECT), POINT] + self.assertEqual(1, PointInRect(byref(rect), pt)) + + ReturnRect = dll.ReturnRect + ReturnRect.argtypes = [c_int, RECT, POINTER(RECT), POINT, RECT, + POINTER(RECT), POINT, RECT] + ReturnRect.restype = RECT + for i in range(4): + ret = ReturnRect(i, rect, pointer(rect), pt, rect, + byref(rect), pt, rect) + # the c function will check and modify ret if something is + # passed in improperly + self.assertEqual(ret.left, left.value) + self.assertEqual(ret.right, right.value) + self.assertEqual(ret.top, top.value) + self.assertEqual(ret.bottom, bottom.value) if __name__ == '__main__': unittest.main() diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -527,6 +527,49 @@ return 1; } 
+EXPORT(int left = 10); +EXPORT(int top = 20); +EXPORT(int right = 30); +EXPORT(int bottom = 40); + +EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, + RECT *er, POINT fp, RECT gr) +{ + /*Check input */ + if (ar.left + br->left + dr.left + er->left + gr.left != left * 5) + { + ar.left = 100; + return ar; + } + if (ar.right + br->right + dr.right + er->right + gr.right != right * 5) + { + ar.right = 100; + return ar; + } + if (cp.x != fp.x) + { + ar.left = -100; + } + if (cp.y != fp.y) + { + ar.left = -200; + } + switch(i) + { + case 0: + return ar; + break; + case 1: + return dr; + break; + case 2: + return gr; + break; + + } + return ar; +} + typedef struct { short x; short y; diff --git a/Modules/_ctypes/callproc.c b/Modules/_ctypes/callproc.c --- a/Modules/_ctypes/callproc.c +++ b/Modules/_ctypes/callproc.c @@ -1140,9 +1140,6 @@ for (i = 0; i < argcount; ++i) { atypes[i] = args[i].ffi_type; if (atypes[i]->type == FFI_TYPE_STRUCT -#ifdef _WIN64 - && atypes[i]->size <= sizeof(void *) -#endif ) avalues[i] = (void *)args[i].value.p; else diff --git a/Modules/_ctypes/libffi_msvc/ffi.c b/Modules/_ctypes/libffi_msvc/ffi.c --- a/Modules/_ctypes/libffi_msvc/ffi.c +++ b/Modules/_ctypes/libffi_msvc/ffi.c @@ -102,6 +102,15 @@ FFI_ASSERT(0); } } +#ifdef _WIN64 + else if (z > 8) + { + /* On Win64, if a single argument takes more than 8 bytes, + then it is always passed by reference. */ + *(void **)argp = *p_argv; + z = 8; + } +#endif else { memcpy(argp, *p_argv, z); @@ -124,7 +133,6 @@ switch (cif->rtype->type) { case FFI_TYPE_VOID: - case FFI_TYPE_STRUCT: case FFI_TYPE_SINT64: case FFI_TYPE_FLOAT: case FFI_TYPE_DOUBLE: @@ -132,6 +140,18 @@ cif->flags = (unsigned) cif->rtype->type; break; + case FFI_TYPE_STRUCT: + /* MSVC returns small structures in registers. Put in cif->flags + the value FFI_TYPE_STRUCT only if the structure is big enough; + otherwise, put the 4- or 8-bytes integer type. */ + if (cif->rtype->size <= 4) + cif->flags = FFI_TYPE_INT; + else if (cif->rtype->size <= 8) + cif->flags = FFI_TYPE_SINT64; + else + cif->flags = FFI_TYPE_STRUCT; + break; + case FFI_TYPE_UINT64: #ifdef _WIN64 case FFI_TYPE_POINTER: @@ -201,8 +221,7 @@ #else case FFI_SYSV: /*@-usedef@*/ - /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ - return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes ? cif->bytes : 40, + return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes, cif->flags, ecif.rvalue, fn); /*@=usedef@*/ break; @@ -227,7 +246,7 @@ #else static void __fastcall #endif -ffi_closure_SYSV (ffi_closure *closure, int *argp) +ffi_closure_SYSV (ffi_closure *closure, char *argp) { // this is our return value storage long double res; @@ -237,7 +256,7 @@ void **arg_area; unsigned short rtype; void *resp = (void*)&res; - void *args = &argp[1]; + void *args = argp + sizeof(void*); cif = closure->cif; arg_area = (void**) alloca (cif->nargs * sizeof (void*)); diff --git a/Modules/_ctypes/libffi_msvc/prep_cif.c b/Modules/_ctypes/libffi_msvc/prep_cif.c --- a/Modules/_ctypes/libffi_msvc/prep_cif.c +++ b/Modules/_ctypes/libffi_msvc/prep_cif.c @@ -116,9 +116,9 @@ #if !defined M68K && !defined __x86_64__ && !defined S390 /* Make space for the return structure pointer */ if (cif->rtype->type == FFI_TYPE_STRUCT - /* MSVC returns small structures in registers. But we have a different - workaround: pretend int32 or int64 return type, and converting to - structure afterwards. 
*/ +#ifdef _WIN32 + && (cif->rtype->size > 8) /* MSVC returns small structs in registers */ +#endif #ifdef SPARC && (cif->abi != FFI_V9 || cif->rtype->size > 32) #endif @@ -145,6 +145,10 @@ && cif->abi != FFI_V9)) bytes += sizeof(void*); else +#elif defined (_WIN64) + if ((*ptr)->type == FFI_TYPE_STRUCT && ((*ptr)->size > 8)) + bytes += sizeof(void*); + else #endif { #if !defined(_MSC_VER) && !defined(__MINGW32__) @@ -168,6 +172,12 @@ #endif } +#ifdef _WIN64 + /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ + if (bytes < 40) + bytes = 40; +#endif + cif->bytes = bytes; /* Perform machine dependent cif processing */ diff --git a/Modules/_ctypes/libffi_msvc/types.c b/Modules/_ctypes/libffi_msvc/types.c --- a/Modules/_ctypes/libffi_msvc/types.c +++ b/Modules/_ctypes/libffi_msvc/types.c @@ -43,7 +43,7 @@ FFI_INTEGRAL_TYPEDEF(float, 4, 4, FFI_TYPE_FLOAT); #if defined ALPHA || defined SPARC64 || defined X86_64 || defined S390X \ - || defined IA64 + || defined IA64 || defined _WIN64 FFI_INTEGRAL_TYPEDEF(pointer, 8, 8, FFI_TYPE_POINTER); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 04:31:27 2014 From: python-checkins at python.org (steve.dower) Date: Thu, 06 Nov 2014 03:31:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2320160=3A_broken_ctypes_calling_convention_on_MS?= =?utf-8?q?VC_/_64-bit_Windows_=28large?= Message-ID: <20141106033126.113470.87820@psf.io> https://hg.python.org/cpython/rev/b701eb69260d changeset: 93408:b701eb69260d parent: 93405:089573725c77 parent: 93407:cd36ba22602d user: Steve Dower date: Wed Nov 05 19:30:30 2014 -0800 summary: Issue #20160: broken ctypes calling convention on MSVC / 64-bit Windows (large structs) Patch by mattip files: Lib/ctypes/test/test_win32.py | 26 +++++++- Modules/_ctypes/_ctypes_test.c | 43 ++++++++++++++ Modules/_ctypes/callproc.c | 3 - Modules/_ctypes/libffi_msvc/ffi.c | 29 +++++++- Modules/_ctypes/libffi_msvc/prep_cif.c | 16 ++++- Modules/_ctypes/libffi_msvc/types.c | 2 +- 6 files changed, 104 insertions(+), 15 deletions(-) diff --git a/Lib/ctypes/test/test_win32.py b/Lib/ctypes/test/test_win32.py --- a/Lib/ctypes/test/test_win32.py +++ b/Lib/ctypes/test/test_win32.py @@ -111,9 +111,29 @@ dll = CDLL(_ctypes_test.__file__) - pt = POINT(10, 10) - rect = RECT(0, 0, 20, 20) - self.assertEqual(1, dll.PointInRect(byref(rect), pt)) + pt = POINT(15, 25) + left = c_long.in_dll(dll, 'left') + top = c_long.in_dll(dll, 'top') + right = c_long.in_dll(dll, 'right') + bottom = c_long.in_dll(dll, 'bottom') + rect = RECT(left, top, right, bottom) + PointInRect = dll.PointInRect + PointInRect.argtypes = [POINTER(RECT), POINT] + self.assertEqual(1, PointInRect(byref(rect), pt)) + + ReturnRect = dll.ReturnRect + ReturnRect.argtypes = [c_int, RECT, POINTER(RECT), POINT, RECT, + POINTER(RECT), POINT, RECT] + ReturnRect.restype = RECT + for i in range(4): + ret = ReturnRect(i, rect, pointer(rect), pt, rect, + byref(rect), pt, rect) + # the c function will check and modify ret if something is + # passed in improperly + self.assertEqual(ret.left, left.value) + self.assertEqual(ret.right, right.value) + self.assertEqual(ret.top, top.value) + self.assertEqual(ret.bottom, bottom.value) if __name__ == '__main__': unittest.main() diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -527,6 +527,49 @@ return 1; } +EXPORT(int left = 10); +EXPORT(int 
top = 20); +EXPORT(int right = 30); +EXPORT(int bottom = 40); + +EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, + RECT *er, POINT fp, RECT gr) +{ + /*Check input */ + if (ar.left + br->left + dr.left + er->left + gr.left != left * 5) + { + ar.left = 100; + return ar; + } + if (ar.right + br->right + dr.right + er->right + gr.right != right * 5) + { + ar.right = 100; + return ar; + } + if (cp.x != fp.x) + { + ar.left = -100; + } + if (cp.y != fp.y) + { + ar.left = -200; + } + switch(i) + { + case 0: + return ar; + break; + case 1: + return dr; + break; + case 2: + return gr; + break; + + } + return ar; +} + typedef struct { short x; short y; diff --git a/Modules/_ctypes/callproc.c b/Modules/_ctypes/callproc.c --- a/Modules/_ctypes/callproc.c +++ b/Modules/_ctypes/callproc.c @@ -1140,9 +1140,6 @@ for (i = 0; i < argcount; ++i) { atypes[i] = args[i].ffi_type; if (atypes[i]->type == FFI_TYPE_STRUCT -#ifdef _WIN64 - && atypes[i]->size <= sizeof(void *) -#endif ) avalues[i] = (void *)args[i].value.p; else diff --git a/Modules/_ctypes/libffi_msvc/ffi.c b/Modules/_ctypes/libffi_msvc/ffi.c --- a/Modules/_ctypes/libffi_msvc/ffi.c +++ b/Modules/_ctypes/libffi_msvc/ffi.c @@ -102,6 +102,15 @@ FFI_ASSERT(0); } } +#ifdef _WIN64 + else if (z > 8) + { + /* On Win64, if a single argument takes more than 8 bytes, + then it is always passed by reference. */ + *(void **)argp = *p_argv; + z = 8; + } +#endif else { memcpy(argp, *p_argv, z); @@ -124,7 +133,6 @@ switch (cif->rtype->type) { case FFI_TYPE_VOID: - case FFI_TYPE_STRUCT: case FFI_TYPE_SINT64: case FFI_TYPE_FLOAT: case FFI_TYPE_DOUBLE: @@ -132,6 +140,18 @@ cif->flags = (unsigned) cif->rtype->type; break; + case FFI_TYPE_STRUCT: + /* MSVC returns small structures in registers. Put in cif->flags + the value FFI_TYPE_STRUCT only if the structure is big enough; + otherwise, put the 4- or 8-bytes integer type. */ + if (cif->rtype->size <= 4) + cif->flags = FFI_TYPE_INT; + else if (cif->rtype->size <= 8) + cif->flags = FFI_TYPE_SINT64; + else + cif->flags = FFI_TYPE_STRUCT; + break; + case FFI_TYPE_UINT64: #ifdef _WIN64 case FFI_TYPE_POINTER: @@ -201,8 +221,7 @@ #else case FFI_SYSV: /*@-usedef@*/ - /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ - return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes ? cif->bytes : 40, + return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes, cif->flags, ecif.rvalue, fn); /*@=usedef@*/ break; @@ -227,7 +246,7 @@ #else static void __fastcall #endif -ffi_closure_SYSV (ffi_closure *closure, int *argp) +ffi_closure_SYSV (ffi_closure *closure, char *argp) { // this is our return value storage long double res; @@ -237,7 +256,7 @@ void **arg_area; unsigned short rtype; void *resp = (void*)&res; - void *args = &argp[1]; + void *args = argp + sizeof(void*); cif = closure->cif; arg_area = (void**) alloca (cif->nargs * sizeof (void*)); diff --git a/Modules/_ctypes/libffi_msvc/prep_cif.c b/Modules/_ctypes/libffi_msvc/prep_cif.c --- a/Modules/_ctypes/libffi_msvc/prep_cif.c +++ b/Modules/_ctypes/libffi_msvc/prep_cif.c @@ -116,9 +116,9 @@ #if !defined M68K && !defined __x86_64__ && !defined S390 /* Make space for the return structure pointer */ if (cif->rtype->type == FFI_TYPE_STRUCT - /* MSVC returns small structures in registers. But we have a different - workaround: pretend int32 or int64 return type, and converting to - structure afterwards. 
*/ +#ifdef _WIN32 + && (cif->rtype->size > 8) /* MSVC returns small structs in registers */ +#endif #ifdef SPARC && (cif->abi != FFI_V9 || cif->rtype->size > 32) #endif @@ -145,6 +145,10 @@ && cif->abi != FFI_V9)) bytes += sizeof(void*); else +#elif defined (_WIN64) + if ((*ptr)->type == FFI_TYPE_STRUCT && ((*ptr)->size > 8)) + bytes += sizeof(void*); + else #endif { #if !defined(_MSC_VER) && !defined(__MINGW32__) @@ -168,6 +172,12 @@ #endif } +#ifdef _WIN64 + /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ + if (bytes < 40) + bytes = 40; +#endif + cif->bytes = bytes; /* Perform machine dependent cif processing */ diff --git a/Modules/_ctypes/libffi_msvc/types.c b/Modules/_ctypes/libffi_msvc/types.c --- a/Modules/_ctypes/libffi_msvc/types.c +++ b/Modules/_ctypes/libffi_msvc/types.c @@ -43,7 +43,7 @@ FFI_INTEGRAL_TYPEDEF(float, 4, 4, FFI_TYPE_FLOAT); #if defined ALPHA || defined SPARC64 || defined X86_64 || defined S390X \ - || defined IA64 + || defined IA64 || defined _WIN64 FFI_INTEGRAL_TYPEDEF(pointer, 8, 8, FFI_TYPE_POINTER); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 05:14:08 2014 From: python-checkins at python.org (steve.dower) Date: Thu, 06 Nov 2014 04:14:08 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Fixes_path_to_?= =?utf-8?q?patchlevel=2Epy_in_doc/make=2Ebat?= Message-ID: <20141106041405.715.78789@psf.io> https://hg.python.org/cpython/rev/71d5a69e122b changeset: 93409:71d5a69e122b branch: 2.7 parent: 93406:f75b0470168b user: Steve Dower date: Wed Nov 05 20:13:46 2014 -0800 summary: Fixes path to patchlevel.py in doc/make.bat files: Doc/make.bat | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/make.bat b/Doc/make.bat --- a/Doc/make.bat +++ b/Doc/make.bat @@ -12,7 +12,7 @@ if NOT DEFINED ProgramFiles(x86) set _PRGMFLS=%ProgramFiles% if "%HTMLHELP%" EQU "" set HTMLHELP=%_PRGMFLS%\HTML Help Workshop\hhc.exe -if "%DISTVERSION%" EQU "" for /f "usebackq" %%v in (`%PYTHON% tools/patchlevel.py`) do set DISTVERSION=%%v +if "%DISTVERSION%" EQU "" for /f "usebackq" %%v in (`%PYTHON% tools/extensions/patchlevel.py`) do set DISTVERSION=%%v if "%BUILDDIR%" EQU "" set BUILDDIR=build -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 06:28:49 2014 From: python-checkins at python.org (raymond.hettinger) Date: Thu, 06 Nov 2014 05:28:49 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge?= Message-ID: <20141106052827.85220.56425@psf.io> https://hg.python.org/cpython/rev/9ed44777331d changeset: 93411:9ed44777331d parent: 93408:b701eb69260d parent: 93410:501edbbb74ff user: Raymond Hettinger date: Wed Nov 05 21:28:19 2014 -0800 summary: merge files: Doc/library/textwrap.rst | 2 ++ 1 files changed, 2 insertions(+), 0 deletions(-) diff --git a/Doc/library/textwrap.rst b/Doc/library/textwrap.rst --- a/Doc/library/textwrap.rst +++ b/Doc/library/textwrap.rst @@ -113,6 +113,8 @@ + + world + .. versionadded:: 3.3 + :func:`wrap`, :func:`fill` and :func:`shorten` work by creating a :class:`TextWrapper` instance and calling a single method on it. 
That -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 06:28:49 2014 From: python-checkins at python.org (raymond.hettinger) Date: Thu, 06 Nov 2014 05:28:49 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgMjI4MDM6?= =?utf-8?q?__Add_missing_versionadded_directive=2E?= Message-ID: <20141106052826.113470.15360@psf.io> https://hg.python.org/cpython/rev/501edbbb74ff changeset: 93410:501edbbb74ff branch: 3.4 parent: 93407:cd36ba22602d user: Raymond Hettinger date: Wed Nov 05 21:27:56 2014 -0800 summary: Issue 22803: Add missing versionadded directive. files: Doc/library/textwrap.rst | 2 ++ 1 files changed, 2 insertions(+), 0 deletions(-) diff --git a/Doc/library/textwrap.rst b/Doc/library/textwrap.rst --- a/Doc/library/textwrap.rst +++ b/Doc/library/textwrap.rst @@ -113,6 +113,8 @@ + + world + .. versionadded:: 3.3 + :func:`wrap`, :func:`fill` and :func:`shorten` work by creating a :class:`TextWrapper` instance and calling a single method on it. That -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 06:53:28 2014 From: python-checkins at python.org (benjamin.peterson) Date: Thu, 06 Nov 2014 05:53:28 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_fix_test_where?= =?utf-8?q?_sizeof=28long=29_!=3D_sizeof=28int=29?= Message-ID: <20141106055322.108101.16413@psf.io> https://hg.python.org/cpython/rev/d9fbe4fb2afc changeset: 93412:d9fbe4fb2afc branch: 3.4 parent: 93410:501edbbb74ff user: Benjamin Peterson date: Thu Nov 06 00:52:58 2014 -0500 summary: fix test where sizeof(long) != sizeof(int) files: Modules/_ctypes/_ctypes_test.c | 8 ++++---- 1 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -527,10 +527,10 @@ return 1; } -EXPORT(int left = 10); -EXPORT(int top = 20); -EXPORT(int right = 30); -EXPORT(int bottom = 40); +EXPORT(long left = 10); +EXPORT(long top = 20); +EXPORT(long right = 30); +EXPORT(long bottom = 40); EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, RECT *er, POINT fp, RECT gr) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 06:53:27 2014 From: python-checkins at python.org (benjamin.peterson) Date: Thu, 06 Nov 2014 05:53:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_fix_test_where?= =?utf-8?q?_sizeof=28long=29_!=3D_sizeof=28int=29?= Message-ID: <20141106055322.113482.2215@psf.io> https://hg.python.org/cpython/rev/5a2d40435dfe changeset: 93413:5a2d40435dfe branch: 2.7 parent: 93409:71d5a69e122b user: Benjamin Peterson date: Thu Nov 06 00:52:58 2014 -0500 summary: fix test where sizeof(long) != sizeof(int) files: Modules/_ctypes/_ctypes_test.c | 8 ++++---- 1 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -540,10 +540,10 @@ return 1; } -EXPORT(int left = 10); -EXPORT(int top = 20); -EXPORT(int right = 30); -EXPORT(int bottom = 40); +EXPORT(long left = 10); +EXPORT(long top = 20); +EXPORT(long right = 30); +EXPORT(long bottom = 40); EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, RECT *er, POINT fp, RECT gr) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 06:53:27 2014 From: python-checkins at python.org 
(benjamin.peterson) Date: Thu, 06 Nov 2014 05:53:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141106055322.85204.98811@psf.io> https://hg.python.org/cpython/rev/123369631063 changeset: 93414:123369631063 parent: 93411:9ed44777331d parent: 93412:d9fbe4fb2afc user: Benjamin Peterson date: Thu Nov 06 00:53:18 2014 -0500 summary: merge 3.4 files: Modules/_ctypes/_ctypes_test.c | 8 ++++---- 1 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -527,10 +527,10 @@ return 1; } -EXPORT(int left = 10); -EXPORT(int top = 20); -EXPORT(int right = 30); -EXPORT(int bottom = 40); +EXPORT(long left = 10); +EXPORT(long top = 20); +EXPORT(long right = 30); +EXPORT(long bottom = 40); EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, RECT *er, POINT fp, RECT gr) -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Thu Nov 6 10:33:02 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Thu, 06 Nov 2014 10:33:02 +0100 Subject: [Python-checkins] Daily reference leaks (089573725c77): sum=3 Message-ID: results for 089573725c77 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogc_f6Zi', '-x'] From python-checkins at python.org Thu Nov 6 14:38:37 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 13:38:37 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge_with_3=2E4?= Message-ID: <20141106133833.707.24395@psf.io> https://hg.python.org/cpython/rev/124e9547cb36 changeset: 93416:124e9547cb36 parent: 93414:123369631063 parent: 93415:39536b377241 user: Georg Brandl date: Thu Nov 06 14:38:23 2014 +0100 summary: merge with 3.4 files: Lib/test/test_codecmaps_cn.py | 8 +++----- Lib/test/test_codecmaps_hk.py | 2 +- Lib/test/test_codecmaps_jp.py | 12 +++++------- Lib/test/test_codecmaps_kr.py | 8 +++----- Lib/test/test_codecmaps_tw.py | 6 ++---- Lib/test/test_normalization.py | 2 +- Lib/test/test_ucn.py | 2 +- 7 files changed, 16 insertions(+), 24 deletions(-) diff --git a/Lib/test/test_codecmaps_cn.py b/Lib/test/test_codecmaps_cn.py --- a/Lib/test/test_codecmaps_cn.py +++ b/Lib/test/test_codecmaps_cn.py @@ -10,19 +10,17 @@ class TestGB2312Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb2312' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-CN.TXT' class TestGBKMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gbk' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ - 'MICSFT/WINDOWS/CP936.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' class TestGB18030Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb18030' - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ - 'trunk/charset/data/xml/gb-18030-2000.xml' + mapfileurl = 'http://www.pythontest.net/unicode/gb-18030-2000.xml' if __name__ == "__main__": diff --git a/Lib/test/test_codecmaps_hk.py b/Lib/test/test_codecmaps_hk.py --- a/Lib/test/test_codecmaps_hk.py +++ b/Lib/test/test_codecmaps_hk.py @@ -10,7 +10,7 @@ class 
TestBig5HKSCSMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5hkscs' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/BIG5HKSCS-2004.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5HKSCS-2004.TXT' if __name__ == "__main__": unittest.main() diff --git a/Lib/test/test_codecmaps_jp.py b/Lib/test/test_codecmaps_jp.py --- a/Lib/test/test_codecmaps_jp.py +++ b/Lib/test/test_codecmaps_jp.py @@ -10,8 +10,7 @@ class TestCP932Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp932' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP932.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' supmaps = [ (b'\x80', '\u0080'), (b'\xa0', '\uf8f0'), @@ -27,15 +26,14 @@ unittest.TestCase): encoding = 'euc_jp' mapfilename = 'EUC-JP.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' class TestSJISCOMPATMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jis' mapfilename = 'SHIFTJIS.TXT' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ - '/EASTASIA/JIS/SHIFTJIS.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' pass_enctest = [ (b'\x81_', '\\'), ] @@ -49,14 +47,14 @@ unittest.TestCase): encoding = 'euc_jisx0213' mapfilename = 'EUC-JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' class TestSJISX0213Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jisx0213' mapfilename = 'SHIFT_JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/SHIFT_JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFT_JISX0213.TXT' if __name__ == "__main__": diff --git a/Lib/test/test_codecmaps_kr.py b/Lib/test/test_codecmaps_kr.py --- a/Lib/test/test_codecmaps_kr.py +++ b/Lib/test/test_codecmaps_kr.py @@ -10,14 +10,13 @@ class TestCP949Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp949' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT' \ - '/WINDOWS/CP949.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' class TestEUCKRMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'euc_kr' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up sequence. pass_enctest = [(b'\xa4\xd4', '\u3164')] @@ -27,8 +26,7 @@ class TestJOHABMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'johab' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/EASTASIA/' \ - 'KSC/JOHAB.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' # KS X 1001 standard assigned 0x5c as WON SIGN. # but, in early 90s that is the only era used johab widely, # the most softwares implements it as REVERSE SOLIDUS. 
diff --git a/Lib/test/test_codecmaps_tw.py b/Lib/test/test_codecmaps_tw.py --- a/Lib/test/test_codecmaps_tw.py +++ b/Lib/test/test_codecmaps_tw.py @@ -10,14 +10,12 @@ class TestBIG5Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ - 'EASTASIA/OTHER/BIG5.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' class TestCP950Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp950' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP950.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' pass_enctest = [ (b'\xa2\xcc', '\u5341'), (b'\xa2\xce', '\u5345'), diff --git a/Lib/test/test_normalization.py b/Lib/test/test_normalization.py --- a/Lib/test/test_normalization.py +++ b/Lib/test/test_normalization.py @@ -7,7 +7,7 @@ from unicodedata import normalize, unidata_version TESTDATAFILE = "NormalizationTest.txt" -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + "/ucd/" + TESTDATAFILE +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version + "/" + TESTDATAFILE def check_version(testfile): hdr = testfile.readline() diff --git a/Lib/test/test_ucn.py b/Lib/test/test_ucn.py --- a/Lib/test/test_ucn.py +++ b/Lib/test/test_ucn.py @@ -172,7 +172,7 @@ def test_named_sequences_full(self): # Check all the named sequences - url = ("http://www.unicode.org/Public/%s/ucd/NamedSequences.txt" % + url = ("http://www.pythontest.net/unicode/%s/NamedSequences.txt" % unicodedata.unidata_version) try: testdata = support.open_urlresource(url, encoding="utf-8", -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 14:38:37 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 13:38:37 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogIzIyNjUwOiB0ZXN0?= =?utf-8?q?_suite=3A_load_Unicode_test_data_files_from_www=2Epythontest=2E?= =?utf-8?q?net?= Message-ID: <20141106133833.113470.37898@psf.io> https://hg.python.org/cpython/rev/39536b377241 changeset: 93415:39536b377241 branch: 3.4 parent: 93412:d9fbe4fb2afc user: Georg Brandl date: Thu Nov 06 14:37:49 2014 +0100 summary: #22650: test suite: load Unicode test data files from www.pythontest.net files: Lib/test/test_codecmaps_cn.py | 8 +++----- Lib/test/test_codecmaps_hk.py | 2 +- Lib/test/test_codecmaps_jp.py | 12 +++++------- Lib/test/test_codecmaps_kr.py | 8 +++----- Lib/test/test_codecmaps_tw.py | 6 ++---- Lib/test/test_normalization.py | 2 +- Lib/test/test_ucn.py | 2 +- 7 files changed, 16 insertions(+), 24 deletions(-) diff --git a/Lib/test/test_codecmaps_cn.py b/Lib/test/test_codecmaps_cn.py --- a/Lib/test/test_codecmaps_cn.py +++ b/Lib/test/test_codecmaps_cn.py @@ -10,19 +10,17 @@ class TestGB2312Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb2312' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-CN.TXT' class TestGBKMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gbk' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ - 'MICSFT/WINDOWS/CP936.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' class TestGB18030Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb18030' - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ - 'trunk/charset/data/xml/gb-18030-2000.xml' + mapfileurl = 
'http://www.pythontest.net/unicode/gb-18030-2000.xml' if __name__ == "__main__": diff --git a/Lib/test/test_codecmaps_hk.py b/Lib/test/test_codecmaps_hk.py --- a/Lib/test/test_codecmaps_hk.py +++ b/Lib/test/test_codecmaps_hk.py @@ -10,7 +10,7 @@ class TestBig5HKSCSMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5hkscs' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/BIG5HKSCS-2004.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5HKSCS-2004.TXT' if __name__ == "__main__": unittest.main() diff --git a/Lib/test/test_codecmaps_jp.py b/Lib/test/test_codecmaps_jp.py --- a/Lib/test/test_codecmaps_jp.py +++ b/Lib/test/test_codecmaps_jp.py @@ -10,8 +10,7 @@ class TestCP932Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp932' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP932.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' supmaps = [ (b'\x80', '\u0080'), (b'\xa0', '\uf8f0'), @@ -27,15 +26,14 @@ unittest.TestCase): encoding = 'euc_jp' mapfilename = 'EUC-JP.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' class TestSJISCOMPATMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jis' mapfilename = 'SHIFTJIS.TXT' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ - '/EASTASIA/JIS/SHIFTJIS.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' pass_enctest = [ (b'\x81_', '\\'), ] @@ -49,14 +47,14 @@ unittest.TestCase): encoding = 'euc_jisx0213' mapfilename = 'EUC-JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' class TestSJISX0213Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jisx0213' mapfilename = 'SHIFT_JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/SHIFT_JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFT_JISX0213.TXT' if __name__ == "__main__": diff --git a/Lib/test/test_codecmaps_kr.py b/Lib/test/test_codecmaps_kr.py --- a/Lib/test/test_codecmaps_kr.py +++ b/Lib/test/test_codecmaps_kr.py @@ -10,14 +10,13 @@ class TestCP949Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp949' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT' \ - '/WINDOWS/CP949.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' class TestEUCKRMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'euc_kr' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up sequence. pass_enctest = [(b'\xa4\xd4', '\u3164')] @@ -27,8 +26,7 @@ class TestJOHABMap(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'johab' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/EASTASIA/' \ - 'KSC/JOHAB.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' # KS X 1001 standard assigned 0x5c as WON SIGN. # but, in early 90s that is the only era used johab widely, # the most softwares implements it as REVERSE SOLIDUS. 
diff --git a/Lib/test/test_codecmaps_tw.py b/Lib/test/test_codecmaps_tw.py --- a/Lib/test/test_codecmaps_tw.py +++ b/Lib/test/test_codecmaps_tw.py @@ -10,14 +10,12 @@ class TestBIG5Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ - 'EASTASIA/OTHER/BIG5.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' class TestCP950Map(multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp950' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP950.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' pass_enctest = [ (b'\xa2\xcc', '\u5341'), (b'\xa2\xce', '\u5345'), diff --git a/Lib/test/test_normalization.py b/Lib/test/test_normalization.py --- a/Lib/test/test_normalization.py +++ b/Lib/test/test_normalization.py @@ -7,7 +7,7 @@ from unicodedata import normalize, unidata_version TESTDATAFILE = "NormalizationTest.txt" -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + "/ucd/" + TESTDATAFILE +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version + "/" + TESTDATAFILE def check_version(testfile): hdr = testfile.readline() diff --git a/Lib/test/test_ucn.py b/Lib/test/test_ucn.py --- a/Lib/test/test_ucn.py +++ b/Lib/test/test_ucn.py @@ -172,7 +172,7 @@ def test_named_sequences_full(self): # Check all the named sequences - url = ("http://www.unicode.org/Public/%s/ucd/NamedSequences.txt" % + url = ("http://www.pythontest.net/unicode/%s/NamedSequences.txt" % unicodedata.unidata_version) try: testdata = support.open_urlresource(url, encoding="utf-8", -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 14:57:08 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 13:57:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMi43IC0+IDIuNyk6?= =?utf-8?q?_merge_heads?= Message-ID: <20141106135653.85206.51901@psf.io> https://hg.python.org/cpython/rev/14a69e40dbb0 changeset: 93418:14a69e40dbb0 branch: 2.7 parent: 93417:0af36ea1d010 parent: 93413:5a2d40435dfe user: Georg Brandl date: Thu Nov 06 14:56:47 2014 +0100 summary: merge heads files: Doc/make.bat | 2 +- Lib/ctypes/test/test_win32.py | 26 +++++++- Modules/_ctypes/_ctypes_test.c | 43 ++++++++++++++ Modules/_ctypes/callproc.c | 6 +- Modules/_ctypes/libffi_msvc/ffi.c | 29 +++++++- Modules/_ctypes/libffi_msvc/prep_cif.c | 18 ++++- Modules/_ctypes/libffi_msvc/types.c | 2 +- 7 files changed, 107 insertions(+), 19 deletions(-) diff --git a/Doc/make.bat b/Doc/make.bat --- a/Doc/make.bat +++ b/Doc/make.bat @@ -12,7 +12,7 @@ if NOT DEFINED ProgramFiles(x86) set _PRGMFLS=%ProgramFiles% if "%HTMLHELP%" EQU "" set HTMLHELP=%_PRGMFLS%\HTML Help Workshop\hhc.exe -if "%DISTVERSION%" EQU "" for /f "usebackq" %%v in (`%PYTHON% tools/patchlevel.py`) do set DISTVERSION=%%v +if "%DISTVERSION%" EQU "" for /f "usebackq" %%v in (`%PYTHON% tools/extensions/patchlevel.py`) do set DISTVERSION=%%v if "%BUILDDIR%" EQU "" set BUILDDIR=build diff --git a/Lib/ctypes/test/test_win32.py b/Lib/ctypes/test/test_win32.py --- a/Lib/ctypes/test/test_win32.py +++ b/Lib/ctypes/test/test_win32.py @@ -90,9 +90,29 @@ dll = CDLL(_ctypes_test.__file__) - pt = POINT(10, 10) - rect = RECT(0, 0, 20, 20) - self.assertEqual(1, dll.PointInRect(byref(rect), pt)) + pt = POINT(15, 25) + left = c_long.in_dll(dll, 'left') + top = c_long.in_dll(dll, 'top') + right = c_long.in_dll(dll, 'right') + bottom = c_long.in_dll(dll, 
'bottom') + rect = RECT(left, top, right, bottom) + PointInRect = dll.PointInRect + PointInRect.argtypes = [POINTER(RECT), POINT] + self.assertEqual(1, PointInRect(byref(rect), pt)) + + ReturnRect = dll.ReturnRect + ReturnRect.argtypes = [c_int, RECT, POINTER(RECT), POINT, RECT, + POINTER(RECT), POINT, RECT] + ReturnRect.restype = RECT + for i in range(4): + ret = ReturnRect(i, rect, pointer(rect), pt, rect, + byref(rect), pt, rect) + # the c function will check and modify ret if something is + # passed in improperly + self.assertEqual(ret.left, left.value) + self.assertEqual(ret.right, right.value) + self.assertEqual(ret.top, top.value) + self.assertEqual(ret.bottom, bottom.value) if __name__ == '__main__': unittest.main() diff --git a/Modules/_ctypes/_ctypes_test.c b/Modules/_ctypes/_ctypes_test.c --- a/Modules/_ctypes/_ctypes_test.c +++ b/Modules/_ctypes/_ctypes_test.c @@ -540,6 +540,49 @@ return 1; } +EXPORT(long left = 10); +EXPORT(long top = 20); +EXPORT(long right = 30); +EXPORT(long bottom = 40); + +EXPORT(RECT) ReturnRect(int i, RECT ar, RECT* br, POINT cp, RECT dr, + RECT *er, POINT fp, RECT gr) +{ + /*Check input */ + if (ar.left + br->left + dr.left + er->left + gr.left != left * 5) + { + ar.left = 100; + return ar; + } + if (ar.right + br->right + dr.right + er->right + gr.right != right * 5) + { + ar.right = 100; + return ar; + } + if (cp.x != fp.x) + { + ar.left = -100; + } + if (cp.y != fp.y) + { + ar.left = -200; + } + switch(i) + { + case 0: + return ar; + break; + case 1: + return dr; + break; + case 2: + return gr; + break; + + } + return ar; +} + typedef struct { short x; short y; diff --git a/Modules/_ctypes/callproc.c b/Modules/_ctypes/callproc.c --- a/Modules/_ctypes/callproc.c +++ b/Modules/_ctypes/callproc.c @@ -1170,11 +1170,7 @@ } for (i = 0; i < argcount; ++i) { atypes[i] = args[i].ffi_type; - if (atypes[i]->type == FFI_TYPE_STRUCT -#ifdef _WIN64 - && atypes[i]->size <= sizeof(void *) -#endif - ) + if (atypes[i]->type == FFI_TYPE_STRUCT) avalues[i] = (void *)args[i].value.p; else avalues[i] = (void *)&args[i].value; diff --git a/Modules/_ctypes/libffi_msvc/ffi.c b/Modules/_ctypes/libffi_msvc/ffi.c --- a/Modules/_ctypes/libffi_msvc/ffi.c +++ b/Modules/_ctypes/libffi_msvc/ffi.c @@ -102,6 +102,15 @@ FFI_ASSERT(0); } } +#ifdef _WIN64 + else if (z > 8) + { + /* On Win64, if a single argument takes more than 8 bytes, + then it is always passed by reference. */ + *(void **)argp = *p_argv; + z = 8; + } +#endif else { memcpy(argp, *p_argv, z); @@ -124,7 +133,6 @@ switch (cif->rtype->type) { case FFI_TYPE_VOID: - case FFI_TYPE_STRUCT: case FFI_TYPE_SINT64: case FFI_TYPE_FLOAT: case FFI_TYPE_DOUBLE: @@ -132,6 +140,18 @@ cif->flags = (unsigned) cif->rtype->type; break; + case FFI_TYPE_STRUCT: + /* MSVC returns small structures in registers. Put in cif->flags + the value FFI_TYPE_STRUCT only if the structure is big enough; + otherwise, put the 4- or 8-bytes integer type. */ + if (cif->rtype->size <= 4) + cif->flags = FFI_TYPE_INT; + else if (cif->rtype->size <= 8) + cif->flags = FFI_TYPE_SINT64; + else + cif->flags = FFI_TYPE_STRUCT; + break; + case FFI_TYPE_UINT64: #ifdef _WIN64 case FFI_TYPE_POINTER: @@ -201,8 +221,7 @@ #else case FFI_SYSV: /*@-usedef@*/ - /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ - return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes ? 
cif->bytes : 40, + return ffi_call_AMD64(ffi_prep_args, &ecif, cif->bytes, cif->flags, ecif.rvalue, fn); /*@=usedef@*/ break; @@ -227,7 +246,7 @@ #else static void __fastcall #endif -ffi_closure_SYSV (ffi_closure *closure, int *argp) +ffi_closure_SYSV (ffi_closure *closure, char *argp) { // this is our return value storage long double res; @@ -237,7 +256,7 @@ void **arg_area; unsigned short rtype; void *resp = (void*)&res; - void *args = &argp[1]; + void *args = argp + sizeof(void*); cif = closure->cif; arg_area = (void**) alloca (cif->nargs * sizeof (void*)); diff --git a/Modules/_ctypes/libffi_msvc/prep_cif.c b/Modules/_ctypes/libffi_msvc/prep_cif.c --- a/Modules/_ctypes/libffi_msvc/prep_cif.c +++ b/Modules/_ctypes/libffi_msvc/prep_cif.c @@ -116,9 +116,9 @@ #if !defined M68K && !defined __x86_64__ && !defined S390 /* Make space for the return structure pointer */ if (cif->rtype->type == FFI_TYPE_STRUCT - /* MSVC returns small structures in registers. But we have a different - workaround: pretend int32 or int64 return type, and converting to - structure afterwards. */ +#ifdef _WIN32 + && (cif->rtype->size > 8) /* MSVC returns small structs in registers */ +#endif #ifdef SPARC && (cif->abi != FFI_V9 || cif->rtype->size > 32) #endif @@ -143,7 +143,11 @@ && ((*ptr)->size > 16 || cif->abi != FFI_V9)) || ((*ptr)->type == FFI_TYPE_LONGDOUBLE && cif->abi != FFI_V9)) - bytes += sizeof(void*); + bytes += sizeof(void*); + else +#elif defined (_WIN64) + if ((*ptr)->type == FFI_TYPE_STRUCT && ((*ptr)->size > 8)) + bytes += sizeof(void*); else #endif { @@ -168,6 +172,12 @@ #endif } +#ifdef _WIN64 + /* Function call needs at least 40 bytes stack size, on win64 AMD64 */ + if (bytes < 40) + bytes = 40; +#endif + cif->bytes = bytes; /* Perform machine dependent cif processing */ diff --git a/Modules/_ctypes/libffi_msvc/types.c b/Modules/_ctypes/libffi_msvc/types.c --- a/Modules/_ctypes/libffi_msvc/types.c +++ b/Modules/_ctypes/libffi_msvc/types.c @@ -43,7 +43,7 @@ FFI_INTEGRAL_TYPEDEF(float, 4, 4, FFI_TYPE_FLOAT); #if defined ALPHA || defined SPARC64 || defined X86_64 || defined S390X \ - || defined IA64 + || defined IA64 || defined _WIN64 FFI_INTEGRAL_TYPEDEF(pointer, 8, 8, FFI_TYPE_POINTER); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 14:57:08 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 13:57:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogIzIyNjUwOiB0ZXN0?= =?utf-8?q?_suite=3A_load_Unicode_test_data_files_from_www=2Epythontest=2E?= =?utf-8?q?net?= Message-ID: <20141106135652.108375.20457@psf.io> https://hg.python.org/cpython/rev/0af36ea1d010 changeset: 93417:0af36ea1d010 branch: 2.7 parent: 93401:3e8d3c4bc17e user: Georg Brandl date: Thu Nov 06 14:37:49 2014 +0100 summary: #22650: test suite: load Unicode test data files from www.pythontest.net files: Lib/test/test_codecmaps_cn.py | 8 +++----- Lib/test/test_codecmaps_hk.py | 2 +- Lib/test/test_codecmaps_jp.py | 12 +++++------- Lib/test/test_codecmaps_kr.py | 8 +++----- Lib/test/test_codecmaps_tw.py | 6 ++---- Lib/test/test_normalization.py | 2 +- 6 files changed, 15 insertions(+), 23 deletions(-) diff --git a/Lib/test/test_codecmaps_cn.py b/Lib/test/test_codecmaps_cn.py --- a/Lib/test/test_codecmaps_cn.py +++ b/Lib/test/test_codecmaps_cn.py @@ -10,19 +10,17 @@ class TestGB2312Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb2312' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' + mapfileurl = 
'http://www.pythontest.net/unicode/EUC-CN.TXT' class TestGBKMap(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gbk' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ - 'MICSFT/WINDOWS/CP936.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' class TestGB18030Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'gb18030' - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ - 'trunk/charset/data/xml/gb-18030-2000.xml' + mapfileurl = 'http://www.pythontest.net/unicode/gb-18030-2000.xml' def test_main(): diff --git a/Lib/test/test_codecmaps_hk.py b/Lib/test/test_codecmaps_hk.py --- a/Lib/test/test_codecmaps_hk.py +++ b/Lib/test/test_codecmaps_hk.py @@ -10,7 +10,7 @@ class TestBig5HKSCSMap(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5hkscs' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/BIG5HKSCS-2004.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5HKSCS-2004.TXT' def test_main(): test_support.run_unittest(__name__) diff --git a/Lib/test/test_codecmaps_jp.py b/Lib/test/test_codecmaps_jp.py --- a/Lib/test/test_codecmaps_jp.py +++ b/Lib/test/test_codecmaps_jp.py @@ -10,8 +10,7 @@ class TestCP932Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp932' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP932.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' supmaps = [ ('\x80', u'\u0080'), ('\xa0', u'\uf8f0'), @@ -27,15 +26,14 @@ unittest.TestCase): encoding = 'euc_jp' mapfilename = 'EUC-JP.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' class TestSJISCOMPATMap(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jis' mapfilename = 'SHIFTJIS.TXT' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ - '/EASTASIA/JIS/SHIFTJIS.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' pass_enctest = [ ('\x81_', u'\\'), ] @@ -49,14 +47,14 @@ unittest.TestCase): encoding = 'euc_jisx0213' mapfilename = 'EUC-JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' class TestSJISX0213Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'shift_jisx0213' mapfilename = 'SHIFT_JISX0213.TXT' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/SHIFT_JISX0213.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/SHIFT_JISX0213.TXT' def test_main(): diff --git a/Lib/test/test_codecmaps_kr.py b/Lib/test/test_codecmaps_kr.py --- a/Lib/test/test_codecmaps_kr.py +++ b/Lib/test/test_codecmaps_kr.py @@ -10,14 +10,13 @@ class TestCP949Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp949' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT' \ - '/WINDOWS/CP949.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' class TestEUCKRMap(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'euc_kr' - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up sequence. 
pass_enctest = [('\xa4\xd4', u'\u3164')] @@ -27,8 +26,7 @@ class TestJOHABMap(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'johab' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/EASTASIA/' \ - 'KSC/JOHAB.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' # KS X 1001 standard assigned 0x5c as WON SIGN. # but, in early 90s that is the only era used johab widely, # the most softwares implements it as REVERSE SOLIDUS. diff --git a/Lib/test/test_codecmaps_tw.py b/Lib/test/test_codecmaps_tw.py --- a/Lib/test/test_codecmaps_tw.py +++ b/Lib/test/test_codecmaps_tw.py @@ -10,14 +10,12 @@ class TestBIG5Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'big5' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ - 'EASTASIA/OTHER/BIG5.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' class TestCP950Map(test_multibytecodec_support.TestBase_Mapping, unittest.TestCase): encoding = 'cp950' - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' \ - 'WINDOWS/CP950.TXT' + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' pass_enctest = [ ('\xa2\xcc', u'\u5341'), ('\xa2\xce', u'\u5345'), diff --git a/Lib/test/test_normalization.py b/Lib/test/test_normalization.py --- a/Lib/test/test_normalization.py +++ b/Lib/test/test_normalization.py @@ -7,7 +7,7 @@ from unicodedata import normalize, unidata_version TESTDATAFILE = "NormalizationTest.txt" -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + "/ucd/" + TESTDATAFILE +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version + "/" + TESTDATAFILE def check_version(testfile): hdr = testfile.readline() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 15:33:48 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 14:33:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Try_to_transfe?= =?utf-8?q?r_the_Unicode_test_data_files_gzipped=2E?= Message-ID: <20141106143341.108091.47188@psf.io> https://hg.python.org/cpython/rev/540b022ae7a9 changeset: 93419:540b022ae7a9 branch: 3.4 parent: 93415:39536b377241 user: Georg Brandl date: Thu Nov 06 15:33:30 2014 +0100 summary: Try to transfer the Unicode test data files gzipped. files: Lib/test/support/__init__.py | 7 ++++++- 1 files changed, 6 insertions(+), 1 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -1029,7 +1029,12 @@ requires('urlfetch') print('\tfetching %s ...' 
% url, file=get_original_stdout()) - f = urllib.request.urlopen(url, timeout=15) + opener = urllib.request.build_opener() + if gzip: + opener.addheaders.append(('Accept-Encoding', 'gzip')) + f = opener.open(url, timeout=15) + if gzip and f.headers.get('Content-Encoding') == 'gzip': + f = gzip.GzipFile(fileobj=f) try: with open(fn, "wb") as out: s = f.read() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 6 15:33:48 2014 From: python-checkins at python.org (georg.brandl) Date: Thu, 06 Nov 2014 14:33:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge_with_3=2E4?= Message-ID: <20141106143342.108073.34910@psf.io> https://hg.python.org/cpython/rev/a688d3206646 changeset: 93420:a688d3206646 parent: 93416:124e9547cb36 parent: 93419:540b022ae7a9 user: Georg Brandl date: Thu Nov 06 15:33:35 2014 +0100 summary: merge with 3.4 files: Lib/test/support/__init__.py | 7 ++++++- 1 files changed, 6 insertions(+), 1 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -1029,7 +1029,12 @@ requires('urlfetch') print('\tfetching %s ...' % url, file=get_original_stdout()) - f = urllib.request.urlopen(url, timeout=15) + opener = urllib.request.build_opener() + if gzip: + opener.addheaders.append(('Accept-Encoding', 'gzip')) + f = opener.open(url, timeout=15) + if gzip and f.headers.get('Content-Encoding') == 'gzip': + f = gzip.GzipFile(fileobj=f) try: with open(fn, "wb") as out: s = f.read() -- Repository URL: https://hg.python.org/cpython From bcannon at gmail.com Thu Nov 6 15:39:03 2014 From: bcannon at gmail.com (Brett Cannon) Date: Thu, 06 Nov 2014 14:39:03 +0000 Subject: [Python-checkins] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net References: <20141106135652.108375.20457@psf.io> Message-ID: What is pythontest.net? Is it something we control, and if so how do we add things to it for tests? Did I miss an email on python-dev or python-committers about this? 
On Thu Nov 06 2014 at 8:57:22 AM georg.brandl wrote: > https://hg.python.org/cpython/rev/0af36ea1d010 > changeset: 93417:0af36ea1d010 > branch: 2.7 > parent: 93401:3e8d3c4bc17e > user: Georg Brandl > date: Thu Nov 06 14:37:49 2014 +0100 > summary: > #22650: test suite: load Unicode test data files from www.pythontest.net > > files: > Lib/test/test_codecmaps_cn.py | 8 +++----- > Lib/test/test_codecmaps_hk.py | 2 +- > Lib/test/test_codecmaps_jp.py | 12 +++++------- > Lib/test/test_codecmaps_kr.py | 8 +++----- > Lib/test/test_codecmaps_tw.py | 6 ++---- > Lib/test/test_normalization.py | 2 +- > 6 files changed, 15 insertions(+), 23 deletions(-) > > > diff --git a/Lib/test/test_codecmaps_cn.py b/Lib/test/test_codecmaps_cn.py > --- a/Lib/test/test_codecmaps_cn.py > +++ b/Lib/test/test_codecmaps_cn.py > @@ -10,19 +10,17 @@ > class TestGB2312Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'gb2312' > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-CN.TXT' > > class TestGBKMap(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'gbk' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ > - 'MICSFT/WINDOWS/CP936.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' > > class TestGB18030Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'gb18030' > - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ > - 'trunk/charset/data/xml/gb-18030-2000.xml' > + mapfileurl = 'http://www.pythontest.net/unicode/gb-18030-2000.xml' > > > def test_main(): > diff --git a/Lib/test/test_codecmaps_hk.py b/Lib/test/test_codecmaps_hk.py > --- a/Lib/test/test_codecmaps_hk.py > +++ b/Lib/test/test_codecmaps_hk.py > @@ -10,7 +10,7 @@ > class TestBig5HKSCSMap(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'big5hkscs' > - mapfileurl = 'http://people.freebsd.org/~ > perky/i18n/BIG5HKSCS-2004.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/BIG5HKSCS-2004.TXT' > > def test_main(): > test_support.run_unittest(__name__) > diff --git a/Lib/test/test_codecmaps_jp.py b/Lib/test/test_codecmaps_jp.py > --- a/Lib/test/test_codecmaps_jp.py > +++ b/Lib/test/test_codecmaps_jp.py > @@ -10,8 +10,7 @@ > class TestCP932Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'cp932' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' > \ > - 'WINDOWS/CP932.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' > supmaps = [ > ('\x80', u'\u0080'), > ('\xa0', u'\uf8f0'), > @@ -27,15 +26,14 @@ > unittest.TestCase): > encoding = 'euc_jp' > mapfilename = 'EUC-JP.TXT' > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' > > > class TestSJISCOMPATMap(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'shift_jis' > mapfilename = 'SHIFTJIS.TXT' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ > - '/EASTASIA/JIS/SHIFTJIS.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' > pass_enctest = [ > ('\x81_', u'\\'), > ] > @@ -49,14 +47,14 @@ > unittest.TestCase): > encoding = 'euc_jisx0213' > mapfilename = 'EUC-JISX0213.TXT' > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JISX0213.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' > > > class 
TestSJISX0213Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'shift_jisx0213' > mapfilename = 'SHIFT_JISX0213.TXT' > - mapfileurl = 'http://people.freebsd.org/~ > perky/i18n/SHIFT_JISX0213.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/SHIFT_JISX0213.TXT' > > > def test_main(): > diff --git a/Lib/test/test_codecmaps_kr.py b/Lib/test/test_codecmaps_kr.py > --- a/Lib/test/test_codecmaps_kr.py > +++ b/Lib/test/test_codecmaps_kr.py > @@ -10,14 +10,13 @@ > class TestCP949Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'cp949' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT' > \ > - '/WINDOWS/CP949.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' > > > class TestEUCKRMap(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'euc_kr' > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' > > # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up sequence. > pass_enctest = [('\xa4\xd4', u'\u3164')] > @@ -27,8 +26,7 @@ > class TestJOHABMap(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'johab' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/ > EASTASIA/' \ > - 'KSC/JOHAB.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' > # KS X 1001 standard assigned 0x5c as WON SIGN. > # but, in early 90s that is the only era used johab widely, > # the most softwares implements it as REVERSE SOLIDUS. > diff --git a/Lib/test/test_codecmaps_tw.py b/Lib/test/test_codecmaps_tw.py > --- a/Lib/test/test_codecmaps_tw.py > +++ b/Lib/test/test_codecmaps_tw.py > @@ -10,14 +10,12 @@ > class TestBIG5Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'big5' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ > - 'EASTASIA/OTHER/BIG5.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' > > class TestCP950Map(test_multibytecodec_support.TestBase_Mapping, > unittest.TestCase): > encoding = 'cp950' > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' > \ > - 'WINDOWS/CP950.TXT' > + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' > pass_enctest = [ > ('\xa2\xcc', u'\u5341'), > ('\xa2\xce', u'\u5345'), > diff --git a/Lib/test/test_normalization.py b/Lib/test/test_normalization. > py > --- a/Lib/test/test_normalization.py > +++ b/Lib/test/test_normalization.py > @@ -7,7 +7,7 @@ > from unicodedata import normalize, unidata_version > > TESTDATAFILE = "NormalizationTest.txt" > -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + > "/ucd/" + TESTDATAFILE > +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version + > "/" + TESTDATAFILE > > def check_version(testfile): > hdr = testfile.readline() > > -- > Repository URL: https://hg.python.org/cpython > _______________________________________________ > Python-checkins mailing list > Python-checkins at python.org > https://mail.python.org/mailman/listinfo/python-checkins > -------------- next part -------------- An HTML attachment was scrubbed... 
URL: From benjamin at python.org Thu Nov 6 15:41:50 2014 From: benjamin at python.org (Benjamin Peterson) Date: Thu, 06 Nov 2014 09:41:50 -0500 Subject: [Python-checkins] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net In-Reply-To: References: <20141106135652.108375.20457@psf.io> Message-ID: <1415284910.3978287.187837097.131F9A4E@webmail.messagingengine.com> On Thu, Nov 6, 2014, at 09:39, Brett Cannon wrote: > What is pythontest.net? Is it something we control, and if so how do we > add > things to it for tests? Did I miss an email on python-dev or > python-committers about this? See https://bugs.python.org/issue22650 > > On Thu Nov 06 2014 at 8:57:22 AM georg.brandl > > wrote: > > > https://hg.python.org/cpython/rev/0af36ea1d010 > > changeset: 93417:0af36ea1d010 > > branch: 2.7 > > parent: 93401:3e8d3c4bc17e > > user: Georg Brandl > > date: Thu Nov 06 14:37:49 2014 +0100 > > summary: > > #22650: test suite: load Unicode test data files from www.pythontest.net > > > > files: > > Lib/test/test_codecmaps_cn.py | 8 +++----- > > Lib/test/test_codecmaps_hk.py | 2 +- > > Lib/test/test_codecmaps_jp.py | 12 +++++------- > > Lib/test/test_codecmaps_kr.py | 8 +++----- > > Lib/test/test_codecmaps_tw.py | 6 ++---- > > Lib/test/test_normalization.py | 2 +- > > 6 files changed, 15 insertions(+), 23 deletions(-) > > > > > > diff --git a/Lib/test/test_codecmaps_cn.py b/Lib/test/test_codecmaps_cn.py > > --- a/Lib/test/test_codecmaps_cn.py > > +++ b/Lib/test/test_codecmaps_cn.py > > @@ -10,19 +10,17 @@ > > class TestGB2312Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'gb2312' > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-CN.TXT' > > > > class TestGBKMap(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'gbk' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ > > - 'MICSFT/WINDOWS/CP936.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' > > > > class TestGB18030Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'gb18030' > > - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ > > - 'trunk/charset/data/xml/gb-18030-2000.xml' > > + mapfileurl = 'http://www.pythontest.net/unicode/gb-18030-2000.xml' > > > > > > def test_main(): > > diff --git a/Lib/test/test_codecmaps_hk.py b/Lib/test/test_codecmaps_hk.py > > --- a/Lib/test/test_codecmaps_hk.py > > +++ b/Lib/test/test_codecmaps_hk.py > > @@ -10,7 +10,7 @@ > > class TestBig5HKSCSMap(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'big5hkscs' > > - mapfileurl = 'http://people.freebsd.org/~ > > perky/i18n/BIG5HKSCS-2004.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/BIG5HKSCS-2004.TXT' > > > > def test_main(): > > test_support.run_unittest(__name__) > > diff --git a/Lib/test/test_codecmaps_jp.py b/Lib/test/test_codecmaps_jp.py > > --- a/Lib/test/test_codecmaps_jp.py > > +++ b/Lib/test/test_codecmaps_jp.py > > @@ -10,8 +10,7 @@ > > class TestCP932Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'cp932' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' > > \ > > - 'WINDOWS/CP932.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' > > supmaps = [ > > ('\x80', u'\u0080'), > > ('\xa0', u'\uf8f0'), > > @@ -27,15 +26,14 @@ > > unittest.TestCase): > > 
encoding = 'euc_jp' > > mapfilename = 'EUC-JP.TXT' > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' > > > > > > class TestSJISCOMPATMap(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'shift_jis' > > mapfilename = 'SHIFTJIS.TXT' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ > > - '/EASTASIA/JIS/SHIFTJIS.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' > > pass_enctest = [ > > ('\x81_', u'\\'), > > ] > > @@ -49,14 +47,14 @@ > > unittest.TestCase): > > encoding = 'euc_jisx0213' > > mapfilename = 'EUC-JISX0213.TXT' > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JISX0213.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' > > > > > > class TestSJISX0213Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'shift_jisx0213' > > mapfilename = 'SHIFT_JISX0213.TXT' > > - mapfileurl = 'http://people.freebsd.org/~ > > perky/i18n/SHIFT_JISX0213.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/SHIFT_JISX0213.TXT' > > > > > > def test_main(): > > diff --git a/Lib/test/test_codecmaps_kr.py b/Lib/test/test_codecmaps_kr.py > > --- a/Lib/test/test_codecmaps_kr.py > > +++ b/Lib/test/test_codecmaps_kr.py > > @@ -10,14 +10,13 @@ > > class TestCP949Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'cp949' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT' > > \ > > - '/WINDOWS/CP949.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' > > > > > > class TestEUCKRMap(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'euc_kr' > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' > > > > # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up sequence. > > pass_enctest = [('\xa4\xd4', u'\u3164')] > > @@ -27,8 +26,7 @@ > > class TestJOHABMap(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'johab' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/ > > EASTASIA/' \ > > - 'KSC/JOHAB.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' > > # KS X 1001 standard assigned 0x5c as WON SIGN. > > # but, in early 90s that is the only era used johab widely, > > # the most softwares implements it as REVERSE SOLIDUS. > > diff --git a/Lib/test/test_codecmaps_tw.py b/Lib/test/test_codecmaps_tw.py > > --- a/Lib/test/test_codecmaps_tw.py > > +++ b/Lib/test/test_codecmaps_tw.py > > @@ -10,14 +10,12 @@ > > class TestBIG5Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'big5' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ > > - 'EASTASIA/OTHER/BIG5.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' > > > > class TestCP950Map(test_multibytecodec_support.TestBase_Mapping, > > unittest.TestCase): > > encoding = 'cp950' > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/MICSFT/' > > \ > > - 'WINDOWS/CP950.TXT' > > + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' > > pass_enctest = [ > > ('\xa2\xcc', u'\u5341'), > > ('\xa2\xce', u'\u5345'), > > diff --git a/Lib/test/test_normalization.py b/Lib/test/test_normalization. 
> > py > > --- a/Lib/test/test_normalization.py > > +++ b/Lib/test/test_normalization.py > > @@ -7,7 +7,7 @@ > > from unicodedata import normalize, unidata_version > > > > TESTDATAFILE = "NormalizationTest.txt" > > -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + > > "/ucd/" + TESTDATAFILE > > +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version + > > "/" + TESTDATAFILE > > > > def check_version(testfile): > > hdr = testfile.readline() > > > > -- > > Repository URL: https://hg.python.org/cpython > > _______________________________________________ > > Python-checkins mailing list > > Python-checkins at python.org > > https://mail.python.org/mailman/listinfo/python-checkins > > > _______________________________________________ > Python-checkins mailing list > Python-checkins at python.org > https://mail.python.org/mailman/listinfo/python-checkins From mal at egenix.com Thu Nov 6 16:09:54 2014 From: mal at egenix.com (M.-A. Lemburg) Date: Thu, 06 Nov 2014 16:09:54 +0100 Subject: [Python-checkins] [Python-Dev] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net In-Reply-To: References: <20141106135652.108375.20457@psf.io> Message-ID: <545B8F42.10000@egenix.com> On 06.11.2014 15:39, Brett Cannon wrote: > What is pythontest.net? Is it something we control, and if so how do we add > things to it for tests? Did I miss an email on python-dev or > python-committers about this? pythontest.net is a domain owned by the PSF and run by Donald Stufft and Benjamin (I believe). https://bugs.python.org/issue22650 has the details. > On Thu Nov 06 2014 at 8:57:22 AM georg.brandl > wrote: > >> https://hg.python.org/cpython/rev/0af36ea1d010 >> changeset: 93417:0af36ea1d010 >> branch: 2.7 >> parent: 93401:3e8d3c4bc17e >> user: Georg Brandl >> date: Thu Nov 06 14:37:49 2014 +0100 >> summary: >> #22650: test suite: load Unicode test data files from www.pythontest.net -- Marc-Andre Lemburg eGenix.com Professional Python Services directly from the Source (#1, Nov 06 2014) >>> Python Projects, Consulting and Support ... http://www.egenix.com/ >>> mxODBC.Zope/Plone.Database.Adapter ... http://zope.egenix.com/ >>> mxODBC, mxDateTime, mxTextTools ... http://python.egenix.com/ ________________________________________________________________________ 2014-10-24: Released eGenix pyOpenSSL 0.13.5 ... http://egenix.com/go63 ::::: Try our mxODBC.Connect Python Database Interface for free ! :::::: eGenix.com Software, Skills and Services GmbH Pastor-Loeh-Str.48 D-40764 Langenfeld, Germany. CEO Dipl.-Math. Marc-Andre Lemburg Registered at Amtsgericht Duesseldorf: HRB 46611 http://www.egenix.com/company/contact/ From g.brandl at gmx.net Thu Nov 6 17:43:48 2014 From: g.brandl at gmx.net (Georg Brandl) Date: Thu, 06 Nov 2014 17:43:48 +0100 Subject: [Python-checkins] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net In-Reply-To: References: <20141106135652.108375.20457@psf.io> Message-ID: On 11/06/2014 03:39 PM, Brett Cannon wrote: > What is pythontest.net ? Is it something we control, and > if so how do we add things to it for tests? Did I miss an email on python-dev or > python-committers about this? Benjamin already gave the link to the related issue. The idea is to make the networking tests depend on as few external hosts as possible, so that we can reduce spurious skips or failures when one of them is not reachable or changes its configuration. 
The pythontest.net domain was chosen to be able to test things like cookies or certificates without a potential of compromising python.org related services. There is a repository at hg.python.org/pythontestdotnet which can be used by developers; server configuration is maintained together with other Python services on https://github.com/python/psf-salt. cheers, Georg From bcannon at gmail.com Thu Nov 6 16:41:09 2014 From: bcannon at gmail.com (Brett Cannon) Date: Thu, 06 Nov 2014 15:41:09 +0000 Subject: [Python-checkins] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net References: <20141106135652.108375.20457@psf.io> <1415284910.3978287.187837097.131F9A4E@webmail.messagingengine.com> Message-ID: Ah, cool! Just an FYI, the index.html file is not being served for me. -Brett On Thu Nov 06 2014 at 9:41:59 AM Benjamin Peterson wrote: > > > On Thu, Nov 6, 2014, at 09:39, Brett Cannon wrote: > > What is pythontest.net? Is it something we control, and if so how do we > > add > > things to it for tests? Did I miss an email on python-dev or > > python-committers about this? > > See https://bugs.python.org/issue22650 > > > > > On Thu Nov 06 2014 at 8:57:22 AM georg.brandl > > > > wrote: > > > > > https://hg.python.org/cpython/rev/0af36ea1d010 > > > changeset: 93417:0af36ea1d010 > > > branch: 2.7 > > > parent: 93401:3e8d3c4bc17e > > > user: Georg Brandl > > > date: Thu Nov 06 14:37:49 2014 +0100 > > > summary: > > > #22650: test suite: load Unicode test data files from > www.pythontest.net > > > > > > files: > > > Lib/test/test_codecmaps_cn.py | 8 +++----- > > > Lib/test/test_codecmaps_hk.py | 2 +- > > > Lib/test/test_codecmaps_jp.py | 12 +++++------- > > > Lib/test/test_codecmaps_kr.py | 8 +++----- > > > Lib/test/test_codecmaps_tw.py | 6 ++---- > > > Lib/test/test_normalization.py | 2 +- > > > 6 files changed, 15 insertions(+), 23 deletions(-) > > > > > > > > > diff --git a/Lib/test/test_codecmaps_cn.py > b/Lib/test/test_codecmaps_cn.py > > > --- a/Lib/test/test_codecmaps_cn.py > > > +++ b/Lib/test/test_codecmaps_cn.py > > > @@ -10,19 +10,17 @@ > > > class TestGB2312Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'gb2312' > > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-CN.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-CN.TXT' > > > > > > class TestGBKMap(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'gbk' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/' \ > > > - 'MICSFT/WINDOWS/CP936.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/CP936.TXT' > > > > > > class TestGB18030Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'gb18030' > > > - mapfileurl = 'http://source.icu-project.org/repos/icu/data/' \ > > > - 'trunk/charset/data/xml/gb-18030-2000.xml' > > > + mapfileurl = 'http://www.pythontest.net/unicode/gb-18030-2000.xml > ' > > > > > > > > > def test_main(): > > > diff --git a/Lib/test/test_codecmaps_hk.py > b/Lib/test/test_codecmaps_hk.py > > > --- a/Lib/test/test_codecmaps_hk.py > > > +++ b/Lib/test/test_codecmaps_hk.py > > > @@ -10,7 +10,7 @@ > > > class TestBig5HKSCSMap(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'big5hkscs' > > > - mapfileurl = 'http://people.freebsd.org/~ > > > perky/i18n/BIG5HKSCS-2004.TXT' > > > + mapfileurl = 'http://www.pythontest.net/uni > code/BIG5HKSCS-2004.TXT' > > > > > > def test_main(): 
> > > test_support.run_unittest(__name__) > > > diff --git a/Lib/test/test_codecmaps_jp.py > b/Lib/test/test_codecmaps_jp.py > > > --- a/Lib/test/test_codecmaps_jp.py > > > +++ b/Lib/test/test_codecmaps_jp.py > > > @@ -10,8 +10,7 @@ > > > class TestCP932Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'cp932' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/ > MICSFT/' > > > \ > > > - 'WINDOWS/CP932.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/CP932.TXT' > > > supmaps = [ > > > ('\x80', u'\u0080'), > > > ('\xa0', u'\uf8f0'), > > > @@ -27,15 +26,14 @@ > > > unittest.TestCase): > > > encoding = 'euc_jp' > > > mapfilename = 'EUC-JP.TXT' > > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-JP.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JP.TXT' > > > > > > > > > class TestSJISCOMPATMap(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'shift_jis' > > > mapfilename = 'SHIFTJIS.TXT' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE' \ > > > - '/EASTASIA/JIS/SHIFTJIS.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/SHIFTJIS.TXT' > > > pass_enctest = [ > > > ('\x81_', u'\\'), > > > ] > > > @@ -49,14 +47,14 @@ > > > unittest.TestCase): > > > encoding = 'euc_jisx0213' > > > mapfilename = 'EUC-JISX0213.TXT' > > > - mapfileurl = 'http://people.freebsd.org/~pe > rky/i18n/EUC-JISX0213.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-JISX0213.TXT' > > > > > > > > > class TestSJISX0213Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'shift_jisx0213' > > > mapfilename = 'SHIFT_JISX0213.TXT' > > > - mapfileurl = 'http://people.freebsd.org/~ > > > perky/i18n/SHIFT_JISX0213.TXT' > > > + mapfileurl = 'http://www.pythontest.net/uni > code/SHIFT_JISX0213.TXT' > > > > > > > > > def test_main(): > > > diff --git a/Lib/test/test_codecmaps_kr.py > b/Lib/test/test_codecmaps_kr.py > > > --- a/Lib/test/test_codecmaps_kr.py > > > +++ b/Lib/test/test_codecmaps_kr.py > > > @@ -10,14 +10,13 @@ > > > class TestCP949Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'cp949' > > > - mapfileurl = 'http://www.unicode.org/Public > /MAPPINGS/VENDORS/MICSFT' > > > \ > > > - '/WINDOWS/CP949.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/CP949.TXT' > > > > > > > > > class TestEUCKRMap(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'euc_kr' > > > - mapfileurl = 'http://people.freebsd.org/~perky/i18n/EUC-KR.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/EUC-KR.TXT' > > > > > > # A4D4 HANGUL FILLER indicates the begin of 8-bytes make-up > sequence. > > > pass_enctest = [('\xa4\xd4', u'\u3164')] > > > @@ -27,8 +26,7 @@ > > > class TestJOHABMap(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'johab' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/ > > > EASTASIA/' \ > > > - 'KSC/JOHAB.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/JOHAB.TXT' > > > # KS X 1001 standard assigned 0x5c as WON SIGN. > > > # but, in early 90s that is the only era used johab widely, > > > # the most softwares implements it as REVERSE SOLIDUS. 
> > > diff --git a/Lib/test/test_codecmaps_tw.py > b/Lib/test/test_codecmaps_tw.py > > > --- a/Lib/test/test_codecmaps_tw.py > > > +++ b/Lib/test/test_codecmaps_tw.py > > > @@ -10,14 +10,12 @@ > > > class TestBIG5Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'big5' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/OBSOLETE/' \ > > > - 'EASTASIA/OTHER/BIG5.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/BIG5.TXT' > > > > > > class TestCP950Map(test_multibytecodec_support.TestBase_Mapping, > > > unittest.TestCase): > > > encoding = 'cp950' > > > - mapfileurl = 'http://www.unicode.org/Public/MAPPINGS/VENDORS/ > MICSFT/' > > > \ > > > - 'WINDOWS/CP950.TXT' > > > + mapfileurl = 'http://www.pythontest.net/unicode/CP950.TXT' > > > pass_enctest = [ > > > ('\xa2\xcc', u'\u5341'), > > > ('\xa2\xce', u'\u5345'), > > > diff --git a/Lib/test/test_normalization.py > b/Lib/test/test_normalization. > > > py > > > --- a/Lib/test/test_normalization.py > > > +++ b/Lib/test/test_normalization.py > > > @@ -7,7 +7,7 @@ > > > from unicodedata import normalize, unidata_version > > > > > > TESTDATAFILE = "NormalizationTest.txt" > > > -TESTDATAURL = "http://www.unicode.org/Public/" + unidata_version + > > > "/ucd/" + TESTDATAFILE > > > +TESTDATAURL = "http://www.pythontest.net/unicode/" + unidata_version > + > > > "/" + TESTDATAFILE > > > > > > def check_version(testfile): > > > hdr = testfile.readline() > > > > > > -- > > > Repository URL: https://hg.python.org/cpython > > > _______________________________________________ > > > Python-checkins mailing list > > > Python-checkins at python.org > > > https://mail.python.org/mailman/listinfo/python-checkins > > > > > _______________________________________________ > > Python-checkins mailing list > > Python-checkins at python.org > > https://mail.python.org/mailman/listinfo/python-checkins > _______________________________________________ > Python-checkins mailing list > Python-checkins at python.org > https://mail.python.org/mailman/listinfo/python-checkins > -------------- next part -------------- An HTML attachment was scrubbed... URL: From benjamin at python.org Thu Nov 6 17:56:31 2014 From: benjamin at python.org (Benjamin Peterson) Date: Thu, 06 Nov 2014 11:56:31 -0500 Subject: [Python-checkins] [Python-Dev] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net In-Reply-To: References: <20141106135652.108375.20457@psf.io> <1415284910.3978287.187837097.131F9A4E@webmail.messagingengine.com> Message-ID: <1415292991.4007266.187895233.3A8B1517@webmail.messagingengine.com> On Thu, Nov 6, 2014, at 10:41, Brett Cannon wrote: > Ah, cool! Just an FYI, the index.html file is not being served for me. At the moment it's only served on www. 
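As a quick, illustrative check (not part of the commit), one of the relocated mapping files can be fetched directly from the new host; EUC-KR.TXT is one of the URLs the updated tests point at, and urllib is used here only for the example:

    import urllib.request

    # Fetch one of the codec mapping files now served from www.pythontest.net.
    url = "http://www.pythontest.net/unicode/EUC-KR.TXT"
    with urllib.request.urlopen(url) as resp:
        first_line = resp.readline().decode("ascii", "replace")
    print(first_line)

The test suite itself goes through its own download helpers and caching, so this is only a sketch of where the data now lives.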
From solipsis at pitrou.net Fri Nov 7 10:22:52 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Fri, 07 Nov 2014 10:22:52 +0100 Subject: [Python-checkins] Daily reference leaks (a688d3206646): sum=3 Message-ID: results for a688d3206646 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogbqyikb', '-x'] From python-checkins at python.org Fri Nov 7 11:12:38 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:12:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogSXNzdWUgIzIyNzY5OiBGaXhlZCB0dGsuVHJlZXZpZXcudGFnX2hhcygp?= =?utf-8?q?_when_called_without_arguments=2E?= Message-ID: <20141107101238.85210.46022@psf.io> https://hg.python.org/cpython/rev/0b56adcb737d changeset: 93423:0b56adcb737d parent: 93420:a688d3206646 parent: 93422:cd17aa63492e user: Serhiy Storchaka date: Fri Nov 07 12:03:09 2014 +0200 summary: Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. files: Lib/tkinter/test/test_ttk/test_widgets.py | 17 ++++++++++- Lib/tkinter/ttk.py | 6 +++- Misc/NEWS | 2 + 3 files changed, 23 insertions(+), 2 deletions(-) diff --git a/Lib/tkinter/test/test_ttk/test_widgets.py b/Lib/tkinter/test/test_ttk/test_widgets.py --- a/Lib/tkinter/test/test_ttk/test_widgets.py +++ b/Lib/tkinter/test/test_ttk/test_widgets.py @@ -1,6 +1,6 @@ import unittest import tkinter -from tkinter import ttk +from tkinter import ttk, TclError from test.support import requires import sys @@ -1563,6 +1563,21 @@ 'blue') self.assertIsInstance(self.tv.tag_configure('test'), dict) + def test_tag_has(self): + item1 = self.tv.insert('', 'end', text='Item 1', tags=['tag1']) + item2 = self.tv.insert('', 'end', text='Item 2', tags=['tag2']) + self.assertRaises(TypeError, self.tv.tag_has) + self.assertRaises(TclError, self.tv.tag_has, 'tag1', 'non-existing') + self.assertTrue(self.tv.tag_has('tag1', item1)) + self.assertFalse(self.tv.tag_has('tag1', item2)) + self.assertFalse(self.tv.tag_has('tag2', item1)) + self.assertTrue(self.tv.tag_has('tag2', item2)) + self.assertFalse(self.tv.tag_has('tag3', item1)) + self.assertFalse(self.tv.tag_has('tag3', item2)) + self.assertEqual(self.tv.tag_has('tag1'), (item1,)) + self.assertEqual(self.tv.tag_has('tag2'), (item2,)) + self.assertEqual(self.tv.tag_has('tag3'), ()) + @add_standard_options(StandardTtkOptionsTests) class SeparatorTest(AbstractWidgetTest, unittest.TestCase): diff --git a/Lib/tkinter/ttk.py b/Lib/tkinter/ttk.py --- a/Lib/tkinter/ttk.py +++ b/Lib/tkinter/ttk.py @@ -1456,7 +1456,11 @@ all items which have the specified tag. * Availability: Tk 8.6""" - return self.tk.getboolean( + if item is None: + return self.tk.splitlist( + self.tk.call(self._w, "tag", "has", tagname)) + else: + return self.tk.getboolean( self.tk.call(self._w, "tag", "has", tagname, item)) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,8 @@ Library ------- +- Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. + - Issue #22417: Verify certificates by default in httplib (PEP 476). 
- Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 11:12:37 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:12:37 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNzY5?= =?utf-8?q?=3A_Fixed_ttk=2ETreeview=2Etag=5Fhas=28=29_when_called_without_?= =?utf-8?q?arguments=2E?= Message-ID: <20141107101237.113474.24233@psf.io> https://hg.python.org/cpython/rev/b3a5b53173c0 changeset: 93421:b3a5b53173c0 branch: 2.7 parent: 93418:14a69e40dbb0 user: Serhiy Storchaka date: Fri Nov 07 12:02:11 2014 +0200 summary: Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. files: Lib/lib-tk/test/test_ttk/test_widgets.py | 16 ++++++++++++ Lib/lib-tk/ttk.py | 6 +++- Misc/NEWS | 2 + 3 files changed, 23 insertions(+), 1 deletions(-) diff --git a/Lib/lib-tk/test/test_ttk/test_widgets.py b/Lib/lib-tk/test/test_ttk/test_widgets.py --- a/Lib/lib-tk/test/test_ttk/test_widgets.py +++ b/Lib/lib-tk/test/test_ttk/test_widgets.py @@ -1,5 +1,6 @@ import unittest import Tkinter as tkinter +from Tkinter import TclError import ttk from test.test_support import requires, run_unittest import sys @@ -1564,6 +1565,21 @@ 'blue') self.assertIsInstance(self.tv.tag_configure('test'), dict) + def test_tag_has(self): + item1 = self.tv.insert('', 'end', text='Item 1', tags=['tag1']) + item2 = self.tv.insert('', 'end', text='Item 2', tags=['tag2']) + self.assertRaises(TypeError, self.tv.tag_has) + self.assertRaises(TclError, self.tv.tag_has, 'tag1', 'non-existing') + self.assertTrue(self.tv.tag_has('tag1', item1)) + self.assertFalse(self.tv.tag_has('tag1', item2)) + self.assertFalse(self.tv.tag_has('tag2', item1)) + self.assertTrue(self.tv.tag_has('tag2', item2)) + self.assertFalse(self.tv.tag_has('tag3', item1)) + self.assertFalse(self.tv.tag_has('tag3', item2)) + self.assertEqual(self.tv.tag_has('tag1'), (item1,)) + self.assertEqual(self.tv.tag_has('tag2'), (item2,)) + self.assertEqual(self.tv.tag_has('tag3'), ()) + @add_standard_options(StandardTtkOptionsTests) class SeparatorTest(AbstractWidgetTest, unittest.TestCase): diff --git a/Lib/lib-tk/ttk.py b/Lib/lib-tk/ttk.py --- a/Lib/lib-tk/ttk.py +++ b/Lib/lib-tk/ttk.py @@ -1458,7 +1458,11 @@ all items which have the specified tag. * Availability: Tk 8.6""" - return self.tk.getboolean( + if item is None: + return self.tk.splitlist( + self.tk.call(self._w, "tag", "has", tagname)) + else: + return self.tk.getboolean( self.tk.call(self._w, "tag", "has", tagname, item)) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,8 @@ Library ------- +- Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. + - Issue #22787: Allow the keyfile argument of SSLContext.load_cert_chain to be None. 
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 11:12:38 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:12:38 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNzY5?= =?utf-8?q?=3A_Fixed_ttk=2ETreeview=2Etag=5Fhas=28=29_when_called_without_?= =?utf-8?q?arguments=2E?= Message-ID: <20141107101237.713.97497@psf.io> https://hg.python.org/cpython/rev/cd17aa63492e changeset: 93422:cd17aa63492e branch: 3.4 parent: 93419:540b022ae7a9 user: Serhiy Storchaka date: Fri Nov 07 12:02:31 2014 +0200 summary: Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. files: Lib/tkinter/test/test_ttk/test_widgets.py | 17 ++++++++++- Lib/tkinter/ttk.py | 6 +++- Misc/NEWS | 2 + 3 files changed, 23 insertions(+), 2 deletions(-) diff --git a/Lib/tkinter/test/test_ttk/test_widgets.py b/Lib/tkinter/test/test_ttk/test_widgets.py --- a/Lib/tkinter/test/test_ttk/test_widgets.py +++ b/Lib/tkinter/test/test_ttk/test_widgets.py @@ -1,6 +1,6 @@ import unittest import tkinter -from tkinter import ttk +from tkinter import ttk, TclError from test.support import requires import sys @@ -1563,6 +1563,21 @@ 'blue') self.assertIsInstance(self.tv.tag_configure('test'), dict) + def test_tag_has(self): + item1 = self.tv.insert('', 'end', text='Item 1', tags=['tag1']) + item2 = self.tv.insert('', 'end', text='Item 2', tags=['tag2']) + self.assertRaises(TypeError, self.tv.tag_has) + self.assertRaises(TclError, self.tv.tag_has, 'tag1', 'non-existing') + self.assertTrue(self.tv.tag_has('tag1', item1)) + self.assertFalse(self.tv.tag_has('tag1', item2)) + self.assertFalse(self.tv.tag_has('tag2', item1)) + self.assertTrue(self.tv.tag_has('tag2', item2)) + self.assertFalse(self.tv.tag_has('tag3', item1)) + self.assertFalse(self.tv.tag_has('tag3', item2)) + self.assertEqual(self.tv.tag_has('tag1'), (item1,)) + self.assertEqual(self.tv.tag_has('tag2'), (item2,)) + self.assertEqual(self.tv.tag_has('tag3'), ()) + @add_standard_options(StandardTtkOptionsTests) class SeparatorTest(AbstractWidgetTest, unittest.TestCase): diff --git a/Lib/tkinter/ttk.py b/Lib/tkinter/ttk.py --- a/Lib/tkinter/ttk.py +++ b/Lib/tkinter/ttk.py @@ -1456,7 +1456,11 @@ all items which have the specified tag. * Availability: Tk 8.6""" - return self.tk.getboolean( + if item is None: + return self.tk.splitlist( + self.tk.call(self._w, "tag", "has", tagname)) + else: + return self.tk.getboolean( self.tk.call(self._w, "tag", "has", tagname, item)) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. + - Issue #22417: Verify certificates by default in httplib (PEP 476). - Issue #22775: Fixed unpickling of http.cookies.SimpleCookie with protocol 2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 11:27:22 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:27:22 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE3Mjkz?= =?utf-8?q?=3A_uuid=2Egetnode=28=29_now_determines_MAC_address_on_AIX_usin?= =?utf-8?q?g_netstat=2E?= Message-ID: <20141107102720.85196.62034@psf.io> https://hg.python.org/cpython/rev/e80cb046e764 changeset: 93424:e80cb046e764 branch: 2.7 parent: 93421:b3a5b53173c0 user: Serhiy Storchaka date: Fri Nov 07 12:19:23 2014 +0200 summary: Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. 
Based on patch by Aivars Kalv?ns. files: Lib/test/test_uuid.py | 18 ++++++++ Lib/uuid.py | 68 ++++++++++++++++++++++-------- Misc/NEWS | 3 + 3 files changed, 71 insertions(+), 18 deletions(-) diff --git a/Lib/test/test_uuid.py b/Lib/test/test_uuid.py --- a/Lib/test/test_uuid.py +++ b/Lib/test/test_uuid.py @@ -307,6 +307,24 @@ if node is not None: self.check_node(node, 'ifconfig') + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_arp_getnode(self): + node = uuid._arp_getnode() + if node is not None: + self.check_node(node, 'arp') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_lanscan_getnode(self): + node = uuid._lanscan_getnode() + if node is not None: + self.check_node(node, 'lanscan') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_netstat_getnode(self): + node = uuid._netstat_getnode() + if node is not None: + self.check_node(node, 'netstat') + @unittest.skipUnless(os.name == 'nt', 'requires Windows') def test_ipconfig_getnode(self): node = uuid._ipconfig_getnode() diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -291,7 +291,7 @@ version = property(get_version) -def _find_mac(command, args, hw_identifiers, get_index): +def _popen(command, args): import os path = os.environ.get("PATH", os.defpath).split(os.pathsep) path.extend(('/sbin', '/usr/sbin')) @@ -303,19 +303,27 @@ break else: return None + # LC_ALL to ensure English output, 2>/dev/null to prevent output on + # stderr (Note: we don't have an example where the words we search for + # are actually localized, but in theory some system could do so.) + cmd = 'LC_ALL=C %s %s 2>/dev/null' % (executable, args) + return os.popen(cmd) +def _find_mac(command, args, hw_identifiers, get_index): try: - # LC_ALL to ensure English output, 2>/dev/null to - # prevent output on stderr - cmd = 'LC_ALL=C %s %s 2>/dev/null' % (executable, args) - with os.popen(cmd) as pipe: + pipe = _popen(command, args) + if not pipe: + return + with pipe: for line in pipe: - words = line.lower().split() + words = line.lower().rstrip().split() for i in range(len(words)): if words[i] in hw_identifiers: try: - return int( - words[get_index(i)].replace(':', ''), 16) + word = words[get_index(i)] + mac = int(word.replace(':', ''), 16) + if mac: + return mac except (ValueError, IndexError): # Virtual interfaces, such as those provided by # VPNs, do not have a colon-delimited MAC address @@ -328,27 +336,50 @@ def _ifconfig_getnode(): """Get the hardware address on Unix by running ifconfig.""" - # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes. for args in ('', '-a', '-av'): mac = _find_mac('ifconfig', args, ['hwaddr', 'ether'], lambda i: i+1) if mac: return mac - import socket +def _arp_getnode(): + """Get the hardware address on Unix by running arp.""" + import os, socket ip_addr = socket.gethostbyname(socket.gethostname()) # Try getting the MAC addr from arp based on our IP address (Solaris). - mac = _find_mac('arp', '-an', [ip_addr], lambda i: -1) - if mac: - return mac + return _find_mac('arp', '-an', [ip_addr], lambda i: -1) +def _lanscan_getnode(): + """Get the hardware address on Unix by running lanscan.""" # This might work on HP-UX. - mac = _find_mac('lanscan', '-ai', ['lan0'], lambda i: 0) - if mac: - return mac + return _find_mac('lanscan', '-ai', ['lan0'], lambda i: 0) - return None +def _netstat_getnode(): + """Get the hardware address on Unix by running netstat.""" + # This might work on AIX, Tru64 UNIX and presumably on IRIX. 
+ try: + pipe = _popen('netstat', '-ia') + if not pipe: + return + with pipe: + words = pipe.readline().rstrip().split() + try: + i = words.index('Address') + except ValueError: + return + for line in pipe: + try: + words = line.rstrip().split() + word = words[i] + if len(word) == 17 and word.count(':') == 5: + mac = int(word.replace(':', ''), 16) + if mac: + return mac + except (ValueError, IndexError): + pass + except OSError: + pass def _ipconfig_getnode(): """Get the hardware address on Windows by running ipconfig.exe.""" @@ -488,7 +519,8 @@ if sys.platform == 'win32': getters = [_windll_getnode, _netbios_getnode, _ipconfig_getnode] else: - getters = [_unixdll_getnode, _ifconfig_getnode] + getters = [_unixdll_getnode, _ifconfig_getnode, _arp_getnode, + _lanscan_getnode, _netstat_getnode] for getter in getters + [_random_getnode]: try: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. + Based on patch by Aivars Kalv?ns. + - Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. - Issue #22787: Allow the keyfile argument of SSLContext.load_cert_chain to be -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 11:27:22 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:27:22 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE3Mjkz?= =?utf-8?q?=3A_uuid=2Egetnode=28=29_now_determines_MAC_address_on_AIX_usin?= =?utf-8?q?g_netstat=2E?= Message-ID: <20141107102720.108381.11741@psf.io> https://hg.python.org/cpython/rev/ba4b31ed2952 changeset: 93425:ba4b31ed2952 branch: 3.4 parent: 93422:cd17aa63492e user: Serhiy Storchaka date: Fri Nov 07 12:19:40 2014 +0200 summary: Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. Based on patch by Aivars Kalv?ns. 
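For illustration only, here is a minimal standalone sketch of the netstat-based lookup this patch adds (assumptions: Python 3 and a netstat binary on PATH; this is not the patched uuid code itself, which reuses _popen() as shown in the diff above):

    import subprocess

    def netstat_mac_sketch():
        # Rough sketch of what uuid._netstat_getnode() does: run `netstat -ia`,
        # find the "Address" column in the header, then return the first
        # aa:bb:cc:dd:ee:ff token in that column as an integer.
        try:
            out = subprocess.check_output(['netstat', '-ia'],
                                          stderr=subprocess.DEVNULL)
        except (OSError, subprocess.CalledProcessError):
            return None
        lines = out.decode('ascii', 'replace').splitlines()
        if not lines:
            return None
        try:
            column = lines[0].split().index('Address')
        except ValueError:
            return None
        for line in lines[1:]:
            words = line.split()
            if len(words) > column:
                word = words[column]
                if len(word) == 17 and word.count(':') == 5:
                    try:
                        mac = int(word.replace(':', ''), 16)
                    except ValueError:
                        continue
                    if mac:
                        return mac
        return None

On platforms whose netstat output has no "Address" column this simply returns None, mirroring how getnode() falls through to the next getter.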
files: Lib/test/test_uuid.py | 18 ++++++++ Lib/uuid.py | 69 ++++++++++++++++++++++-------- Misc/NEWS | 3 + 3 files changed, 71 insertions(+), 19 deletions(-) diff --git a/Lib/test/test_uuid.py b/Lib/test/test_uuid.py --- a/Lib/test/test_uuid.py +++ b/Lib/test/test_uuid.py @@ -319,6 +319,24 @@ if node is not None: self.check_node(node, 'ifconfig') + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_arp_getnode(self): + node = uuid._arp_getnode() + if node is not None: + self.check_node(node, 'arp') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_lanscan_getnode(self): + node = uuid._lanscan_getnode() + if node is not None: + self.check_node(node, 'lanscan') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_netstat_getnode(self): + node = uuid._netstat_getnode() + if node is not None: + self.check_node(node, 'netstat') + @unittest.skipUnless(os.name == 'nt', 'requires Windows') def test_ipconfig_getnode(self): node = uuid._ipconfig_getnode() diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -311,7 +311,7 @@ if self.variant == RFC_4122: return int((self.int >> 76) & 0xf) -def _find_mac(command, args, hw_identifiers, get_index): +def _popen(command, args): import os, shutil executable = shutil.which(command) if executable is None: @@ -319,20 +319,27 @@ executable = shutil.which(command, path=path) if executable is None: return None + # LC_ALL to ensure English output, 2>/dev/null to prevent output on + # stderr (Note: we don't have an example where the words we search for + # are actually localized, but in theory some system could do so.) + cmd = 'LC_ALL=C %s %s 2>/dev/null' % (executable, args) + return os.popen(cmd) +def _find_mac(command, args, hw_identifiers, get_index): try: - # LC_ALL to ensure English output, 2>/dev/null to prevent output on - # stderr (Note: we don't have an example where the words we search for - # are actually localized, but in theory some system could do so.) - cmd = 'LC_ALL=C %s %s 2>/dev/null' % (executable, args) - with os.popen(cmd) as pipe: + pipe = _popen(command, args) + if not pipe: + return + with pipe: for line in pipe: - words = line.lower().split() + words = line.lower().rstrip().split() for i in range(len(words)): if words[i] in hw_identifiers: try: - return int( - words[get_index(i)].replace(':', ''), 16) + word = words[get_index(i)] + mac = int(word.replace(':', ''), 16) + if mac: + return mac except (ValueError, IndexError): # Virtual interfaces, such as those provided by # VPNs, do not have a colon-delimited MAC address @@ -345,27 +352,50 @@ def _ifconfig_getnode(): """Get the hardware address on Unix by running ifconfig.""" - # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes. for args in ('', '-a', '-av'): mac = _find_mac('ifconfig', args, ['hwaddr', 'ether'], lambda i: i+1) if mac: return mac - import socket +def _arp_getnode(): + """Get the hardware address on Unix by running arp.""" + import os, socket ip_addr = socket.gethostbyname(socket.gethostname()) # Try getting the MAC addr from arp based on our IP address (Solaris). - mac = _find_mac('arp', '-an', [ip_addr], lambda i: -1) - if mac: - return mac + return _find_mac('arp', '-an', [ip_addr], lambda i: -1) +def _lanscan_getnode(): + """Get the hardware address on Unix by running lanscan.""" # This might work on HP-UX. 
- mac = _find_mac('lanscan', '-ai', ['lan0'], lambda i: 0) - if mac: - return mac + return _find_mac('lanscan', '-ai', ['lan0'], lambda i: 0) - return None +def _netstat_getnode(): + """Get the hardware address on Unix by running netstat.""" + # This might work on AIX, Tru64 UNIX and presumably on IRIX. + try: + pipe = _popen('netstat', '-ia') + if not pipe: + return + with pipe: + words = pipe.readline().rstrip().split() + try: + i = words.index('Address') + except ValueError: + return + for line in pipe: + try: + words = line.rstrip().split() + word = words[i] + if len(word) == 17 and word.count(':') == 5: + mac = int(word.replace(':', ''), 16) + if mac: + return mac + except (ValueError, IndexError): + pass + except OSError: + pass def _ipconfig_getnode(): """Get the hardware address on Windows by running ipconfig.exe.""" @@ -506,7 +536,8 @@ if sys.platform == 'win32': getters = [_windll_getnode, _netbios_getnode, _ipconfig_getnode] else: - getters = [_unixdll_getnode, _ifconfig_getnode] + getters = [_unixdll_getnode, _ifconfig_getnode, _arp_getnode, + _lanscan_getnode, _netstat_getnode] for getter in getters + [_random_getnode]: try: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. + Based on patch by Aivars Kalv?ns. + - Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. - Issue #22417: Verify certificates by default in httplib (PEP 476). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 11:27:22 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 10:27:22 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2317293=3A_uuid=2Egetnode=28=29_now_determines_MA?= =?utf-8?q?C_address_on_AIX_using_netstat=2E?= Message-ID: <20141107102720.731.88914@psf.io> https://hg.python.org/cpython/rev/3e4f3cc4f1f9 changeset: 93426:3e4f3cc4f1f9 parent: 93423:0b56adcb737d parent: 93425:ba4b31ed2952 user: Serhiy Storchaka date: Fri Nov 07 12:23:30 2014 +0200 summary: Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. Based on patch by Aivars Kalv?ns. 
files: Lib/test/test_uuid.py | 20 +++++++- Lib/uuid.py | 81 ++++++++++++++++++++---------- Misc/NEWS | 3 + 3 files changed, 76 insertions(+), 28 deletions(-) diff --git a/Lib/test/test_uuid.py b/Lib/test/test_uuid.py --- a/Lib/test/test_uuid.py +++ b/Lib/test/test_uuid.py @@ -320,6 +320,24 @@ if node is not None: self.check_node(node, 'ifconfig') + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_arp_getnode(self): + node = uuid._arp_getnode() + if node is not None: + self.check_node(node, 'arp') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_lanscan_getnode(self): + node = uuid._lanscan_getnode() + if node is not None: + self.check_node(node, 'lanscan') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_netstat_getnode(self): + node = uuid._netstat_getnode() + if node is not None: + self.check_node(node, 'netstat') + @unittest.skipUnless(os.name == 'nt', 'requires Windows') def test_ipconfig_getnode(self): node = uuid._ipconfig_getnode() @@ -377,7 +395,7 @@ return_value=popen): mac = uuid._find_mac( command='ifconfig', - arg='', + args='', hw_identifiers=[b'hwaddr'], get_index=lambda x: x + 1, ) diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -304,7 +304,7 @@ if self.variant == RFC_4122: return int((self.int >> 76) & 0xf) -def _find_mac(command, arg, hw_identifiers, get_index): +def _popen(command, *args): import os, shutil, subprocess executable = shutil.which(command) if executable is None: @@ -312,28 +312,32 @@ executable = shutil.which(command, path=path) if executable is None: return None + # LC_ALL=C to ensure English output, stderr=DEVNULL to prevent output + # on stderr (Note: we don't have an example where the words we search + # for are actually localized, but in theory some system could do so.) + env = dict(os.environ) + env['LC_ALL'] = 'C' + proc = subprocess.Popen((executable,) + args, + stdout=subprocess.PIPE, + stderr=subprocess.DEVNULL, + env=env) + return proc +def _find_mac(command, args, hw_identifiers, get_index): try: - # LC_ALL=C to ensure English output, stderr=DEVNULL to prevent output - # on stderr (Note: we don't have an example where the words we search - # for are actually localized, but in theory some system could do so.) - env = dict(os.environ) - env['LC_ALL'] = 'C' - cmd = [executable] - if arg: - cmd.append(arg) - proc = subprocess.Popen(cmd, - stdout=subprocess.PIPE, - stderr=subprocess.DEVNULL, - env=env) + proc = _popen(command, *args.split()) + if not proc: + return with proc: for line in proc.stdout: - words = line.lower().split() + words = line.lower().rstrip().split() for i in range(len(words)): if words[i] in hw_identifiers: try: - return int( - words[get_index(i)].replace(b':', b''), 16) + word = words[get_index(i)] + mac = int(word.replace(b':', b''), 16) + if mac: + return mac except (ValueError, IndexError): # Virtual interfaces, such as those provided by # VPNs, do not have a colon-delimited MAC address @@ -346,28 +350,50 @@ def _ifconfig_getnode(): """Get the hardware address on Unix by running ifconfig.""" - import os - # This works on Linux ('' or '-a'), Tru64 ('-av'), but not all Unixes. for args in ('', '-a', '-av'): mac = _find_mac('ifconfig', args, [b'hwaddr', b'ether'], lambda i: i+1) if mac: return mac - import socket +def _arp_getnode(): + """Get the hardware address on Unix by running arp.""" + import os, socket ip_addr = socket.gethostbyname(socket.gethostname()) # Try getting the MAC addr from arp based on our IP address (Solaris). 
- mac = _find_mac('arp', '-an', [os.fsencode(ip_addr)], lambda i: -1) - if mac: - return mac + return _find_mac('arp', '-an', [os.fsencode(ip_addr)], lambda i: -1) +def _lanscan_getnode(): + """Get the hardware address on Unix by running lanscan.""" # This might work on HP-UX. - mac = _find_mac('lanscan', '-ai', [b'lan0'], lambda i: 0) - if mac: - return mac + return _find_mac('lanscan', '-ai', [b'lan0'], lambda i: 0) - return None +def _netstat_getnode(): + """Get the hardware address on Unix by running netstat.""" + # This might work on AIX, Tru64 UNIX and presumably on IRIX. + try: + proc = _popen('netstat', '-ia') + if not proc: + return + with proc: + words = proc.stdout.readline().rstrip().split() + try: + i = words.index(b'Address') + except ValueError: + return + for line in proc.stdout: + try: + words = line.rstrip().split() + word = words[i] + if len(word) == 17 and word.count(b':') == 5: + mac = int(word.replace(b':', b''), 16) + if mac: + return mac + except (ValueError, IndexError): + pass + except OSError: + pass def _ipconfig_getnode(): """Get the hardware address on Windows by running ipconfig.exe.""" @@ -509,7 +535,8 @@ if sys.platform == 'win32': getters = [_windll_getnode, _netbios_getnode, _ipconfig_getnode] else: - getters = [_unixdll_getnode, _ifconfig_getnode] + getters = [_unixdll_getnode, _ifconfig_getnode, _arp_getnode, + _lanscan_getnode, _netstat_getnode] for getter in getters + [_random_getnode]: try: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. + Based on patch by Aivars Kalv?ns. + - Issue #22769: Fixed ttk.Treeview.tag_has() when called without arguments. - Issue #22417: Verify certificates by default in httplib (PEP 476). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 13:12:47 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 12:12:47 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNDA2?= =?utf-8?q?=3A_Fixed_the_uu=5Fcodec_codec_incorrectly_ported_to_3=2Ex=2E?= Message-ID: <20141107121243.85202.47710@psf.io> https://hg.python.org/cpython/rev/ad89a652b4ed changeset: 93427:ad89a652b4ed branch: 3.4 parent: 93425:ba4b31ed2952 user: Serhiy Storchaka date: Fri Nov 07 14:04:37 2014 +0200 summary: Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. Based on patch by Martin Panter. 
files: Lib/encodings/uu_codec.py | 2 +- Lib/test/test_codecs.py | 4 ++++ Lib/test/test_uu.py | 22 ++++++++++++++++++++++ Misc/NEWS | 3 +++ 4 files changed, 30 insertions(+), 1 deletions(-) diff --git a/Lib/encodings/uu_codec.py b/Lib/encodings/uu_codec.py --- a/Lib/encodings/uu_codec.py +++ b/Lib/encodings/uu_codec.py @@ -54,7 +54,7 @@ data = binascii.a2b_uu(s) except binascii.Error as v: # Workaround for broken uuencoders by /Fredrik Lundh - nbytes = (((ord(s[0])-32) & 63) * 4 + 5) / 3 + nbytes = (((s[0]-32) & 63) * 4 + 5) // 3 data = binascii.a2b_uu(s[:nbytes]) #sys.stderr.write("Warning: %s\n" % str(v)) write(data) diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py --- a/Lib/test/test_codecs.py +++ b/Lib/test/test_codecs.py @@ -2563,6 +2563,10 @@ info = codecs.lookup(alias) self.assertEqual(info.name, expected_name) + def test_uu_invalid(self): + # Missing "begin" line + self.assertRaises(ValueError, codecs.decode, b"", "uu-codec") + # The codec system tries to wrap exceptions in order to ensure the error # mentions the operation being performed and the codec involved. We diff --git a/Lib/test/test_uu.py b/Lib/test/test_uu.py --- a/Lib/test/test_uu.py +++ b/Lib/test/test_uu.py @@ -93,6 +93,28 @@ except uu.Error as e: self.assertEqual(str(e), "No valid begin line found in input file") + def test_garbage_padding(self): + # Issue #22406 + encodedtext = ( + b"begin 644 file\n" + # length 1; bits 001100 111111 111111 111111 + b"\x21\x2C\x5F\x5F\x5F\n" + b"\x20\n" + b"end\n" + ) + plaintext = b"\x33" # 00110011 + + with self.subTest("uu.decode()"): + inp = io.BytesIO(encodedtext) + out = io.BytesIO() + uu.decode(inp, out, quiet=True) + self.assertEqual(out.getvalue(), plaintext) + + with self.subTest("uu_codec"): + import codecs + decoded = codecs.decode(encodedtext, "uu_codec") + self.assertEqual(decoded, plaintext) + class UUStdIOTest(unittest.TestCase): def setUp(self): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. + Based on patch by Martin Panter. + - Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. Based on patch by Aivars Kalv?ns. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 13:12:47 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 12:12:47 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Backported_tes?= =?utf-8?q?ts_for_issue_=2322406=2E?= Message-ID: <20141107121244.113468.37884@psf.io> https://hg.python.org/cpython/rev/7b82b58b8329 changeset: 93429:7b82b58b8329 branch: 2.7 parent: 93424:e80cb046e764 user: Serhiy Storchaka date: Fri Nov 07 14:07:43 2014 +0200 summary: Backported tests for issue #22406. 
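With the fix applied, the garbage-padded sample used by these tests decodes as expected; a small Python 3 sketch reusing the same data:

    import codecs

    # The uuencoded test data from the patch: the length byte announces one
    # payload byte, followed by garbage padding that used to break decoding.
    encodedtext = (
        b"begin 644 file\n"
        b"\x21\x2C\x5F\x5F\x5F\n"
        b"\x20\n"
        b"end\n"
    )

    decoded = codecs.decode(encodedtext, "uu_codec")
    assert decoded == b"\x33"  # the single expected payload byte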
files: Lib/test/test_codecs.py | 4 ++++ Lib/test/test_uu.py | 20 ++++++++++++++++++++ 2 files changed, 24 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py --- a/Lib/test/test_codecs.py +++ b/Lib/test/test_codecs.py @@ -2109,6 +2109,10 @@ BomTest, ) + def test_uu_invalid(self): + # Missing "begin" line + self.assertRaises(ValueError, codecs.decode, "", "uu-codec") + if __name__ == "__main__": test_main() diff --git a/Lib/test/test_uu.py b/Lib/test/test_uu.py --- a/Lib/test/test_uu.py +++ b/Lib/test/test_uu.py @@ -61,6 +61,26 @@ except uu.Error, e: self.assertEqual(str(e), "No valid begin line found in input file") + def test_garbage_padding(self): + # Issue #22406 + encodedtext = ( + "begin 644 file\n" + # length 1; bits 001100 111111 111111 111111 + "\x21\x2C\x5F\x5F\x5F\n" + "\x20\n" + "end\n" + ) + plaintext = "\x33" # 00110011 + + inp = cStringIO.StringIO(encodedtext) + out = cStringIO.StringIO() + uu.decode(inp, out, quiet=True) + self.assertEqual(out.getvalue(), plaintext) + + import codecs + decoded = codecs.decode(encodedtext, "uu_codec") + self.assertEqual(decoded, plaintext) + class UUStdIOTest(unittest.TestCase): def setUp(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 13:12:47 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 12:12:47 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322406=3A_Fixed_the_uu=5Fcodec_codec_incorrectly?= =?utf-8?q?_ported_to_3=2Ex=2E?= Message-ID: <20141107121244.108375.25405@psf.io> https://hg.python.org/cpython/rev/b18ef4a3e7c1 changeset: 93428:b18ef4a3e7c1 parent: 93426:3e4f3cc4f1f9 parent: 93427:ad89a652b4ed user: Serhiy Storchaka date: Fri Nov 07 14:06:19 2014 +0200 summary: Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. Based on patch by Martin Panter. files: Lib/encodings/uu_codec.py | 2 +- Lib/test/test_codecs.py | 4 ++++ Lib/test/test_uu.py | 22 ++++++++++++++++++++++ Misc/NEWS | 3 +++ 4 files changed, 30 insertions(+), 1 deletions(-) diff --git a/Lib/encodings/uu_codec.py b/Lib/encodings/uu_codec.py --- a/Lib/encodings/uu_codec.py +++ b/Lib/encodings/uu_codec.py @@ -54,7 +54,7 @@ data = binascii.a2b_uu(s) except binascii.Error as v: # Workaround for broken uuencoders by /Fredrik Lundh - nbytes = (((ord(s[0])-32) & 63) * 4 + 5) / 3 + nbytes = (((s[0]-32) & 63) * 4 + 5) // 3 data = binascii.a2b_uu(s[:nbytes]) #sys.stderr.write("Warning: %s\n" % str(v)) write(data) diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py --- a/Lib/test/test_codecs.py +++ b/Lib/test/test_codecs.py @@ -2571,6 +2571,10 @@ info = codecs.lookup(alias) self.assertEqual(info.name, expected_name) + def test_uu_invalid(self): + # Missing "begin" line + self.assertRaises(ValueError, codecs.decode, b"", "uu-codec") + # The codec system tries to wrap exceptions in order to ensure the error # mentions the operation being performed and the codec involved. 
We diff --git a/Lib/test/test_uu.py b/Lib/test/test_uu.py --- a/Lib/test/test_uu.py +++ b/Lib/test/test_uu.py @@ -93,6 +93,28 @@ except uu.Error as e: self.assertEqual(str(e), "No valid begin line found in input file") + def test_garbage_padding(self): + # Issue #22406 + encodedtext = ( + b"begin 644 file\n" + # length 1; bits 001100 111111 111111 111111 + b"\x21\x2C\x5F\x5F\x5F\n" + b"\x20\n" + b"end\n" + ) + plaintext = b"\x33" # 00110011 + + with self.subTest("uu.decode()"): + inp = io.BytesIO(encodedtext) + out = io.BytesIO() + uu.decode(inp, out, quiet=True) + self.assertEqual(out.getvalue(), plaintext) + + with self.subTest("uu_codec"): + import codecs + decoded = codecs.decode(encodedtext, "uu_codec") + self.assertEqual(decoded, plaintext) + class UUStdIOTest(unittest.TestCase): def setUp(self): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. + Based on patch by Martin Panter. + - Issue #17293: uuid.getnode() now determines MAC address on AIX using netstat. Based on patch by Aivars Kalv?ns. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 15:56:22 2014 From: python-checkins at python.org (brett.cannon) Date: Fri, 07 Nov 2014 14:56:22 +0000 Subject: [Python-checkins] =?utf-8?q?pythontestdotnet=3A_Link_to_the_hg_re?= =?utf-8?q?po_and_Salt_config?= Message-ID: <20141107145614.108375.81360@psf.io> https://hg.python.org/pythontestdotnet/rev/b51c46800184 changeset: 5:b51c46800184 user: Brett Cannon date: Fri Nov 07 09:56:11 2014 -0500 summary: Link to the hg repo and Salt config files: www/index.html | 5 +++++ 1 files changed, 5 insertions(+), 0 deletions(-) diff --git a/www/index.html b/www/index.html --- a/www/index.html +++ b/www/index.html @@ -6,5 +6,10 @@ This domain is used to host various services contacted by the Python test suite. + All content is managed through + + a Mercurial repository and its configuration is + + managed through Salt. -- Repository URL: https://hg.python.org/pythontestdotnet From python-checkins at python.org Fri Nov 7 17:29:44 2014 From: python-checkins at python.org (brett.cannon) Date: Fri, 07 Nov 2014 16:29:44 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322242=3A_Try_to_m?= =?utf-8?q?ake_some_import-related_loader_details_clearer=2E?= Message-ID: <20141107162942.731.21157@psf.io> https://hg.python.org/cpython/rev/f473063318c3 changeset: 93430:f473063318c3 parent: 93428:b18ef4a3e7c1 user: Brett Cannon date: Fri Nov 07 11:29:33 2014 -0500 summary: Issue #22242: Try to make some import-related loader details clearer. Thanks to Jon Poler for pointing this out. files: Doc/reference/import.rst | 3 ++- 1 files changed, 2 insertions(+), 1 deletions(-) diff --git a/Doc/reference/import.rst b/Doc/reference/import.rst --- a/Doc/reference/import.rst +++ b/Doc/reference/import.rst @@ -459,7 +459,8 @@ * If loading fails, the loader must remove any modules it has inserted into :data:`sys.modules`, but it must remove **only** the failing - module, and only if the loader itself has loaded it explicitly. + module(s), and only if the loader itself has loaded the module(s) + explicitly. 
Module spec ----------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 18:51:31 2014 From: python-checkins at python.org (berker.peksag) Date: Fri, 07 Nov 2014 17:51:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322808=3A_Link_to_the_correct_time_method_in_Bas?= =?utf-8?b?ZUV2ZW50TG9vcC5jYWxsX2F0KCku?= Message-ID: <20141107175130.108071.25688@psf.io> https://hg.python.org/cpython/rev/98f4bc1332c9 changeset: 93432:98f4bc1332c9 parent: 93430:f473063318c3 parent: 93431:8b1d8fcb494b user: Berker Peksag date: Fri Nov 07 19:51:37 2014 +0200 summary: Issue #22808: Link to the correct time method in BaseEventLoop.call_at(). Patch by Mark Grandi. files: Doc/library/asyncio-eventloop.rst | 3 ++- 1 files changed, 2 insertions(+), 1 deletions(-) diff --git a/Doc/library/asyncio-eventloop.rst b/Doc/library/asyncio-eventloop.rst --- a/Doc/library/asyncio-eventloop.rst +++ b/Doc/library/asyncio-eventloop.rst @@ -121,7 +121,8 @@ .. method:: BaseEventLoop.call_at(when, callback, *args) Arrange for the *callback* to be called at the given absolute timestamp - *when* (an int or float), using the same time reference as :meth:`time`. + *when* (an int or float), using the same time reference as + :meth:`BaseEventLoop.time`. This method's behavior is the same as :meth:`call_later`. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 18:51:31 2014 From: python-checkins at python.org (berker.peksag) Date: Fri, 07 Nov 2014 17:51:31 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODA4?= =?utf-8?q?=3A_Link_to_the_correct_time_method_in_BaseEventLoop=2Ecall=5Fa?= =?utf-8?b?dCgpLg==?= Message-ID: <20141107175130.108081.78582@psf.io> https://hg.python.org/cpython/rev/8b1d8fcb494b changeset: 93431:8b1d8fcb494b branch: 3.4 parent: 93427:ad89a652b4ed user: Berker Peksag date: Fri Nov 07 19:51:07 2014 +0200 summary: Issue #22808: Link to the correct time method in BaseEventLoop.call_at(). Patch by Mark Grandi. files: Doc/library/asyncio-eventloop.rst | 3 ++- 1 files changed, 2 insertions(+), 1 deletions(-) diff --git a/Doc/library/asyncio-eventloop.rst b/Doc/library/asyncio-eventloop.rst --- a/Doc/library/asyncio-eventloop.rst +++ b/Doc/library/asyncio-eventloop.rst @@ -121,7 +121,8 @@ .. method:: BaseEventLoop.call_at(when, callback, *args) Arrange for the *callback* to be called at the given absolute timestamp - *when* (an int or float), using the same time reference as :meth:`time`. + *when* (an int or float), using the same time reference as + :meth:`BaseEventLoop.time`. This method's behavior is the same as :meth:`call_later`. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 20:49:19 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 19:49:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issues_=23814253=2C_=239179=3A_Group_references_and_cond?= =?utf-8?q?itional_group_references_now?= Message-ID: <20141107194916.85210.99344@psf.io> https://hg.python.org/cpython/rev/60fccf0aad83 changeset: 93435:60fccf0aad83 parent: 93432:98f4bc1332c9 parent: 93434:9fcf4008b626 user: Serhiy Storchaka date: Fri Nov 07 21:45:17 2014 +0200 summary: Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. 
files: Lib/re.py | 5 ++- Lib/sre_parse.py | 33 ++++++++++++++++++++------- Lib/test/test_re.py | 38 ++++++++++++++++++++++++++++++++- Misc/NEWS | 3 ++ 4 files changed, 67 insertions(+), 12 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -351,10 +351,11 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: + gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), ])) - s.groups = len(p)+1 + s.closegroup(gid, p[-1]) p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -69,12 +69,14 @@ # master pattern object. keeps track of global attributes def __init__(self): self.flags = 0 - self.open = [] - self.groups = 1 self.groupdict = {} + self.subpatterns = [None] # group 0 + @property + def groups(self): + return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.groups = gid + 1 + self.subpatterns.append(None) if self.groups > MAXGROUPS: raise error("groups number is too large") if name is not None: @@ -83,12 +85,11 @@ raise error("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid - self.open.append(gid) return gid - def closegroup(self, gid): - self.open.remove(gid) + def closegroup(self, gid, p): + self.subpatterns[gid] = p def checkgroup(self, gid): - return gid < self.groups and gid not in self.open + return gid < self.groups and self.subpatterns[gid] is not None class SubPattern: # a subpattern, in intermediate form @@ -184,7 +185,21 @@ elif op in _UNITCODES: lo = lo + 1 hi = hi + 1 - elif op == SUCCESS: + elif op is GROUPREF: + i, j = self.pattern.subpatterns[av].getwidth() + lo = lo + i + hi = hi + j + elif op is GROUPREF_EXISTS: + i, j = av[1].getwidth() + if av[2] is not None: + l, h = av[2].getwidth() + i = min(i, l) + j = max(j, h) + else: + i = 0 + lo = lo + i + hi = hi + j + elif op is SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -705,7 +720,7 @@ if not sourcematch(")"): raise error("unbalanced parenthesis") if group is not None: - state.closegroup(group) + state.closegroup(group, p) subpatternappend((SUBPATTERN, (group, p))) else: while True: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -575,7 +575,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_non_consuming(self): + def test_lookahead(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -589,6 +589,42 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") + # Group reference. + self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) + self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) + # Conditional group reference. 
+ self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) + # Group used before defined. + self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) + self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) + self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) + + def test_lookbehind(self): + self.assertTrue(re.match('ab(?<=b)c', 'abc')) + self.assertIsNone(re.match('ab(?<=c)c', 'abc')) + self.assertIsNone(re.match('ab(? https://hg.python.org/cpython/rev/9fcf4008b626 changeset: 93434:9fcf4008b626 branch: 3.4 parent: 93431:8b1d8fcb494b user: Serhiy Storchaka date: Fri Nov 07 21:43:57 2014 +0200 summary: Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. files: Lib/re.py | 5 ++- Lib/sre_parse.py | 33 ++++++++++++++++++++------- Lib/test/test_re.py | 38 ++++++++++++++++++++++++++++++++- Misc/NEWS | 3 ++ 4 files changed, 67 insertions(+), 12 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -352,10 +352,11 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: + gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), ])) - s.groups = len(p)+1 + s.closegroup(gid, p[-1]) p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -66,24 +66,25 @@ # master pattern object. 
keeps track of global attributes def __init__(self): self.flags = 0 - self.open = [] - self.groups = 1 self.groupdict = {} + self.subpatterns = [None] # group 0 + @property + def groups(self): + return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.groups = gid + 1 + self.subpatterns.append(None) if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: raise error("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid - self.open.append(gid) return gid - def closegroup(self, gid): - self.open.remove(gid) + def closegroup(self, gid, p): + self.subpatterns[gid] = p def checkgroup(self, gid): - return gid < self.groups and gid not in self.open + return gid < self.groups and self.subpatterns[gid] is not None class SubPattern: # a subpattern, in intermediate form @@ -181,7 +182,21 @@ elif op in UNITCODES: lo = lo + 1 hi = hi + 1 - elif op == SUCCESS: + elif op is GROUPREF: + i, j = self.pattern.subpatterns[av].getwidth() + lo = lo + i + hi = hi + j + elif op is GROUPREF_EXISTS: + i, j = av[1].getwidth() + if av[2] is not None: + l, h = av[2].getwidth() + i = min(i, l) + j = max(j, h) + else: + i = 0 + lo = lo + i + hi = hi + j + elif op is SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -709,7 +724,7 @@ if not sourcematch(")"): raise error("unbalanced parenthesis") if group is not None: - state.closegroup(group) + state.closegroup(group, p) subpatternappend((SUBPATTERN, (group, p))) else: while 1: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -557,7 +557,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_non_consuming(self): + def test_lookahead(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -571,6 +571,42 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") + # Group reference. + self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) + self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) + # Conditional group reference. + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) + # Group used before defined. + self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) + self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) + self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) + + def test_lookbehind(self): + self.assertTrue(re.match('ab(?<=b)c', 'abc')) + self.assertIsNone(re.match('ab(?<=c)c', 'abc')) + self.assertIsNone(re.match('ab(? https://hg.python.org/cpython/rev/fac649bf2d10 changeset: 93433:fac649bf2d10 branch: 2.7 parent: 93429:7b82b58b8329 user: Serhiy Storchaka date: Fri Nov 07 21:43:45 2014 +0200 summary: Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. 
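A minimal sketch of the conditional-reference case (both branches of the conditional are a single character, so the lookbehind keeps a fixed width):

    >>> import re
    >>> # (?(2)x|b): require 'x' before this point if group 2 matched, else 'b'
    >>> bool(re.match(r'(?:(a)|(x))b(?<=(?(2)x|b))c', 'abc'))
    True
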
files: Lib/re.py | 5 ++- Lib/sre_parse.py | 33 ++++++++++++++++++++------- Lib/test/test_re.py | 38 ++++++++++++++++++++++++++++++++- Misc/NEWS | 3 ++ 4 files changed, 67 insertions(+), 12 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -312,10 +312,11 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: + gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), ])) - s.groups = len(p)+1 + s.closegroup(gid, p[-1]) p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -66,24 +66,25 @@ # master pattern object. keeps track of global attributes def __init__(self): self.flags = 0 - self.open = [] - self.groups = 1 self.groupdict = {} + self.subpatterns = [None] # group 0 + @property + def groups(self): + return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.groups = gid + 1 + self.subpatterns.append(None) if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: raise error, ("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid - self.open.append(gid) return gid - def closegroup(self, gid): - self.open.remove(gid) + def closegroup(self, gid, p): + self.subpatterns[gid] = p def checkgroup(self, gid): - return gid < self.groups and gid not in self.open + return gid < self.groups and self.subpatterns[gid] is not None class SubPattern: # a subpattern, in intermediate form @@ -178,7 +179,21 @@ elif op in UNITCODES: lo = lo + 1 hi = hi + 1 - elif op == SUCCESS: + elif op is GROUPREF: + i, j = self.pattern.subpatterns[av].getwidth() + lo = lo + i + hi = hi + j + elif op is GROUPREF_EXISTS: + i, j = av[1].getwidth() + if av[2] is not None: + l, h = av[2].getwidth() + i = min(i, l) + j = max(j, h) + else: + i = 0 + lo = lo + i + hi = hi + j + elif op is SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -657,7 +672,7 @@ if not sourcematch(")"): raise error, "unbalanced parenthesis" if group is not None: - state.closegroup(group) + state.closegroup(group, p) subpatternappend((SUBPATTERN, (group, p))) else: while 1: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -448,7 +448,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_non_consuming(self): + def test_lookahead(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -462,6 +462,42 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") + # Group reference. + self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) + self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) + # Conditional group reference. + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) + self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) + self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) + # Group used before defined. 
+ self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) + self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) + self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) + + def test_lookbehind(self): + self.assertTrue(re.match('ab(?<=b)c', 'abc')) + self.assertIsNone(re.match('ab(?<=c)c', 'abc')) + self.assertIsNone(re.match('ab(? https://hg.python.org/cpython/rev/0e2c7d774df3 changeset: 93436:0e2c7d774df3 branch: 2.7 parent: 93433:fac649bf2d10 user: Serhiy Storchaka date: Fri Nov 07 22:31:54 2014 +0200 summary: Silence the failure of test_pyclbr after adding a property in sre_parse (issue #814253). files: Lib/test/test_pyclbr.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_pyclbr.py b/Lib/test/test_pyclbr.py --- a/Lib/test/test_pyclbr.py +++ b/Lib/test/test_pyclbr.py @@ -180,7 +180,7 @@ cm('pickle') cm('aifc', ignore=('openfp',)) # set with = in module cm('Cookie') - cm('sre_parse', ignore=('dump',)) # from sre_constants import * + cm('sre_parse', ignore=('dump', 'groups')) # from sre_constants import *; property cm('pdb') cm('pydoc') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 21:37:07 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 20:37:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Silence_the_fa?= =?utf-8?q?ilure_of_test=5Fpyclbr_after_adding_a_property_in_sre=5Fparse?= Message-ID: <20141107203701.113478.34289@psf.io> https://hg.python.org/cpython/rev/246c9570a757 changeset: 93437:246c9570a757 branch: 3.4 parent: 93434:9fcf4008b626 user: Serhiy Storchaka date: Fri Nov 07 22:32:37 2014 +0200 summary: Silence the failure of test_pyclbr after adding a property in sre_parse (issue #814253). files: Lib/test/test_pyclbr.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_pyclbr.py b/Lib/test/test_pyclbr.py --- a/Lib/test/test_pyclbr.py +++ b/Lib/test/test_pyclbr.py @@ -159,7 +159,7 @@ cm('cgi', ignore=('log',)) # set with = in module cm('pickle') cm('aifc', ignore=('openfp', '_aifc_params')) # set with = in module - cm('sre_parse', ignore=('dump',)) # from sre_constants import * + cm('sre_parse', ignore=('dump', 'groups')) # from sre_constants import *; property cm('pdb') cm('pydoc') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 7 21:37:07 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 07 Nov 2014 20:37:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Silence_the_failure_of_test=5Fpyclbr_after_adding_a_prop?= =?utf-8?q?erty_in_sre=5Fparse?= Message-ID: <20141107203701.108085.59089@psf.io> https://hg.python.org/cpython/rev/b2c17681404f changeset: 93438:b2c17681404f parent: 93435:60fccf0aad83 parent: 93437:246c9570a757 user: Serhiy Storchaka date: Fri Nov 07 22:33:19 2014 +0200 summary: Silence the failure of test_pyclbr after adding a property in sre_parse (issue #814253). 
files: Lib/test/test_pyclbr.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_pyclbr.py b/Lib/test/test_pyclbr.py --- a/Lib/test/test_pyclbr.py +++ b/Lib/test/test_pyclbr.py @@ -159,7 +159,7 @@ cm('cgi', ignore=('log',)) # set with = in module cm('pickle') cm('aifc', ignore=('openfp', '_aifc_params')) # set with = in module - cm('sre_parse', ignore=('dump',)) # from sre_constants import * + cm('sre_parse', ignore=('dump', 'groups')) # from sre_constants import *; property cm('pdb') cm('pydoc') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 8 07:47:38 2014 From: python-checkins at python.org (raymond.hettinger) Date: Sat, 08 Nov 2014 06:47:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Remove_unused_?= =?utf-8?q?import?= Message-ID: <20141108064736.713.24362@psf.io> https://hg.python.org/cpython/rev/1cde2bbe841a changeset: 93439:1cde2bbe841a branch: 2.7 parent: 93436:0e2c7d774df3 user: Raymond Hettinger date: Fri Nov 07 22:47:30 2014 -0800 summary: Remove unused import files: Lib/decimal.py | 1 - 1 files changed, 0 insertions(+), 1 deletions(-) diff --git a/Lib/decimal.py b/Lib/decimal.py --- a/Lib/decimal.py +++ b/Lib/decimal.py @@ -136,7 +136,6 @@ __version__ = '1.70' # Highest version of the spec this complies with -import copy as _copy import math as _math import numbers as _numbers -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sat Nov 8 10:33:05 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sat, 08 Nov 2014 10:33:05 +0100 Subject: [Python-checkins] Daily reference leaks (b2c17681404f): sum=3 Message-ID: results for b2c17681404f on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog8Jo34A', '-x'] From python-checkins at python.org Sat Nov 8 21:40:49 2014 From: python-checkins at python.org (berker.peksag) Date: Sat, 08 Nov 2014 20:40:49 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjk1?= =?utf-8?q?=3A_Fix_rendering_of_the_deprecated-removed_role_in_HTML=2E?= Message-ID: <20141108204048.108095.70866@psf.io> https://hg.python.org/cpython/rev/9001298e3094 changeset: 93440:9001298e3094 branch: 3.4 parent: 93437:246c9570a757 user: Berker Peksag date: Sat Nov 08 22:40:22 2014 +0200 summary: Issue #22695: Fix rendering of the deprecated-removed role in HTML. files: Doc/tools/extensions/pyspecific.py | 10 ++++------ 1 files changed, 4 insertions(+), 6 deletions(-) diff --git a/Doc/tools/extensions/pyspecific.py b/Doc/tools/extensions/pyspecific.py --- a/Doc/tools/extensions/pyspecific.py +++ b/Doc/tools/extensions/pyspecific.py @@ -172,22 +172,20 @@ messages = [] if self.content: self.state.nested_parse(self.content, self.content_offset, node) + if len(node): if isinstance(node[0], nodes.paragraph) and node[0].rawsource: content = nodes.inline(node[0].rawsource, translatable=True) content.source = node[0].source content.line = node[0].line content += node[0].children node[0].replace_self(nodes.paragraph('', '', content)) - node[0].insert(0, nodes.inline('', '%s: ' % text, - classes=['versionmodified'])) + node[0].insert(0, nodes.inline('', '%s: ' % text, + classes=['versionmodified'])) else: para = nodes.paragraph('', '', nodes.inline('', '%s.' 
% text, classes=['versionmodified'])) - if len(node): - node.insert(0, para) - else: - node.append(para) + node.append(para) env = self.state.document.settings.env env.note_versionchange('deprecated', version[0], node, self.lineno) return [node] + messages -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 8 21:40:51 2014 From: python-checkins at python.org (berker.peksag) Date: Sat, 08 Nov 2014 20:40:51 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322695=3A_Fix_rendering_of_the_deprecated-remove?= =?utf-8?q?d_role_in_HTML=2E?= Message-ID: <20141108204048.108087.12693@psf.io> https://hg.python.org/cpython/rev/ec81edc30221 changeset: 93441:ec81edc30221 parent: 93438:b2c17681404f parent: 93440:9001298e3094 user: Berker Peksag date: Sat Nov 08 22:41:00 2014 +0200 summary: Issue #22695: Fix rendering of the deprecated-removed role in HTML. files: Doc/tools/extensions/pyspecific.py | 10 ++++------ 1 files changed, 4 insertions(+), 6 deletions(-) diff --git a/Doc/tools/extensions/pyspecific.py b/Doc/tools/extensions/pyspecific.py --- a/Doc/tools/extensions/pyspecific.py +++ b/Doc/tools/extensions/pyspecific.py @@ -172,22 +172,20 @@ messages = [] if self.content: self.state.nested_parse(self.content, self.content_offset, node) + if len(node): if isinstance(node[0], nodes.paragraph) and node[0].rawsource: content = nodes.inline(node[0].rawsource, translatable=True) content.source = node[0].source content.line = node[0].line content += node[0].children node[0].replace_self(nodes.paragraph('', '', content)) - node[0].insert(0, nodes.inline('', '%s: ' % text, - classes=['versionmodified'])) + node[0].insert(0, nodes.inline('', '%s: ' % text, + classes=['versionmodified'])) else: para = nodes.paragraph('', '', nodes.inline('', '%s.' % text, classes=['versionmodified'])) - if len(node): - node.insert(0, para) - else: - node.append(para) + node.append(para) env = self.state.document.settings.env env.note_versionchange('deprecated', version[0], node, self.lineno) return [node] + messages -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sun Nov 9 10:32:20 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sun, 09 Nov 2014 10:32:20 +0100 Subject: [Python-checkins] Daily reference leaks (ec81edc30221): sum=3 Message-ID: results for ec81edc30221 on branch "default" -------------------------------------------- test_collections leaked [-2, 0, 2] references, sum=0 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogXcGGjL', '-x'] From ncoghlan at gmail.com Sun Nov 9 13:44:27 2014 From: ncoghlan at gmail.com (Nick Coghlan) Date: Sun, 9 Nov 2014 22:44:27 +1000 Subject: [Python-checkins] cpython (2.7): #22650: test suite: load Unicode test data files from www.pythontest.net In-Reply-To: References: <20141106135652.108375.20457@psf.io> Message-ID: On 7 Nov 2014 02:44, "Georg Brandl" wrote: > > On 11/06/2014 03:39 PM, Brett Cannon wrote: > > What is pythontest.net ? Is it something we control, and > > if so how do we add things to it for tests? Did I miss an email on python-dev or > > python-committers about this? > > Benjamin already gave the link to the related issue. 
The idea is to make the > networking tests depend on as few external hosts as possible, so that we can > reduce spurious skips or failures when one of them is not reachable or changes > its configuration. > > The pythontest.net domain was chosen to be able to test things like cookies or > certificates without a potential of compromising python.org related services. > > There is a repository at hg.python.org/pythontestdotnet which can be used by > developers; server configuration is maintained together with other Python > services on https://github.com/python/psf-salt. Thanks for the info! Could we capture that somewhere a bit more permanent? The developer guide would probably be a good place, although it may involve creating a new subsection. Cheers, Nick. > > cheers, > Georg > > _______________________________________________ > Python-checkins mailing list > Python-checkins at python.org > https://mail.python.org/mailman/listinfo/python-checkins -------------- next part -------------- An HTML attachment was scrubbed... URL: From python-checkins at python.org Mon Nov 10 00:56:39 2014 From: python-checkins at python.org (raymond.hettinger) Date: Sun, 09 Nov 2014 23:56:39 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322823=3A_Use_set_?= =?utf-8?q?literals_instead_of_creating_a_set_from_a_list?= Message-ID: <20141109235639.108385.96711@psf.io> https://hg.python.org/cpython/rev/4480506137ed changeset: 93442:4480506137ed user: Raymond Hettinger date: Sun Nov 09 15:56:33 2014 -0800 summary: Issue #22823: Use set literals instead of creating a set from a list files: Doc/howto/logging-cookbook.rst | 2 +- Doc/library/pickle.rst | 2 +- Lib/_strptime.py | 4 ++-- Lib/asyncore.py | 6 +++--- Lib/ipaddress.py | 2 +- Lib/mailbox.py | 4 ++-- Lib/sre_compile.py | 8 ++++---- Lib/sre_parse.py | 4 ++-- Lib/statistics.py | 4 ++-- Parser/asdl.py | 3 +-- 10 files changed, 19 insertions(+), 20 deletions(-) diff --git a/Doc/howto/logging-cookbook.rst b/Doc/howto/logging-cookbook.rst --- a/Doc/howto/logging-cookbook.rst +++ b/Doc/howto/logging-cookbook.rst @@ -1680,7 +1680,7 @@ def main(): logging.basicConfig(level=logging.INFO, format='%(message)s') - logging.info(_('message 1', set_value=set([1, 2, 3]), snowman='\u2603')) + logging.info(_('message 1', set_value={1, 2, 3}, snowman='\u2603')) if __name__ == '__main__': main() diff --git a/Doc/library/pickle.rst b/Doc/library/pickle.rst --- a/Doc/library/pickle.rst +++ b/Doc/library/pickle.rst @@ -859,7 +859,7 @@ data = { 'a': [1, 2.0, 3, 4+6j], 'b': ("character string", b"byte string"), - 'c': set([None, True, False]) + 'c': {None, True, False} } with open('data.pickle', 'wb') as f: diff --git a/Lib/_strptime.py b/Lib/_strptime.py --- a/Lib/_strptime.py +++ b/Lib/_strptime.py @@ -167,9 +167,9 @@ time.tzset() except AttributeError: pass - no_saving = frozenset(["utc", "gmt", time.tzname[0].lower()]) + no_saving = frozenset({"utc", "gmt", time.tzname[0].lower()}) if time.daylight: - has_saving = frozenset([time.tzname[1].lower()]) + has_saving = frozenset({time.tzname[1].lower()}) else: has_saving = frozenset() self.timezone = (no_saving, has_saving) diff --git a/Lib/asyncore.py b/Lib/asyncore.py --- a/Lib/asyncore.py +++ b/Lib/asyncore.py @@ -57,8 +57,8 @@ ENOTCONN, ESHUTDOWN, EISCONN, EBADF, ECONNABORTED, EPIPE, EAGAIN, \ errorcode -_DISCONNECTED = frozenset((ECONNRESET, ENOTCONN, ESHUTDOWN, ECONNABORTED, EPIPE, - EBADF)) +_DISCONNECTED = frozenset({ECONNRESET, ENOTCONN, ESHUTDOWN, ECONNABORTED, EPIPE, + EBADF}) try: socket_map @@ -220,7 +220,7 @@ 
connecting = False closing = False addr = None - ignore_log_types = frozenset(['warning']) + ignore_log_types = frozenset({'warning'}) def __init__(self, sock=None, map=None): if map is None: diff --git a/Lib/ipaddress.py b/Lib/ipaddress.py --- a/Lib/ipaddress.py +++ b/Lib/ipaddress.py @@ -1088,7 +1088,7 @@ _DECIMAL_DIGITS = frozenset('0123456789') # the valid octets for host and netmasks. only useful for IPv4. - _valid_mask_octets = frozenset((255, 254, 252, 248, 240, 224, 192, 128, 0)) + _valid_mask_octets = frozenset({255, 254, 252, 248, 240, 224, 192, 128, 0}) _max_prefixlen = IPV4LENGTH # There are only a handful of valid v4 netmasks, so we cache them all diff --git a/Lib/mailbox.py b/Lib/mailbox.py --- a/Lib/mailbox.py +++ b/Lib/mailbox.py @@ -1230,8 +1230,8 @@ class Babyl(_singlefileMailbox): """An Rmail-style Babyl mailbox.""" - _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered', - 'forwarded', 'edited', 'resent')) + _special_labels = frozenset({'unseen', 'deleted', 'filed', 'answered', + 'forwarded', 'edited', 'resent'}) def __init__(self, path, factory=None, create=True): """Initialize a Babyl mailbox.""" diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -22,10 +22,10 @@ else: MAXCODE = 0xFFFFFFFF -_LITERAL_CODES = set([LITERAL, NOT_LITERAL]) -_REPEATING_CODES = set([REPEAT, MIN_REPEAT, MAX_REPEAT]) -_SUCCESS_CODES = set([SUCCESS, FAILURE]) -_ASSERT_CODES = set([ASSERT, ASSERT_NOT]) +_LITERAL_CODES = {LITERAL, NOT_LITERAL} +_REPEATING_CODES = {REPEAT, MIN_REPEAT, MAX_REPEAT} +_SUCCESS_CODES = {SUCCESS, FAILURE} +_ASSERT_CODES = {ASSERT, ASSERT_NOT} def _compile(code, pattern, flags): # internal: compile a (sub)pattern diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -25,8 +25,8 @@ WHITESPACE = frozenset(" \t\n\r\v\f") -_REPEATCODES = frozenset((MIN_REPEAT, MAX_REPEAT)) -_UNITCODES = frozenset((ANY, RANGE, IN, LITERAL, NOT_LITERAL, CATEGORY)) +_REPEATCODES = frozenset({MIN_REPEAT, MAX_REPEAT}) +_UNITCODES = frozenset({ANY, RANGE, IN, LITERAL, NOT_LITERAL, CATEGORY}) ESCAPES = { r"\a": (LITERAL, ord("\a")), diff --git a/Lib/statistics.py b/Lib/statistics.py --- a/Lib/statistics.py +++ b/Lib/statistics.py @@ -150,7 +150,7 @@ # We fail as soon as we reach a value that is not an int or the type of # the first value which is not an int. E.g. _sum([int, int, float, int]) # is okay, but sum([int, int, float, Fraction]) is not. - allowed_types = set([int, type(start)]) + allowed_types = {int, type(start)} n, d = _exact_ratio(start) partials = {d: n} # map {denominator: sum of numerators} # Micro-optimizations. @@ -168,7 +168,7 @@ assert allowed_types.pop() is int T = int else: - T = (allowed_types - set([int])).pop() + T = (allowed_types - {int}).pop() if None in partials: assert issubclass(T, (float, Decimal)) assert not math.isfinite(partials[None]) diff --git a/Parser/asdl.py b/Parser/asdl.py --- a/Parser/asdl.py +++ b/Parser/asdl.py @@ -33,8 +33,7 @@ # See the EBNF at the top of the file to understand the logical connection # between the various node types. 
-builtin_types = set( - ['identifier', 'string', 'bytes', 'int', 'object', 'singleton']) +builtin_types = {'identifier', 'string', 'bytes', 'int', 'object', 'singleton'} class AST: def __repr__(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:10:32 2014 From: python-checkins at python.org (raymond.hettinger) Date: Mon, 10 Nov 2014 01:10:32 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgMjI4MzA6?= =?utf-8?q?__Clarify_docs_for_functools=2Ecmp=5Fto=5Fkey=28=29=2E?= Message-ID: <20141110011027.108377.83502@psf.io> https://hg.python.org/cpython/rev/dbe1744ec62e changeset: 93443:dbe1744ec62e branch: 2.7 parent: 93439:1cde2bbe841a user: Raymond Hettinger date: Sun Nov 09 17:10:17 2014 -0800 summary: Issue 22830: Clarify docs for functools.cmp_to_key(). files: Doc/library/functools.rst | 11 +++++++---- 1 files changed, 7 insertions(+), 4 deletions(-) diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -22,8 +22,8 @@ .. function:: cmp_to_key(func) - Transform an old-style comparison function to a key function. Used with - tools that accept key functions (such as :func:`sorted`, :func:`min`, + Transform an old-style comparison function to a :term:`key function`. Used + with tools that accept key functions (such as :func:`sorted`, :func:`min`, :func:`max`, :func:`heapq.nlargest`, :func:`heapq.nsmallest`, :func:`itertools.groupby`). This function is primarily used as a transition tool for programs being converted to Python 3 where comparison functions are @@ -32,13 +32,16 @@ A comparison function is any callable that accept two arguments, compares them, and returns a negative number for less-than, zero for equality, or a positive number for greater-than. A key function is a callable that accepts one - argument and returns another value that indicates the position in the desired - collation sequence. + argument and returns another value to be used as the sort key. Example:: sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order + For sorting examples and a brief sorting tutorial, see `Sorting HowTo + `_\. + + .. versionadded:: 2.7 .. function:: total_ordering(cls) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:21:33 2014 From: python-checkins at python.org (raymond.hettinger) Date: Mon, 10 Nov 2014 01:21:33 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgMjI4MzA6?= =?utf-8?q?__Clarify_docs_for_functools=2Ecmp=5Fto=5Fkey=28=29=2E?= Message-ID: <20141110012129.108101.79727@psf.io> https://hg.python.org/cpython/rev/63274cf1b40d changeset: 93444:63274cf1b40d branch: 3.4 parent: 93440:9001298e3094 user: Raymond Hettinger date: Sun Nov 09 17:20:56 2014 -0800 summary: Issue 22830: Clarify docs for functools.cmp_to_key(). files: Doc/library/functools.rst | 9 +++++---- 1 files changed, 5 insertions(+), 4 deletions(-) diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -21,8 +21,8 @@ .. function:: cmp_to_key(func) - Transform an old-style comparison function to a key function. Used with - tools that accept key functions (such as :func:`sorted`, :func:`min`, + Transform an old-style comparison function to a :term:`key function`. 
Used + with tools that accept key functions (such as :func:`sorted`, :func:`min`, :func:`max`, :func:`heapq.nlargest`, :func:`heapq.nsmallest`, :func:`itertools.groupby`). This function is primarily used as a transition tool for programs being converted from Python 2 which supported the use of @@ -31,13 +31,14 @@ A comparison function is any callable that accept two arguments, compares them, and returns a negative number for less-than, zero for equality, or a positive number for greater-than. A key function is a callable that accepts one - argument and returns another value indicating the position in the desired - collation sequence. + argument and returns another value to be used as the sort key. Example:: sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. + .. versionadded:: 3.2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:21:33 2014 From: python-checkins at python.org (raymond.hettinger) Date: Mon, 10 Nov 2014 01:21:33 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_merge?= Message-ID: <20141110012129.113464.72926@psf.io> https://hg.python.org/cpython/rev/0c34a2532e31 changeset: 93445:0c34a2532e31 parent: 93442:4480506137ed parent: 93444:63274cf1b40d user: Raymond Hettinger date: Sun Nov 09 17:21:20 2014 -0800 summary: merge files: Doc/library/functools.rst | 9 +++++---- 1 files changed, 5 insertions(+), 4 deletions(-) diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -21,8 +21,8 @@ .. function:: cmp_to_key(func) - Transform an old-style comparison function to a key function. Used with - tools that accept key functions (such as :func:`sorted`, :func:`min`, + Transform an old-style comparison function to a :term:`key function`. Used + with tools that accept key functions (such as :func:`sorted`, :func:`min`, :func:`max`, :func:`heapq.nlargest`, :func:`heapq.nsmallest`, :func:`itertools.groupby`). This function is primarily used as a transition tool for programs being converted from Python 2 which supported the use of @@ -31,13 +31,14 @@ A comparison function is any callable that accept two arguments, compares them, and returns a negative number for less-than, zero for equality, or a positive number for greater-than. A key function is a callable that accepts one - argument and returns another value indicating the position in the desired - collation sequence. + argument and returns another value to be used as the sort key. Example:: sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. + .. 
versionadded:: 3.2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:23:00 2014 From: python-checkins at python.org (brett.cannon) Date: Mon, 10 Nov 2014 01:23:00 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_default_-=3E_default?= =?utf-8?q?=29=3A_Merge_with_default?= Message-ID: <20141110012300.108395.24581@psf.io> https://hg.python.org/cpython/rev/55b89e5f9c37 changeset: 93447:55b89e5f9c37 parent: 93446:6e6532d313a1 parent: 93445:0c34a2532e31 user: Brett Cannon date: Sun Nov 09 20:22:53 2014 -0500 summary: Merge with default files: Doc/library/functools.rst | 9 +++++---- 1 files changed, 5 insertions(+), 4 deletions(-) diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -21,8 +21,8 @@ .. function:: cmp_to_key(func) - Transform an old-style comparison function to a key function. Used with - tools that accept key functions (such as :func:`sorted`, :func:`min`, + Transform an old-style comparison function to a :term:`key function`. Used + with tools that accept key functions (such as :func:`sorted`, :func:`min`, :func:`max`, :func:`heapq.nlargest`, :func:`heapq.nsmallest`, :func:`itertools.groupby`). This function is primarily used as a transition tool for programs being converted from Python 2 which supported the use of @@ -31,13 +31,14 @@ A comparison function is any callable that accept two arguments, compares them, and returns a negative number for less-than, zero for equality, or a positive number for greater-than. A key function is a callable that accepts one - argument and returns another value indicating the position in the desired - collation sequence. + argument and returns another value to be used as the sort key. Example:: sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. + .. versionadded:: 3.2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:23:00 2014 From: python-checkins at python.org (brett.cannon) Date: Mon, 10 Nov 2014 01:23:00 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_20152=2C_22821=3A_Po?= =?utf-8?q?rt_the_fcntl_module_to_Argument_Clinic=2E?= Message-ID: <20141110012300.108381.39051@psf.io> https://hg.python.org/cpython/rev/6e6532d313a1 changeset: 93446:6e6532d313a1 parent: 93442:4480506137ed user: Brett Cannon date: Sun Nov 09 20:22:01 2014 -0500 summary: Issue 20152, 22821: Port the fcntl module to Argument Clinic. Along the way, fix an argumrnt to fcntl.fcntl to be an int instead of a long. Thanks to Serhiy Storchaka for reviewing my Clinic patch and for writing the patch to fix the long/int issue. files: Modules/clinic/fcntlmodule.c.h | 188 +++++++++ Modules/fcntlmodule.c | 432 ++++++++++---------- 2 files changed, 413 insertions(+), 207 deletions(-) diff --git a/Modules/clinic/fcntlmodule.c.h b/Modules/clinic/fcntlmodule.c.h new file mode 100644 --- /dev/null +++ b/Modules/clinic/fcntlmodule.c.h @@ -0,0 +1,188 @@ +/*[clinic input] +preserve +[clinic start generated code]*/ + +PyDoc_STRVAR(fcntl_fcntl__doc__, +"fcntl($module, fd, code, arg=None, /)\n" +"--\n" +"\n" +"Perform the operation `code` on file descriptor fd.\n" +"\n" +"The values used for `code` are operating system dependent, and are available\n" +"as constants in the fcntl module, using the same names as used in\n" +"the relevant C header files. 
The argument arg is optional, and\n" +"defaults to 0; it may be an int or a string. If arg is given as a string,\n" +"the return value of fcntl is a string of that length, containing the\n" +"resulting value put in the arg buffer by the operating system. The length\n" +"of the arg string is not allowed to exceed 1024 bytes. If the arg given\n" +"is an integer or if none is specified, the result value is an integer\n" +"corresponding to the return value of the fcntl call in the C code."); + +#define FCNTL_FCNTL_METHODDEF \ + {"fcntl", (PyCFunction)fcntl_fcntl, METH_VARARGS, fcntl_fcntl__doc__}, + +static PyObject * +fcntl_fcntl_impl(PyModuleDef *module, int fd, int code, PyObject *arg); + +static PyObject * +fcntl_fcntl(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + PyObject *arg = NULL; + + if (!PyArg_ParseTuple(args, + "O&i|O:fcntl", + conv_descriptor, &fd, &code, &arg)) + goto exit; + return_value = fcntl_fcntl_impl(module, fd, code, arg); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_ioctl__doc__, +"ioctl($module, fd, op, arg=None, mutate_flag=True, /)\n" +"--\n" +"\n" +"Perform the operation op on file descriptor fd.\n" +"\n" +"The values used for op are operating system dependent, and are available as\n" +"constants in the fcntl or termios library modules, using the same names as\n" +"used in the relevant C header files.\n" +"\n" +"The argument `arg` is optional, and defaults to 0; it may be an int or a\n" +"buffer containing character data (most likely a string or an array).\n" +"\n" +"If the argument is a mutable buffer (such as an array) and if the\n" +"mutate_flag argument (which is only allowed in this case) is true then the\n" +"buffer is (in effect) passed to the operating system and changes made by\n" +"the OS will be reflected in the contents of the buffer after the call has\n" +"returned. The return value is the integer returned by the ioctl system\n" +"call.\n" +"\n" +"If the argument is a mutable buffer and the mutable_flag argument is not\n" +"passed or is false, the behavior is as if a string had been passed. This\n" +"behavior will change in future releases of Python.\n" +"\n" +"If the argument is an immutable buffer (most likely a string) then a copy\n" +"of the buffer is passed to the operating system and the return value is a\n" +"string of the same length containing whatever the operating system put in\n" +"the buffer. 
The length of the arg buffer in this case is not allowed to\n" +"exceed 1024 bytes.\n" +"\n" +"If the arg given is an integer or if none is specified, the result value is\n" +"an integer corresponding to the return value of the ioctl call in the C\n" +"code."); + +#define FCNTL_IOCTL_METHODDEF \ + {"ioctl", (PyCFunction)fcntl_ioctl, METH_VARARGS, fcntl_ioctl__doc__}, + +static PyObject * +fcntl_ioctl_impl(PyModuleDef *module, int fd, unsigned int code, PyObject *ob_arg, int mutate_arg); + +static PyObject * +fcntl_ioctl(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + unsigned int code; + PyObject *ob_arg = NULL; + int mutate_arg = 1; + + if (!PyArg_ParseTuple(args, + "O&I|Op:ioctl", + conv_descriptor, &fd, &code, &ob_arg, &mutate_arg)) + goto exit; + return_value = fcntl_ioctl_impl(module, fd, code, ob_arg, mutate_arg); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_flock__doc__, +"flock($module, fd, code, /)\n" +"--\n" +"\n" +"Perform the lock operation op on file descriptor fd.\n" +"\n" +"See the Unix manual page for flock(2) for details (On some systems, this\n" +"function is emulated using fcntl())."); + +#define FCNTL_FLOCK_METHODDEF \ + {"flock", (PyCFunction)fcntl_flock, METH_VARARGS, fcntl_flock__doc__}, + +static PyObject * +fcntl_flock_impl(PyModuleDef *module, int fd, int code); + +static PyObject * +fcntl_flock(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + + if (!PyArg_ParseTuple(args, + "O&i:flock", + conv_descriptor, &fd, &code)) + goto exit; + return_value = fcntl_flock_impl(module, fd, code); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_lockf__doc__, +"lockf($module, fd, code, lenobj=None, startobj=None, whence=0, /)\n" +"--\n" +"\n" +"A wrapper around the fcntl() locking calls.\n" +"\n" +"fd is the file descriptor of the file to lock or unlock, and operation is one\n" +"of the following values:\n" +"\n" +" LOCK_UN - unlock\n" +" LOCK_SH - acquire a shared lock\n" +" LOCK_EX - acquire an exclusive lock\n" +"\n" +"When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with\n" +"LOCK_NB to avoid blocking on lock acquisition. If LOCK_NB is used and the\n" +"lock cannot be acquired, an IOError will be raised and the exception will\n" +"have an errno attribute set to EACCES or EAGAIN (depending on the operating\n" +"system -- for portability, check for either value).\n" +"\n" +"length is the number of bytes to lock, with the default meaning to lock to\n" +"EOF. start is the byte offset, relative to whence, to that the lock\n" +"starts. 
whence is as with fileobj.seek(), specifically:\n" +"\n" +" 0 - relative to the start of the file (SEEK_SET)\n" +" 1 - relative to the current buffer position (SEEK_CUR)\n" +" 2 - relative to the end of the file (SEEK_END)"); + +#define FCNTL_LOCKF_METHODDEF \ + {"lockf", (PyCFunction)fcntl_lockf, METH_VARARGS, fcntl_lockf__doc__}, + +static PyObject * +fcntl_lockf_impl(PyModuleDef *module, int fd, int code, PyObject *lenobj, PyObject *startobj, int whence); + +static PyObject * +fcntl_lockf(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + PyObject *lenobj = NULL; + PyObject *startobj = NULL; + int whence = 0; + + if (!PyArg_ParseTuple(args, + "O&i|OOi:lockf", + conv_descriptor, &fd, &code, &lenobj, &startobj, &whence)) + goto exit; + return_value = fcntl_lockf_impl(module, fd, code, lenobj, startobj, whence); + +exit: + return return_value; +} +/*[clinic end generated code: output=84bdde73a92f7c61 input=a9049054013a1b77]*/ diff --git a/Modules/fcntlmodule.c b/Modules/fcntlmodule.c --- a/Modules/fcntlmodule.c +++ b/Modules/fcntlmodule.c @@ -15,6 +15,12 @@ #include #endif +/*[clinic input] +output preset file +module fcntl +[clinic start generated code]*/ +/*[clinic end generated code: output=da39a3ee5e6b4b0d input=c7356fdb126a904a]*/ + static int conv_descriptor(PyObject *object, int *target) { @@ -26,48 +32,72 @@ return 1; } +/* Must come after conv_descriptor definition. */ +#include "clinic/fcntlmodule.c.h" -/* fcntl(fd, op, [arg]) */ +/*[clinic input] +fcntl.fcntl + + fd: object(type='int', converter='conv_descriptor') + code: int + arg: object = NULL + / + +Perform the operation `code` on file descriptor fd. + +The values used for `code` are operating system dependent, and are available +as constants in the fcntl module, using the same names as used in +the relevant C header files. The argument arg is optional, and +defaults to 0; it may be an int or a string. If arg is given as a string, +the return value of fcntl is a string of that length, containing the +resulting value put in the arg buffer by the operating system. The length +of the arg string is not allowed to exceed 1024 bytes. If the arg given +is an integer or if none is specified, the result value is an integer +corresponding to the return value of the fcntl call in the C code. 
+[clinic start generated code]*/ static PyObject * -fcntl_fcntl(PyObject *self, PyObject *args) +fcntl_fcntl_impl(PyModuleDef *module, int fd, int code, PyObject *arg) +/*[clinic end generated code: output=afc5bfa74a03ef0d input=4850c13a41e86930]*/ { - int fd; - int code; - long arg; + int int_arg = 0; int ret; char *str; Py_ssize_t len; char buf[1024]; - if (PyArg_ParseTuple(args, "O&is#:fcntl", - conv_descriptor, &fd, &code, &str, &len)) { - if ((size_t)len > sizeof buf) { - PyErr_SetString(PyExc_ValueError, - "fcntl string arg too long"); - return NULL; + if (arg != NULL) { + int parse_result; + + if (PyArg_Parse(arg, "s#", &str, &len)) { + if ((size_t)len > sizeof buf) { + PyErr_SetString(PyExc_ValueError, + "fcntl string arg too long"); + return NULL; + } + memcpy(buf, str, len); + Py_BEGIN_ALLOW_THREADS + ret = fcntl(fd, code, buf); + Py_END_ALLOW_THREADS + if (ret < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + return PyBytes_FromStringAndSize(buf, len); } - memcpy(buf, str, len); - Py_BEGIN_ALLOW_THREADS - ret = fcntl(fd, code, buf); - Py_END_ALLOW_THREADS - if (ret < 0) { - PyErr_SetFromErrno(PyExc_IOError); - return NULL; + + PyErr_Clear(); + parse_result = PyArg_Parse(arg, + "l;fcntl requires a file or file descriptor," + " an integer and optionally a third integer or a string", + &int_arg); + if (!parse_result) { + return NULL; } - return PyBytes_FromStringAndSize(buf, len); } - PyErr_Clear(); - arg = 0; - if (!PyArg_ParseTuple(args, - "O&i|l;fcntl requires a file or file descriptor," - " an integer and optionally a third integer or a string", - conv_descriptor, &fd, &code, &arg)) { - return NULL; - } Py_BEGIN_ALLOW_THREADS - ret = fcntl(fd, code, arg); + ret = fcntl(fd, code, int_arg); Py_END_ALLOW_THREADS if (ret < 0) { PyErr_SetFromErrno(PyExc_IOError); @@ -76,29 +106,53 @@ return PyLong_FromLong((long)ret); } -PyDoc_STRVAR(fcntl_doc, -"fcntl(fd, op, [arg])\n\ -\n\ -Perform the operation op on file descriptor fd. The values used\n\ -for op are operating system dependent, and are available\n\ -as constants in the fcntl module, using the same names as used in\n\ -the relevant C header files. The argument arg is optional, and\n\ -defaults to 0; it may be an int or a string. If arg is given as a string,\n\ -the return value of fcntl is a string of that length, containing the\n\ -resulting value put in the arg buffer by the operating system. The length\n\ -of the arg string is not allowed to exceed 1024 bytes. If the arg given\n\ -is an integer or if none is specified, the result value is an integer\n\ -corresponding to the return value of the fcntl call in the C code."); +/*[clinic input] +fcntl.ioctl -/* ioctl(fd, op, [arg]) */ + fd: object(type='int', converter='conv_descriptor') + op as code: unsigned_int(bitwise=True) + arg as ob_arg: object = NULL + mutate_flag as mutate_arg: bool = True + / + +Perform the operation op on file descriptor fd. + +The values used for op are operating system dependent, and are available as +constants in the fcntl or termios library modules, using the same names as +used in the relevant C header files. + +The argument `arg` is optional, and defaults to 0; it may be an int or a +buffer containing character data (most likely a string or an array). 
+ +If the argument is a mutable buffer (such as an array) and if the +mutate_flag argument (which is only allowed in this case) is true then the +buffer is (in effect) passed to the operating system and changes made by +the OS will be reflected in the contents of the buffer after the call has +returned. The return value is the integer returned by the ioctl system +call. + +If the argument is a mutable buffer and the mutable_flag argument is not +passed or is false, the behavior is as if a string had been passed. This +behavior will change in future releases of Python. + +If the argument is an immutable buffer (most likely a string) then a copy +of the buffer is passed to the operating system and the return value is a +string of the same length containing whatever the operating system put in +the buffer. The length of the arg buffer in this case is not allowed to +exceed 1024 bytes. + +If the arg given is an integer or if none is specified, the result value is +an integer corresponding to the return value of the ioctl call in the C +code. +[clinic start generated code]*/ static PyObject * -fcntl_ioctl(PyObject *self, PyObject *args) +fcntl_ioctl_impl(PyModuleDef *module, int fd, unsigned int code, PyObject *ob_arg, int mutate_arg) +/*[clinic end generated code: output=ad47738c118622bf input=a55a6ee8e494c449]*/ { #define IOCTL_BUFSZ 1024 - int fd; - /* In PyArg_ParseTuple below, we use the unsigned non-checked 'I' + /* We use the unsigned non-checked 'I' format for the 'code' parameter because Python turns 0x8000000 into either a large positive number (PyLong or PyInt on 64-bit platforms) or a negative number on others (32-bit PyInt) @@ -111,101 +165,98 @@ in their unsigned long ioctl codes this will break and need special casing based on the platform being built on. 
*/ - unsigned int code; - int arg; + int arg = 0; int ret; Py_buffer pstr; char *str; Py_ssize_t len; - int mutate_arg = 1; char buf[IOCTL_BUFSZ+1]; /* argument plus NUL byte */ - if (PyArg_ParseTuple(args, "O&Iw*|i:ioctl", - conv_descriptor, &fd, &code, - &pstr, &mutate_arg)) { - char *arg; - str = pstr.buf; - len = pstr.len; + if (ob_arg != NULL) { + if (PyArg_Parse(ob_arg, "w*:ioctl", &pstr)) { + char *arg; + str = pstr.buf; + len = pstr.len; - if (mutate_arg) { - if (len <= IOCTL_BUFSZ) { - memcpy(buf, str, len); - buf[len] = '\0'; - arg = buf; + if (mutate_arg) { + if (len <= IOCTL_BUFSZ) { + memcpy(buf, str, len); + buf[len] = '\0'; + arg = buf; + } + else { + arg = str; + } } else { - arg = str; + if (len > IOCTL_BUFSZ) { + PyBuffer_Release(&pstr); + PyErr_SetString(PyExc_ValueError, + "ioctl string arg too long"); + return NULL; + } + else { + memcpy(buf, str, len); + buf[len] = '\0'; + arg = buf; + } + } + if (buf == arg) { + Py_BEGIN_ALLOW_THREADS /* think array.resize() */ + ret = ioctl(fd, code, arg); + Py_END_ALLOW_THREADS + } + else { + ret = ioctl(fd, code, arg); + } + if (mutate_arg && (len <= IOCTL_BUFSZ)) { + memcpy(str, buf, len); + } + PyBuffer_Release(&pstr); /* No further access to str below this point */ + if (ret < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + if (mutate_arg) { + return PyLong_FromLong(ret); + } + else { + return PyBytes_FromStringAndSize(buf, len); } } - else { + + PyErr_Clear(); + if (PyArg_Parse(ob_arg, "s*:ioctl", &pstr)) { + str = pstr.buf; + len = pstr.len; if (len > IOCTL_BUFSZ) { PyBuffer_Release(&pstr); PyErr_SetString(PyExc_ValueError, - "ioctl string arg too long"); + "ioctl string arg too long"); return NULL; } - else { - memcpy(buf, str, len); - buf[len] = '\0'; - arg = buf; + memcpy(buf, str, len); + buf[len] = '\0'; + Py_BEGIN_ALLOW_THREADS + ret = ioctl(fd, code, buf); + Py_END_ALLOW_THREADS + if (ret < 0) { + PyBuffer_Release(&pstr); + PyErr_SetFromErrno(PyExc_IOError); + return NULL; } - } - if (buf == arg) { - Py_BEGIN_ALLOW_THREADS /* think array.resize() */ - ret = ioctl(fd, code, arg); - Py_END_ALLOW_THREADS - } - else { - ret = ioctl(fd, code, arg); - } - if (mutate_arg && (len <= IOCTL_BUFSZ)) { - memcpy(str, buf, len); - } - PyBuffer_Release(&pstr); /* No further access to str below this point */ - if (ret < 0) { - PyErr_SetFromErrno(PyExc_IOError); - return NULL; - } - if (mutate_arg) { - return PyLong_FromLong(ret); - } - else { + PyBuffer_Release(&pstr); return PyBytes_FromStringAndSize(buf, len); } - } - PyErr_Clear(); - if (PyArg_ParseTuple(args, "O&Is*:ioctl", - conv_descriptor, &fd, &code, &pstr)) { - str = pstr.buf; - len = pstr.len; - if (len > IOCTL_BUFSZ) { - PyBuffer_Release(&pstr); - PyErr_SetString(PyExc_ValueError, - "ioctl string arg too long"); - return NULL; + PyErr_Clear(); + if (!PyArg_Parse(ob_arg, + "i;ioctl requires a file or file descriptor," + " an integer and optionally an integer or buffer argument", + &arg)) { + return NULL; } - memcpy(buf, str, len); - buf[len] = '\0'; - Py_BEGIN_ALLOW_THREADS - ret = ioctl(fd, code, buf); - Py_END_ALLOW_THREADS - if (ret < 0) { - PyBuffer_Release(&pstr); - PyErr_SetFromErrno(PyExc_IOError); - return NULL; - } - PyBuffer_Release(&pstr); - return PyBytes_FromStringAndSize(buf, len); - } - - PyErr_Clear(); - arg = 0; - if (!PyArg_ParseTuple(args, - "O&I|i;ioctl requires a file or file descriptor," - " an integer and optionally an integer or buffer argument", - conv_descriptor, &fd, &code, &arg)) { - return NULL; + // Fall-through to outside the 
'if' statement. } Py_BEGIN_ALLOW_THREADS ret = ioctl(fd, code, arg); @@ -218,52 +269,25 @@ #undef IOCTL_BUFSZ } -PyDoc_STRVAR(ioctl_doc, -"ioctl(fd, op[, arg[, mutate_flag]])\n\ -\n\ -Perform the operation op on file descriptor fd. The values used for op\n\ -are operating system dependent, and are available as constants in the\n\ -fcntl or termios library modules, using the same names as used in the\n\ -relevant C header files.\n\ -\n\ -The argument arg is optional, and defaults to 0; it may be an int or a\n\ -buffer containing character data (most likely a string or an array). \n\ -\n\ -If the argument is a mutable buffer (such as an array) and if the\n\ -mutate_flag argument (which is only allowed in this case) is true then the\n\ -buffer is (in effect) passed to the operating system and changes made by\n\ -the OS will be reflected in the contents of the buffer after the call has\n\ -returned. The return value is the integer returned by the ioctl system\n\ -call.\n\ -\n\ -If the argument is a mutable buffer and the mutable_flag argument is not\n\ -passed or is false, the behavior is as if a string had been passed. This\n\ -behavior will change in future releases of Python.\n\ -\n\ -If the argument is an immutable buffer (most likely a string) then a copy\n\ -of the buffer is passed to the operating system and the return value is a\n\ -string of the same length containing whatever the operating system put in\n\ -the buffer. The length of the arg buffer in this case is not allowed to\n\ -exceed 1024 bytes.\n\ -\n\ -If the arg given is an integer or if none is specified, the result value is\n\ -an integer corresponding to the return value of the ioctl call in the C\n\ -code."); +/*[clinic input] +fcntl.flock + fd: object(type='int', converter='conv_descriptor') + code: int + / -/* flock(fd, operation) */ +Perform the lock operation op on file descriptor fd. + +See the Unix manual page for flock(2) for details (On some systems, this +function is emulated using fcntl()). +[clinic start generated code]*/ static PyObject * -fcntl_flock(PyObject *self, PyObject *args) +fcntl_flock_impl(PyModuleDef *module, int fd, int code) +/*[clinic end generated code: output=c9035133a7dbfc96 input=b762aa9448d05e43]*/ { - int fd; - int code; int ret; - if (!PyArg_ParseTuple(args, "O&i:flock", - conv_descriptor, &fd, &code)) - return NULL; - #ifdef HAVE_FLOCK Py_BEGIN_ALLOW_THREADS ret = flock(fd, code); @@ -299,29 +323,49 @@ PyErr_SetFromErrno(PyExc_IOError); return NULL; } - Py_INCREF(Py_None); - return Py_None; + Py_RETURN_NONE; } -PyDoc_STRVAR(flock_doc, -"flock(fd, operation)\n\ -\n\ -Perform the lock operation op on file descriptor fd. See the Unix \n\ -manual page for flock(2) for details. (On some systems, this function is\n\ -emulated using fcntl().)"); +/*[clinic input] +fcntl.lockf -/* lockf(fd, operation) */ + fd: object(type='int', converter='conv_descriptor') + code: int + lenobj: object = NULL + startobj: object = NULL + whence: int = 0 + / + +A wrapper around the fcntl() locking calls. + +fd is the file descriptor of the file to lock or unlock, and operation is one +of the following values: + + LOCK_UN - unlock + LOCK_SH - acquire a shared lock + LOCK_EX - acquire an exclusive lock + +When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with +LOCK_NB to avoid blocking on lock acquisition. 
If LOCK_NB is used and the +lock cannot be acquired, an IOError will be raised and the exception will +have an errno attribute set to EACCES or EAGAIN (depending on the operating +system -- for portability, check for either value). + +length is the number of bytes to lock, with the default meaning to lock to +EOF. start is the byte offset, relative to whence, to that the lock +starts. whence is as with fileobj.seek(), specifically: + + 0 - relative to the start of the file (SEEK_SET) + 1 - relative to the current buffer position (SEEK_CUR) + 2 - relative to the end of the file (SEEK_END) +[clinic start generated code]*/ + static PyObject * -fcntl_lockf(PyObject *self, PyObject *args) +fcntl_lockf_impl(PyModuleDef *module, int fd, int code, PyObject *lenobj, PyObject *startobj, int whence) +/*[clinic end generated code: output=5536df2892bf3ce9 input=44856fa06db36184]*/ { - int fd, code, ret, whence = 0; - PyObject *lenobj = NULL, *startobj = NULL; - - if (!PyArg_ParseTuple(args, "O&i|OOi:lockf", - conv_descriptor, &fd, &code, - &lenobj, &startobj, &whence)) - return NULL; + int ret; #ifndef LOCK_SH #define LOCK_SH 1 /* shared lock */ @@ -374,43 +418,17 @@ PyErr_SetFromErrno(PyExc_IOError); return NULL; } - Py_INCREF(Py_None); - return Py_None; + Py_RETURN_NONE; } -PyDoc_STRVAR(lockf_doc, -"lockf (fd, operation, length=0, start=0, whence=0)\n\ -\n\ -This is essentially a wrapper around the fcntl() locking calls. fd is the\n\ -file descriptor of the file to lock or unlock, and operation is one of the\n\ -following values:\n\ -\n\ - LOCK_UN - unlock\n\ - LOCK_SH - acquire a shared lock\n\ - LOCK_EX - acquire an exclusive lock\n\ -\n\ -When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with\n\ -LOCK_NB to avoid blocking on lock acquisition. If LOCK_NB is used and the\n\ -lock cannot be acquired, an IOError will be raised and the exception will\n\ -have an errno attribute set to EACCES or EAGAIN (depending on the operating\n\ -system -- for portability, check for either value).\n\ -\n\ -length is the number of bytes to lock, with the default meaning to lock to\n\ -EOF. start is the byte offset, relative to whence, to that the lock\n\ -starts. 
whence is as with fileobj.seek(), specifically:\n\ -\n\ - 0 - relative to the start of the file (SEEK_SET)\n\ - 1 - relative to the current buffer position (SEEK_CUR)\n\ - 2 - relative to the end of the file (SEEK_END)"); - /* List of functions */ static PyMethodDef fcntl_methods[] = { - {"fcntl", fcntl_fcntl, METH_VARARGS, fcntl_doc}, - {"ioctl", fcntl_ioctl, METH_VARARGS, ioctl_doc}, - {"flock", fcntl_flock, METH_VARARGS, flock_doc}, - {"lockf", fcntl_lockf, METH_VARARGS, lockf_doc}, - {NULL, NULL} /* sentinel */ + FCNTL_FCNTL_METHODDEF + FCNTL_IOCTL_METHODDEF + FCNTL_FLOCK_METHODDEF + FCNTL_LOCKF_METHODDEF + {NULL, NULL} /* sentinel */ }; -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 02:25:52 2014 From: python-checkins at python.org (raymond.hettinger) Date: Mon, 10 Nov 2014 01:25:52 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Use_internal_l?= =?utf-8?q?inks_where_possible?= Message-ID: <20141110012551.85212.96118@psf.io> https://hg.python.org/cpython/rev/3a8e0a5359cf changeset: 93448:3a8e0a5359cf branch: 2.7 parent: 93443:dbe1744ec62e user: Raymond Hettinger date: Sun Nov 09 17:25:42 2014 -0800 summary: Use internal links where possible files: Doc/library/functions.rst | 3 +-- Doc/library/functools.rst | 3 +-- 2 files changed, 2 insertions(+), 4 deletions(-) diff --git a/Doc/library/functions.rst b/Doc/library/functions.rst --- a/Doc/library/functions.rst +++ b/Doc/library/functions.rst @@ -1326,8 +1326,7 @@ compare equal --- this is helpful for sorting in multiple passes (for example, sort by department, then by salary grade). - For sorting examples and a brief sorting tutorial, see `Sorting HowTo - `_\. + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. .. versionadded:: 2.4 diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -38,8 +38,7 @@ sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order - For sorting examples and a brief sorting tutorial, see `Sorting HowTo - `_\. + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. .. versionadded:: 2.7 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 07:30:42 2014 From: python-checkins at python.org (raymond.hettinger) Date: Mon, 10 Nov 2014 06:30:42 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322824=3A__Updated?= =?utf-8?q?_reprlib_output_format_for_sets_to_use_set_literals=2E?= Message-ID: <20141110063042.108083.25450@psf.io> https://hg.python.org/cpython/rev/147fda13bec8 changeset: 93449:147fda13bec8 parent: 93447:55b89e5f9c37 user: Raymond Hettinger date: Sun Nov 09 22:30:36 2014 -0800 summary: Issue #22824: Updated reprlib output format for sets to use set literals. files: Doc/tutorial/stdlib2.rst | 2 +- Lib/reprlib.py | 8 +++- Lib/test/test_reprlib.py | 44 ++++++++++++++++----------- Misc/NEWS | 3 + 4 files changed, 36 insertions(+), 21 deletions(-) diff --git a/Doc/tutorial/stdlib2.rst b/Doc/tutorial/stdlib2.rst --- a/Doc/tutorial/stdlib2.rst +++ b/Doc/tutorial/stdlib2.rst @@ -18,7 +18,7 @@ >>> import reprlib >>> reprlib.repr(set('supercalifragilisticexpialidocious')) - "set(['a', 'c', 'd', 'e', 'f', 'g', ...])" + "{'a', 'c', 'd', 'e', 'f', 'g', ...}" The :mod:`pprint` module offers more sophisticated control over printing both built-in and user defined objects in a way that is readable by the interpreter. 
diff --git a/Lib/reprlib.py b/Lib/reprlib.py --- a/Lib/reprlib.py +++ b/Lib/reprlib.py @@ -87,12 +87,16 @@ return self._repr_iterable(x, level, header, '])', self.maxarray) def repr_set(self, x, level): + if not x: + return 'set()' x = _possibly_sorted(x) - return self._repr_iterable(x, level, 'set([', '])', self.maxset) + return self._repr_iterable(x, level, '{', '}', self.maxset) def repr_frozenset(self, x, level): + if not x: + return 'frozenset()' x = _possibly_sorted(x) - return self._repr_iterable(x, level, 'frozenset([', '])', + return self._repr_iterable(x, level, 'frozenset({', '})', self.maxfrozenset) def repr_deque(self, x, level): diff --git a/Lib/test/test_reprlib.py b/Lib/test/test_reprlib.py --- a/Lib/test/test_reprlib.py +++ b/Lib/test/test_reprlib.py @@ -10,7 +10,7 @@ import importlib.util import unittest -from test.support import run_unittest, create_empty_file, verbose +from test.support import create_empty_file, verbose from reprlib import repr as r # Don't shadow builtin repr from reprlib import Repr from reprlib import recursive_repr @@ -70,18 +70,18 @@ eq(r([1, 2, 3, 4, 5, 6, 7]), "[1, 2, 3, 4, 5, 6, ...]") # Sets give up after 6 as well - eq(r(set([])), "set([])") - eq(r(set([1])), "set([1])") - eq(r(set([1, 2, 3])), "set([1, 2, 3])") - eq(r(set([1, 2, 3, 4, 5, 6])), "set([1, 2, 3, 4, 5, 6])") - eq(r(set([1, 2, 3, 4, 5, 6, 7])), "set([1, 2, 3, 4, 5, 6, ...])") + eq(r(set([])), "set()") + eq(r(set([1])), "{1}") + eq(r(set([1, 2, 3])), "{1, 2, 3}") + eq(r(set([1, 2, 3, 4, 5, 6])), "{1, 2, 3, 4, 5, 6}") + eq(r(set([1, 2, 3, 4, 5, 6, 7])), "{1, 2, 3, 4, 5, 6, ...}") # Frozensets give up after 6 as well - eq(r(frozenset([])), "frozenset([])") - eq(r(frozenset([1])), "frozenset([1])") - eq(r(frozenset([1, 2, 3])), "frozenset([1, 2, 3])") - eq(r(frozenset([1, 2, 3, 4, 5, 6])), "frozenset([1, 2, 3, 4, 5, 6])") - eq(r(frozenset([1, 2, 3, 4, 5, 6, 7])), "frozenset([1, 2, 3, 4, 5, 6, ...])") + eq(r(frozenset([])), "frozenset()") + eq(r(frozenset([1])), "frozenset({1})") + eq(r(frozenset([1, 2, 3])), "frozenset({1, 2, 3})") + eq(r(frozenset([1, 2, 3, 4, 5, 6])), "frozenset({1, 2, 3, 4, 5, 6})") + eq(r(frozenset([1, 2, 3, 4, 5, 6, 7])), "frozenset({1, 2, 3, 4, 5, 6, ...})") # collections.deque after 6 eq(r(deque([1, 2, 3, 4, 5, 6, 7])), "deque([1, 2, 3, 4, 5, 6, ...])") @@ -103,6 +103,20 @@ eq(r(array('i', [1, 2, 3, 4, 5, 6])), "array('i', [1, 2, 3, 4, 5, ...])") + def test_set_literal(self): + eq = self.assertEqual + eq(r({1}), "{1}") + eq(r({1, 2, 3}), "{1, 2, 3}") + eq(r({1, 2, 3, 4, 5, 6}), "{1, 2, 3, 4, 5, 6}") + eq(r({1, 2, 3, 4, 5, 6, 7}), "{1, 2, 3, 4, 5, 6, ...}") + + def test_frozenset(self): + eq = self.assertEqual + eq(r(frozenset({1})), "frozenset({1})") + eq(r(frozenset({1, 2, 3})), "frozenset({1, 2, 3})") + eq(r(frozenset({1, 2, 3, 4, 5, 6})), "frozenset({1, 2, 3, 4, 5, 6})") + eq(r(frozenset({1, 2, 3, 4, 5, 6, 7})), "frozenset({1, 2, 3, 4, 5, 6, ...})") + def test_numbers(self): eq = self.assertEqual eq(r(123), repr(123)) @@ -373,11 +387,5 @@ m.append(m) self.assertEqual(repr(m), '') -def test_main(): - run_unittest(ReprTests) - run_unittest(LongReprTest) - run_unittest(TestRecursiveRepr) - - if __name__ == "__main__": - test_main() + unittest.main() diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -186,6 +186,9 @@ - Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. +- Issue #22824: Updated reprlib output format for sets to use set literals. 
+ Patch contributed by Berker Peksag. + - Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. Based on patch by Martin Panter. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 08:56:36 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 10 Nov 2014 07:56:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2321650=3A_Add_an_?= =?utf-8?q?=60--sort-keys=60_option_to_json=2Etool_CLI=2E?= Message-ID: <20141110075635.731.11536@psf.io> https://hg.python.org/cpython/rev/58a871227e5b changeset: 93450:58a871227e5b user: Berker Peksag date: Mon Nov 10 09:56:54 2014 +0200 summary: Issue #21650: Add an `--sort-keys` option to json.tool CLI. files: Doc/library/json.rst | 11 ++++++ Doc/whatsnew/3.5.rst | 8 ++++ Lib/json/tool.py | 12 ++++++- Lib/test/test_json/test_tool.py | 35 +++++++++++++++++++- Misc/NEWS | 2 + 5 files changed, 64 insertions(+), 4 deletions(-) diff --git a/Doc/library/json.rst b/Doc/library/json.rst --- a/Doc/library/json.rst +++ b/Doc/library/json.rst @@ -567,6 +567,7 @@ The *object_pairs_hook* parameter can be used to alter this behavior. .. highlight:: bash +.. module:: json.tool .. _json-commandline: @@ -586,6 +587,10 @@ $ echo '{1.2:3.4}' | python -m json.tool Expecting property name enclosed in double quotes: line 1 column 2 (char 1) +.. versionchanged:: 3.5 + The output is now in the same order as the input. Use the + :option:`--sort-keys` option to sort the output of dictionaries + alphabetically by key. Command line options ^^^^^^^^^^^^^^^^^^^^ @@ -613,6 +618,12 @@ Write the output of the *infile* to the given *outfile*. Otherwise, write it to :attr:`sys.stdout`. +.. cmdoption:: --sort-keys + + Sort the output of dictionaries alphabetically by key. + + .. versionadded:: 3.5 + .. cmdoption:: -h, --help Show the help message. diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -211,6 +211,14 @@ network objects from existing addresses. (Contributed by Peter Moody and Antoine Pitrou in :issue:`16531`.) +json +---- + +* The output of :mod:`json.tool` command line interface is now in the same + order as the input. Use the :option:`--sort-keys` option to sort the output + of dictionaries alphabetically by key. (Contributed by Berker Peksag in + :issue:`21650`.) 
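For a concrete picture of the new flag, a hypothetical transcript in the same bash style as the examples in Doc/library/json.rst (the input object is made up for illustration; the exact layout assumes json.dump(..., indent=4) as used in Lib/json/tool.py):

    $ echo '{"b": 0, "a": 1}' | python -m json.tool
    {
        "b": 0,
        "a": 1
    }
    $ echo '{"b": 0, "a": 1}' | python -m json.tool --sort-keys
    {
        "a": 1,
        "b": 0
    }

Without --sort-keys the keys now come out in input order (the document is loaded with object_pairs_hook=collections.OrderedDict); passing --sort-keys restores the previous always-sorted output.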
+ os -- diff --git a/Lib/json/tool.py b/Lib/json/tool.py --- a/Lib/json/tool.py +++ b/Lib/json/tool.py @@ -11,6 +11,7 @@ """ import argparse +import collections import json import sys @@ -24,17 +25,24 @@ help='a JSON file to be validated or pretty-printed') parser.add_argument('outfile', nargs='?', type=argparse.FileType('w'), help='write the output of infile to outfile') + parser.add_argument('--sort-keys', action='store_true', default=False, + help='sort the output of dictionaries alphabetically by key') options = parser.parse_args() infile = options.infile or sys.stdin outfile = options.outfile or sys.stdout + sort_keys = options.sort_keys with infile: try: - obj = json.load(infile) + if sort_keys: + obj = json.load(infile) + else: + obj = json.load(infile, + object_pairs_hook=collections.OrderedDict) except ValueError as e: raise SystemExit(e) with outfile: - json.dump(obj, outfile, sort_keys=True, indent=4) + json.dump(obj, outfile, sort_keys=sort_keys, indent=4) outfile.write('\n') diff --git a/Lib/test/test_json/test_tool.py b/Lib/test/test_json/test_tool.py --- a/Lib/test/test_json/test_tool.py +++ b/Lib/test/test_json/test_tool.py @@ -6,6 +6,7 @@ from test import support from test.script_helper import assert_python_ok + class TestTool(unittest.TestCase): data = """ @@ -15,6 +16,28 @@ :"yes"} ] """ + expect_without_sort_keys = textwrap.dedent("""\ + [ + [ + "blorpie" + ], + [ + "whoops" + ], + [], + "d-shtaeou", + "d-nthiouh", + "i-vhbjkhnth", + { + "nifty": 87 + }, + { + "field": "yes", + "morefield": false + } + ] + """) + expect = textwrap.dedent("""\ [ [ @@ -31,8 +54,8 @@ "nifty": 87 }, { - "field": "yes", - "morefield": false + "morefield": false, + "field": "yes" } ] """) @@ -75,3 +98,11 @@ self.assertEqual(rc, 0) self.assertTrue(out.startswith(b'usage: ')) self.assertEqual(err, b'') + + def test_sort_keys_flag(self): + infile = self._create_infile() + rc, out, err = assert_python_ok('-m', 'json.tool', '--sort-keys', infile) + self.assertEqual(rc, 0) + self.assertEqual(out.splitlines(), + self.expect_without_sort_keys.encode().splitlines()) + self.assertEqual(err, b'') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,8 @@ Library ------- +- Issue #21650: Add an `--sort-keys` option to json.tool CLI. + - Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 09:23:18 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 08:23:18 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322434=3A_Constant?= =?utf-8?q?s_in_sre=5Fconstants_are_now_named_constants_=28enum-like=29=2E?= Message-ID: <20141110082318.113474.69580@psf.io> https://hg.python.org/cpython/rev/fc7dbba57869 changeset: 93451:fc7dbba57869 parent: 93441:ec81edc30221 user: Serhiy Storchaka date: Sun Nov 09 20:48:36 2014 +0200 summary: Issue #22434: Constants in sre_constants are now named constants (enum-like). 
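In practice this means the opcodes keep their numeric values (so the numbering handed to the C engine is unchanged) but print as their symbolic names. A rough interactive sketch, based on the _NamedIntConstant helper added in the diff below:

    >>> from sre_constants import LITERAL, OPCODES
    >>> LITERAL                       # str() and repr() give the name
    LITERAL
    >>> isinstance(LITERAL, int)
    True
    >>> OPCODES[LITERAL] is LITERAL   # each value doubles as its own index
    True

That is what lets the re.DEBUG output checked in Lib/test/test_re.py print names such as SUBPATTERN, LITERAL and AT_END directly, instead of going through the old string constants and the OPCODES/ATCODES/CHCODES lookup dicts.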
files: Lib/sre_compile.py | 75 +++++----- Lib/sre_constants.py | 197 +++++++++++------------------- Lib/sre_parse.py | 9 +- Lib/test/test_re.py | 32 ++-- 4 files changed, 127 insertions(+), 186 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -13,7 +13,6 @@ import _sre import sre_parse from sre_constants import * -from _sre import MAXREPEAT assert _sre.MAGIC == MAGIC, "SRE module mismatch" @@ -38,65 +37,65 @@ for op, av in pattern: if op in LITERAL_CODES: if flags & SRE_FLAG_IGNORECASE: - emit(OPCODES[OP_IGNORE[op]]) + emit(OP_IGNORE[op]) emit(_sre.getlower(av, flags)) else: - emit(OPCODES[op]) + emit(op) emit(av) elif op is IN: if flags & SRE_FLAG_IGNORECASE: - emit(OPCODES[OP_IGNORE[op]]) + emit(OP_IGNORE[op]) def fixup(literal, flags=flags): return _sre.getlower(literal, flags) else: - emit(OPCODES[op]) + emit(op) fixup = None skip = _len(code); emit(0) _compile_charset(av, flags, code, fixup) code[skip] = _len(code) - skip elif op is ANY: if flags & SRE_FLAG_DOTALL: - emit(OPCODES[ANY_ALL]) + emit(ANY_ALL) else: - emit(OPCODES[ANY]) + emit(ANY) elif op in REPEATING_CODES: if flags & SRE_FLAG_TEMPLATE: raise error("internal: unsupported template operator") elif _simple(av) and op is not REPEAT: if op is MAX_REPEAT: - emit(OPCODES[REPEAT_ONE]) + emit(REPEAT_ONE) else: - emit(OPCODES[MIN_REPEAT_ONE]) + emit(MIN_REPEAT_ONE) skip = _len(code); emit(0) emit(av[0]) emit(av[1]) _compile(code, av[2], flags) - emit(OPCODES[SUCCESS]) + emit(SUCCESS) code[skip] = _len(code) - skip else: - emit(OPCODES[REPEAT]) + emit(REPEAT) skip = _len(code); emit(0) emit(av[0]) emit(av[1]) _compile(code, av[2], flags) code[skip] = _len(code) - skip if op is MAX_REPEAT: - emit(OPCODES[MAX_UNTIL]) + emit(MAX_UNTIL) else: - emit(OPCODES[MIN_UNTIL]) + emit(MIN_UNTIL) elif op is SUBPATTERN: if av[0]: - emit(OPCODES[MARK]) + emit(MARK) emit((av[0]-1)*2) # _compile_info(code, av[1], flags) _compile(code, av[1], flags) if av[0]: - emit(OPCODES[MARK]) + emit(MARK) emit((av[0]-1)*2+1) elif op in SUCCESS_CODES: - emit(OPCODES[op]) + emit(op) elif op in ASSERT_CODES: - emit(OPCODES[op]) + emit(op) skip = _len(code); emit(0) if av[0] >= 0: emit(0) # look ahead @@ -106,57 +105,57 @@ raise error("look-behind requires fixed-width pattern") emit(lo) # look behind _compile(code, av[1], flags) - emit(OPCODES[SUCCESS]) + emit(SUCCESS) code[skip] = _len(code) - skip elif op is CALL: - emit(OPCODES[op]) + emit(op) skip = _len(code); emit(0) _compile(code, av, flags) - emit(OPCODES[SUCCESS]) + emit(SUCCESS) code[skip] = _len(code) - skip elif op is AT: - emit(OPCODES[op]) + emit(op) if flags & SRE_FLAG_MULTILINE: av = AT_MULTILINE.get(av, av) if flags & SRE_FLAG_LOCALE: av = AT_LOCALE.get(av, av) elif flags & SRE_FLAG_UNICODE: av = AT_UNICODE.get(av, av) - emit(ATCODES[av]) + emit(av) elif op is BRANCH: - emit(OPCODES[op]) + emit(op) tail = [] tailappend = tail.append for av in av[1]: skip = _len(code); emit(0) # _compile_info(code, av, flags) _compile(code, av, flags) - emit(OPCODES[JUMP]) + emit(JUMP) tailappend(_len(code)); emit(0) code[skip] = _len(code) - skip emit(0) # end of branch for tail in tail: code[tail] = _len(code) - tail elif op is CATEGORY: - emit(OPCODES[op]) + emit(op) if flags & SRE_FLAG_LOCALE: av = CH_LOCALE[av] elif flags & SRE_FLAG_UNICODE: av = CH_UNICODE[av] - emit(CHCODES[av]) + emit(av) elif op is GROUPREF: if flags & SRE_FLAG_IGNORECASE: - emit(OPCODES[OP_IGNORE[op]]) + emit(OP_IGNORE[op]) else: - emit(OPCODES[op]) + emit(op) emit(av-1) 
elif op is GROUPREF_EXISTS: - emit(OPCODES[op]) + emit(op) emit(av[0]-1) skipyes = _len(code); emit(0) _compile(code, av[1], flags) if av[2]: - emit(OPCODES[JUMP]) + emit(JUMP) skipno = _len(code); emit(0) code[skipyes] = _len(code) - skipyes + 1 _compile(code, av[2], flags) @@ -170,7 +169,7 @@ # compile charset subprogram emit = code.append for op, av in _optimize_charset(charset, fixup): - emit(OPCODES[op]) + emit(op) if op is NEGATE: pass elif op is LITERAL: @@ -184,14 +183,14 @@ code.extend(av) elif op is CATEGORY: if flags & SRE_FLAG_LOCALE: - emit(CHCODES[CH_LOCALE[av]]) + emit(CH_LOCALE[av]) elif flags & SRE_FLAG_UNICODE: - emit(CHCODES[CH_UNICODE[av]]) + emit(CH_UNICODE[av]) else: - emit(CHCODES[av]) + emit(av) else: raise error("internal: unsupported set operator") - emit(OPCODES[FAILURE]) + emit(FAILURE) def _optimize_charset(charset, fixup): # internal: optimize character set @@ -414,7 +413,7 @@ ## print "*** CHARSET", charset # add an info block emit = code.append - emit(OPCODES[INFO]) + emit(INFO) skip = len(code); emit(0) # literal flag mask = 0 @@ -460,7 +459,7 @@ # compile the pattern _compile(code, p.data, flags) - code.append(OPCODES[SUCCESS]) + code.append(SUCCESS) return code @@ -475,7 +474,7 @@ code = _code(p, flags) - # print code + # print(code) # map in either direction groupindex = p.pattern.groupdict diff --git a/Lib/sre_constants.py b/Lib/sre_constants.py --- a/Lib/sre_constants.py +++ b/Lib/sre_constants.py @@ -23,138 +23,81 @@ class error(Exception): pass + +class _NamedIntConstant(int): + def __new__(cls, value, name): + self = super(_NamedIntConstant, cls).__new__(cls, value) + self.name = name + return self + + def __str__(self): + return self.name + + __repr__ = __str__ + +MAXREPEAT = _NamedIntConstant(MAXREPEAT, 'MAXREPEAT') + +def _makecodes(names): + names = names.strip().split() + items = [_NamedIntConstant(i, name) for i, name in enumerate(names)] + globals().update({item.name: item for item in items}) + return items + # operators +# failure=0 success=1 (just because it looks better that way :-) +OPCODES = _makecodes(""" + FAILURE SUCCESS -FAILURE = "failure" -SUCCESS = "success" + ANY ANY_ALL + ASSERT ASSERT_NOT + AT + BRANCH + CALL + CATEGORY + CHARSET BIGCHARSET + GROUPREF GROUPREF_EXISTS GROUPREF_IGNORE + IN IN_IGNORE + INFO + JUMP + LITERAL LITERAL_IGNORE + MARK + MAX_UNTIL + MIN_UNTIL + NOT_LITERAL NOT_LITERAL_IGNORE + NEGATE + RANGE + REPEAT + REPEAT_ONE + SUBPATTERN + MIN_REPEAT_ONE + RANGE_IGNORE -ANY = "any" -ANY_ALL = "any_all" -ASSERT = "assert" -ASSERT_NOT = "assert_not" -AT = "at" -BIGCHARSET = "bigcharset" -BRANCH = "branch" -CALL = "call" -CATEGORY = "category" -CHARSET = "charset" -GROUPREF = "groupref" -GROUPREF_IGNORE = "groupref_ignore" -GROUPREF_EXISTS = "groupref_exists" -IN = "in" -IN_IGNORE = "in_ignore" -INFO = "info" -JUMP = "jump" -LITERAL = "literal" -LITERAL_IGNORE = "literal_ignore" -MARK = "mark" -MAX_REPEAT = "max_repeat" -MAX_UNTIL = "max_until" -MIN_REPEAT = "min_repeat" -MIN_UNTIL = "min_until" -NEGATE = "negate" -NOT_LITERAL = "not_literal" -NOT_LITERAL_IGNORE = "not_literal_ignore" -RANGE = "range" -RANGE_IGNORE = "range_ignore" -REPEAT = "repeat" -REPEAT_ONE = "repeat_one" -SUBPATTERN = "subpattern" -MIN_REPEAT_ONE = "min_repeat_one" + MIN_REPEAT MAX_REPEAT +""") +del OPCODES[-2:] # remove MIN_REPEAT and MAX_REPEAT # positions -AT_BEGINNING = "at_beginning" -AT_BEGINNING_LINE = "at_beginning_line" -AT_BEGINNING_STRING = "at_beginning_string" -AT_BOUNDARY = "at_boundary" -AT_NON_BOUNDARY = "at_non_boundary" -AT_END 
= "at_end" -AT_END_LINE = "at_end_line" -AT_END_STRING = "at_end_string" -AT_LOC_BOUNDARY = "at_loc_boundary" -AT_LOC_NON_BOUNDARY = "at_loc_non_boundary" -AT_UNI_BOUNDARY = "at_uni_boundary" -AT_UNI_NON_BOUNDARY = "at_uni_non_boundary" +ATCODES = _makecodes(""" + AT_BEGINNING AT_BEGINNING_LINE AT_BEGINNING_STRING + AT_BOUNDARY AT_NON_BOUNDARY + AT_END AT_END_LINE AT_END_STRING + AT_LOC_BOUNDARY AT_LOC_NON_BOUNDARY + AT_UNI_BOUNDARY AT_UNI_NON_BOUNDARY +""") # categories -CATEGORY_DIGIT = "category_digit" -CATEGORY_NOT_DIGIT = "category_not_digit" -CATEGORY_SPACE = "category_space" -CATEGORY_NOT_SPACE = "category_not_space" -CATEGORY_WORD = "category_word" -CATEGORY_NOT_WORD = "category_not_word" -CATEGORY_LINEBREAK = "category_linebreak" -CATEGORY_NOT_LINEBREAK = "category_not_linebreak" -CATEGORY_LOC_WORD = "category_loc_word" -CATEGORY_LOC_NOT_WORD = "category_loc_not_word" -CATEGORY_UNI_DIGIT = "category_uni_digit" -CATEGORY_UNI_NOT_DIGIT = "category_uni_not_digit" -CATEGORY_UNI_SPACE = "category_uni_space" -CATEGORY_UNI_NOT_SPACE = "category_uni_not_space" -CATEGORY_UNI_WORD = "category_uni_word" -CATEGORY_UNI_NOT_WORD = "category_uni_not_word" -CATEGORY_UNI_LINEBREAK = "category_uni_linebreak" -CATEGORY_UNI_NOT_LINEBREAK = "category_uni_not_linebreak" +CHCODES = _makecodes(""" + CATEGORY_DIGIT CATEGORY_NOT_DIGIT + CATEGORY_SPACE CATEGORY_NOT_SPACE + CATEGORY_WORD CATEGORY_NOT_WORD + CATEGORY_LINEBREAK CATEGORY_NOT_LINEBREAK + CATEGORY_LOC_WORD CATEGORY_LOC_NOT_WORD + CATEGORY_UNI_DIGIT CATEGORY_UNI_NOT_DIGIT + CATEGORY_UNI_SPACE CATEGORY_UNI_NOT_SPACE + CATEGORY_UNI_WORD CATEGORY_UNI_NOT_WORD + CATEGORY_UNI_LINEBREAK CATEGORY_UNI_NOT_LINEBREAK +""") -OPCODES = [ - - # failure=0 success=1 (just because it looks better that way :-) - FAILURE, SUCCESS, - - ANY, ANY_ALL, - ASSERT, ASSERT_NOT, - AT, - BRANCH, - CALL, - CATEGORY, - CHARSET, BIGCHARSET, - GROUPREF, GROUPREF_EXISTS, GROUPREF_IGNORE, - IN, IN_IGNORE, - INFO, - JUMP, - LITERAL, LITERAL_IGNORE, - MARK, - MAX_UNTIL, - MIN_UNTIL, - NOT_LITERAL, NOT_LITERAL_IGNORE, - NEGATE, - RANGE, - REPEAT, - REPEAT_ONE, - SUBPATTERN, - MIN_REPEAT_ONE, - RANGE_IGNORE, - -] - -ATCODES = [ - AT_BEGINNING, AT_BEGINNING_LINE, AT_BEGINNING_STRING, AT_BOUNDARY, - AT_NON_BOUNDARY, AT_END, AT_END_LINE, AT_END_STRING, - AT_LOC_BOUNDARY, AT_LOC_NON_BOUNDARY, AT_UNI_BOUNDARY, - AT_UNI_NON_BOUNDARY -] - -CHCODES = [ - CATEGORY_DIGIT, CATEGORY_NOT_DIGIT, CATEGORY_SPACE, - CATEGORY_NOT_SPACE, CATEGORY_WORD, CATEGORY_NOT_WORD, - CATEGORY_LINEBREAK, CATEGORY_NOT_LINEBREAK, CATEGORY_LOC_WORD, - CATEGORY_LOC_NOT_WORD, CATEGORY_UNI_DIGIT, CATEGORY_UNI_NOT_DIGIT, - CATEGORY_UNI_SPACE, CATEGORY_UNI_NOT_SPACE, CATEGORY_UNI_WORD, - CATEGORY_UNI_NOT_WORD, CATEGORY_UNI_LINEBREAK, - CATEGORY_UNI_NOT_LINEBREAK -] - -def makedict(list): - d = {} - i = 0 - for item in list: - d[item] = i - i = i + 1 - return d - -OPCODES = makedict(OPCODES) -ATCODES = makedict(ATCODES) -CHCODES = makedict(CHCODES) # replacement operations for "ignore case" mode OP_IGNORE = { @@ -220,9 +163,9 @@ if __name__ == "__main__": def dump(f, d, prefix): - items = sorted(d.items(), key=lambda a: a[1]) - for k, v in items: - f.write("#define %s_%s %s\n" % (prefix, k.upper(), v)) + items = sorted(d) + for item in items: + f.write("#define %s_%s %d\n" % (prefix, item, item)) f = open("sre_constants.h", "w") f.write("""\ /* diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -13,7 +13,6 @@ # XXX: show string offset and offending character for all errors from 
sre_constants import * -from _sre import MAXREPEAT SPECIAL_CHARS = ".\\[{()*+?^$|" REPEAT_CHARS = "*+?{" @@ -103,24 +102,24 @@ nl = True seqtypes = (tuple, list) for op, av in self.data: - print(level*" " + op, end='') + print(level*" " + str(op), end='') if op == IN: # member sublanguage print() for op, a in av: - print((level+1)*" " + op, a) + print((level+1)*" " + str(op), a) elif op == BRANCH: print() for i, a in enumerate(av[1]): if i: - print(level*" " + "or") + print(level*" " + "OR") a.dump(level+1) elif op == GROUPREF_EXISTS: condgroup, item_yes, item_no = av print('', condgroup) item_yes.dump(level+1) if item_no: - print(level*" " + "else") + print(level*" " + "ELSE") item_no.dump(level+1) elif isinstance(av, seqtypes): nl = False diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -1285,22 +1285,22 @@ with captured_stdout() as out: re.compile(pat, re.DEBUG) dump = '''\ -subpattern 1 - literal 46 -subpattern None - branch - in - literal 99 - literal 104 - or - literal 112 - literal 121 -subpattern None - groupref_exists 1 - at at_end - else - literal 58 - literal 32 +SUBPATTERN 1 + LITERAL 46 +SUBPATTERN None + BRANCH + IN + LITERAL 99 + LITERAL 104 + OR + LITERAL 112 + LITERAL 121 +SUBPATTERN None + GROUPREF_EXISTS 1 + AT AT_END + ELSE + LITERAL 58 + LITERAL 32 ''' self.assertEqual(out.getvalue(), dump) # Debug output is output again even a second time (bypassing -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 09:23:18 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 08:23:18 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_default_-=3E_default?= =?utf-8?q?=29=3A_Merge_heads?= Message-ID: <20141110082318.85194.34355@psf.io> https://hg.python.org/cpython/rev/8111ee79d27c changeset: 93452:8111ee79d27c parent: 93451:fc7dbba57869 parent: 93450:58a871227e5b user: Serhiy Storchaka date: Mon Nov 10 10:21:03 2014 +0200 summary: Merge heads files: Doc/howto/logging-cookbook.rst | 2 +- Doc/library/functools.rst | 9 +- Doc/library/json.rst | 11 + Doc/library/pickle.rst | 2 +- Doc/tutorial/stdlib2.rst | 2 +- Doc/whatsnew/3.5.rst | 8 + Lib/_strptime.py | 4 +- Lib/asyncore.py | 6 +- Lib/ipaddress.py | 2 +- Lib/json/tool.py | 12 +- Lib/mailbox.py | 4 +- Lib/reprlib.py | 8 +- Lib/sre_compile.py | 8 +- Lib/sre_parse.py | 4 +- Lib/statistics.py | 4 +- Lib/test/test_json/test_tool.py | 35 +- Lib/test/test_reprlib.py | 44 +- Misc/NEWS | 5 + Modules/clinic/fcntlmodule.c.h | 188 ++++++++ Modules/fcntlmodule.c | 432 ++++++++++--------- Parser/asdl.py | 3 +- 21 files changed, 537 insertions(+), 256 deletions(-) diff --git a/Doc/howto/logging-cookbook.rst b/Doc/howto/logging-cookbook.rst --- a/Doc/howto/logging-cookbook.rst +++ b/Doc/howto/logging-cookbook.rst @@ -1680,7 +1680,7 @@ def main(): logging.basicConfig(level=logging.INFO, format='%(message)s') - logging.info(_('message 1', set_value=set([1, 2, 3]), snowman='\u2603')) + logging.info(_('message 1', set_value={1, 2, 3}, snowman='\u2603')) if __name__ == '__main__': main() diff --git a/Doc/library/functools.rst b/Doc/library/functools.rst --- a/Doc/library/functools.rst +++ b/Doc/library/functools.rst @@ -21,8 +21,8 @@ .. function:: cmp_to_key(func) - Transform an old-style comparison function to a key function. Used with - tools that accept key functions (such as :func:`sorted`, :func:`min`, + Transform an old-style comparison function to a :term:`key function`. 
Used + with tools that accept key functions (such as :func:`sorted`, :func:`min`, :func:`max`, :func:`heapq.nlargest`, :func:`heapq.nsmallest`, :func:`itertools.groupby`). This function is primarily used as a transition tool for programs being converted from Python 2 which supported the use of @@ -31,13 +31,14 @@ A comparison function is any callable that accept two arguments, compares them, and returns a negative number for less-than, zero for equality, or a positive number for greater-than. A key function is a callable that accepts one - argument and returns another value indicating the position in the desired - collation sequence. + argument and returns another value to be used as the sort key. Example:: sorted(iterable, key=cmp_to_key(locale.strcoll)) # locale-aware sort order + For sorting examples and a brief sorting tutorial, see :ref:`sortinghowto`. + .. versionadded:: 3.2 diff --git a/Doc/library/json.rst b/Doc/library/json.rst --- a/Doc/library/json.rst +++ b/Doc/library/json.rst @@ -567,6 +567,7 @@ The *object_pairs_hook* parameter can be used to alter this behavior. .. highlight:: bash +.. module:: json.tool .. _json-commandline: @@ -586,6 +587,10 @@ $ echo '{1.2:3.4}' | python -m json.tool Expecting property name enclosed in double quotes: line 1 column 2 (char 1) +.. versionchanged:: 3.5 + The output is now in the same order as the input. Use the + :option:`--sort-keys` option to sort the output of dictionaries + alphabetically by key. Command line options ^^^^^^^^^^^^^^^^^^^^ @@ -613,6 +618,12 @@ Write the output of the *infile* to the given *outfile*. Otherwise, write it to :attr:`sys.stdout`. +.. cmdoption:: --sort-keys + + Sort the output of dictionaries alphabetically by key. + + .. versionadded:: 3.5 + .. cmdoption:: -h, --help Show the help message. diff --git a/Doc/library/pickle.rst b/Doc/library/pickle.rst --- a/Doc/library/pickle.rst +++ b/Doc/library/pickle.rst @@ -859,7 +859,7 @@ data = { 'a': [1, 2.0, 3, 4+6j], 'b': ("character string", b"byte string"), - 'c': set([None, True, False]) + 'c': {None, True, False} } with open('data.pickle', 'wb') as f: diff --git a/Doc/tutorial/stdlib2.rst b/Doc/tutorial/stdlib2.rst --- a/Doc/tutorial/stdlib2.rst +++ b/Doc/tutorial/stdlib2.rst @@ -18,7 +18,7 @@ >>> import reprlib >>> reprlib.repr(set('supercalifragilisticexpialidocious')) - "set(['a', 'c', 'd', 'e', 'f', 'g', ...])" + "{'a', 'c', 'd', 'e', 'f', 'g', ...}" The :mod:`pprint` module offers more sophisticated control over printing both built-in and user defined objects in a way that is readable by the interpreter. diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -211,6 +211,14 @@ network objects from existing addresses. (Contributed by Peter Moody and Antoine Pitrou in :issue:`16531`.) +json +---- + +* The output of :mod:`json.tool` command line interface is now in the same + order as the input. Use the :option:`--sort-keys` option to sort the output + of dictionaries alphabetically by key. (Contributed by Berker Peksag in + :issue:`21650`.) 
+ os -- diff --git a/Lib/_strptime.py b/Lib/_strptime.py --- a/Lib/_strptime.py +++ b/Lib/_strptime.py @@ -167,9 +167,9 @@ time.tzset() except AttributeError: pass - no_saving = frozenset(["utc", "gmt", time.tzname[0].lower()]) + no_saving = frozenset({"utc", "gmt", time.tzname[0].lower()}) if time.daylight: - has_saving = frozenset([time.tzname[1].lower()]) + has_saving = frozenset({time.tzname[1].lower()}) else: has_saving = frozenset() self.timezone = (no_saving, has_saving) diff --git a/Lib/asyncore.py b/Lib/asyncore.py --- a/Lib/asyncore.py +++ b/Lib/asyncore.py @@ -57,8 +57,8 @@ ENOTCONN, ESHUTDOWN, EISCONN, EBADF, ECONNABORTED, EPIPE, EAGAIN, \ errorcode -_DISCONNECTED = frozenset((ECONNRESET, ENOTCONN, ESHUTDOWN, ECONNABORTED, EPIPE, - EBADF)) +_DISCONNECTED = frozenset({ECONNRESET, ENOTCONN, ESHUTDOWN, ECONNABORTED, EPIPE, + EBADF}) try: socket_map @@ -220,7 +220,7 @@ connecting = False closing = False addr = None - ignore_log_types = frozenset(['warning']) + ignore_log_types = frozenset({'warning'}) def __init__(self, sock=None, map=None): if map is None: diff --git a/Lib/ipaddress.py b/Lib/ipaddress.py --- a/Lib/ipaddress.py +++ b/Lib/ipaddress.py @@ -1088,7 +1088,7 @@ _DECIMAL_DIGITS = frozenset('0123456789') # the valid octets for host and netmasks. only useful for IPv4. - _valid_mask_octets = frozenset((255, 254, 252, 248, 240, 224, 192, 128, 0)) + _valid_mask_octets = frozenset({255, 254, 252, 248, 240, 224, 192, 128, 0}) _max_prefixlen = IPV4LENGTH # There are only a handful of valid v4 netmasks, so we cache them all diff --git a/Lib/json/tool.py b/Lib/json/tool.py --- a/Lib/json/tool.py +++ b/Lib/json/tool.py @@ -11,6 +11,7 @@ """ import argparse +import collections import json import sys @@ -24,17 +25,24 @@ help='a JSON file to be validated or pretty-printed') parser.add_argument('outfile', nargs='?', type=argparse.FileType('w'), help='write the output of infile to outfile') + parser.add_argument('--sort-keys', action='store_true', default=False, + help='sort the output of dictionaries alphabetically by key') options = parser.parse_args() infile = options.infile or sys.stdin outfile = options.outfile or sys.stdout + sort_keys = options.sort_keys with infile: try: - obj = json.load(infile) + if sort_keys: + obj = json.load(infile) + else: + obj = json.load(infile, + object_pairs_hook=collections.OrderedDict) except ValueError as e: raise SystemExit(e) with outfile: - json.dump(obj, outfile, sort_keys=True, indent=4) + json.dump(obj, outfile, sort_keys=sort_keys, indent=4) outfile.write('\n') diff --git a/Lib/mailbox.py b/Lib/mailbox.py --- a/Lib/mailbox.py +++ b/Lib/mailbox.py @@ -1230,8 +1230,8 @@ class Babyl(_singlefileMailbox): """An Rmail-style Babyl mailbox.""" - _special_labels = frozenset(('unseen', 'deleted', 'filed', 'answered', - 'forwarded', 'edited', 'resent')) + _special_labels = frozenset({'unseen', 'deleted', 'filed', 'answered', + 'forwarded', 'edited', 'resent'}) def __init__(self, path, factory=None, create=True): """Initialize a Babyl mailbox.""" diff --git a/Lib/reprlib.py b/Lib/reprlib.py --- a/Lib/reprlib.py +++ b/Lib/reprlib.py @@ -87,12 +87,16 @@ return self._repr_iterable(x, level, header, '])', self.maxarray) def repr_set(self, x, level): + if not x: + return 'set()' x = _possibly_sorted(x) - return self._repr_iterable(x, level, 'set([', '])', self.maxset) + return self._repr_iterable(x, level, '{', '}', self.maxset) def repr_frozenset(self, x, level): + if not x: + return 'frozenset()' x = _possibly_sorted(x) - return self._repr_iterable(x, 
level, 'frozenset([', '])', + return self._repr_iterable(x, level, 'frozenset({', '})', self.maxfrozenset) def repr_deque(self, x, level): diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -21,10 +21,10 @@ else: MAXCODE = 0xFFFFFFFF -_LITERAL_CODES = set([LITERAL, NOT_LITERAL]) -_REPEATING_CODES = set([REPEAT, MIN_REPEAT, MAX_REPEAT]) -_SUCCESS_CODES = set([SUCCESS, FAILURE]) -_ASSERT_CODES = set([ASSERT, ASSERT_NOT]) +_LITERAL_CODES = {LITERAL, NOT_LITERAL} +_REPEATING_CODES = {REPEAT, MIN_REPEAT, MAX_REPEAT} +_SUCCESS_CODES = {SUCCESS, FAILURE} +_ASSERT_CODES = {ASSERT, ASSERT_NOT} def _compile(code, pattern, flags): # internal: compile a (sub)pattern diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -24,8 +24,8 @@ WHITESPACE = frozenset(" \t\n\r\v\f") -_REPEATCODES = frozenset((MIN_REPEAT, MAX_REPEAT)) -_UNITCODES = frozenset((ANY, RANGE, IN, LITERAL, NOT_LITERAL, CATEGORY)) +_REPEATCODES = frozenset({MIN_REPEAT, MAX_REPEAT}) +_UNITCODES = frozenset({ANY, RANGE, IN, LITERAL, NOT_LITERAL, CATEGORY}) ESCAPES = { r"\a": (LITERAL, ord("\a")), diff --git a/Lib/statistics.py b/Lib/statistics.py --- a/Lib/statistics.py +++ b/Lib/statistics.py @@ -150,7 +150,7 @@ # We fail as soon as we reach a value that is not an int or the type of # the first value which is not an int. E.g. _sum([int, int, float, int]) # is okay, but sum([int, int, float, Fraction]) is not. - allowed_types = set([int, type(start)]) + allowed_types = {int, type(start)} n, d = _exact_ratio(start) partials = {d: n} # map {denominator: sum of numerators} # Micro-optimizations. @@ -168,7 +168,7 @@ assert allowed_types.pop() is int T = int else: - T = (allowed_types - set([int])).pop() + T = (allowed_types - {int}).pop() if None in partials: assert issubclass(T, (float, Decimal)) assert not math.isfinite(partials[None]) diff --git a/Lib/test/test_json/test_tool.py b/Lib/test/test_json/test_tool.py --- a/Lib/test/test_json/test_tool.py +++ b/Lib/test/test_json/test_tool.py @@ -6,6 +6,7 @@ from test import support from test.script_helper import assert_python_ok + class TestTool(unittest.TestCase): data = """ @@ -15,6 +16,28 @@ :"yes"} ] """ + expect_without_sort_keys = textwrap.dedent("""\ + [ + [ + "blorpie" + ], + [ + "whoops" + ], + [], + "d-shtaeou", + "d-nthiouh", + "i-vhbjkhnth", + { + "nifty": 87 + }, + { + "field": "yes", + "morefield": false + } + ] + """) + expect = textwrap.dedent("""\ [ [ @@ -31,8 +54,8 @@ "nifty": 87 }, { - "field": "yes", - "morefield": false + "morefield": false, + "field": "yes" } ] """) @@ -75,3 +98,11 @@ self.assertEqual(rc, 0) self.assertTrue(out.startswith(b'usage: ')) self.assertEqual(err, b'') + + def test_sort_keys_flag(self): + infile = self._create_infile() + rc, out, err = assert_python_ok('-m', 'json.tool', '--sort-keys', infile) + self.assertEqual(rc, 0) + self.assertEqual(out.splitlines(), + self.expect_without_sort_keys.encode().splitlines()) + self.assertEqual(err, b'') diff --git a/Lib/test/test_reprlib.py b/Lib/test/test_reprlib.py --- a/Lib/test/test_reprlib.py +++ b/Lib/test/test_reprlib.py @@ -10,7 +10,7 @@ import importlib.util import unittest -from test.support import run_unittest, create_empty_file, verbose +from test.support import create_empty_file, verbose from reprlib import repr as r # Don't shadow builtin repr from reprlib import Repr from reprlib import recursive_repr @@ -70,18 +70,18 @@ eq(r([1, 2, 3, 4, 5, 6, 7]), "[1, 2, 3, 4, 5, 6, ...]") # Sets give up after 6 as 
well - eq(r(set([])), "set([])") - eq(r(set([1])), "set([1])") - eq(r(set([1, 2, 3])), "set([1, 2, 3])") - eq(r(set([1, 2, 3, 4, 5, 6])), "set([1, 2, 3, 4, 5, 6])") - eq(r(set([1, 2, 3, 4, 5, 6, 7])), "set([1, 2, 3, 4, 5, 6, ...])") + eq(r(set([])), "set()") + eq(r(set([1])), "{1}") + eq(r(set([1, 2, 3])), "{1, 2, 3}") + eq(r(set([1, 2, 3, 4, 5, 6])), "{1, 2, 3, 4, 5, 6}") + eq(r(set([1, 2, 3, 4, 5, 6, 7])), "{1, 2, 3, 4, 5, 6, ...}") # Frozensets give up after 6 as well - eq(r(frozenset([])), "frozenset([])") - eq(r(frozenset([1])), "frozenset([1])") - eq(r(frozenset([1, 2, 3])), "frozenset([1, 2, 3])") - eq(r(frozenset([1, 2, 3, 4, 5, 6])), "frozenset([1, 2, 3, 4, 5, 6])") - eq(r(frozenset([1, 2, 3, 4, 5, 6, 7])), "frozenset([1, 2, 3, 4, 5, 6, ...])") + eq(r(frozenset([])), "frozenset()") + eq(r(frozenset([1])), "frozenset({1})") + eq(r(frozenset([1, 2, 3])), "frozenset({1, 2, 3})") + eq(r(frozenset([1, 2, 3, 4, 5, 6])), "frozenset({1, 2, 3, 4, 5, 6})") + eq(r(frozenset([1, 2, 3, 4, 5, 6, 7])), "frozenset({1, 2, 3, 4, 5, 6, ...})") # collections.deque after 6 eq(r(deque([1, 2, 3, 4, 5, 6, 7])), "deque([1, 2, 3, 4, 5, 6, ...])") @@ -103,6 +103,20 @@ eq(r(array('i', [1, 2, 3, 4, 5, 6])), "array('i', [1, 2, 3, 4, 5, ...])") + def test_set_literal(self): + eq = self.assertEqual + eq(r({1}), "{1}") + eq(r({1, 2, 3}), "{1, 2, 3}") + eq(r({1, 2, 3, 4, 5, 6}), "{1, 2, 3, 4, 5, 6}") + eq(r({1, 2, 3, 4, 5, 6, 7}), "{1, 2, 3, 4, 5, 6, ...}") + + def test_frozenset(self): + eq = self.assertEqual + eq(r(frozenset({1})), "frozenset({1})") + eq(r(frozenset({1, 2, 3})), "frozenset({1, 2, 3})") + eq(r(frozenset({1, 2, 3, 4, 5, 6})), "frozenset({1, 2, 3, 4, 5, 6})") + eq(r(frozenset({1, 2, 3, 4, 5, 6, 7})), "frozenset({1, 2, 3, 4, 5, 6, ...})") + def test_numbers(self): eq = self.assertEqual eq(r(123), repr(123)) @@ -373,11 +387,5 @@ m.append(m) self.assertEqual(repr(m), '') -def test_main(): - run_unittest(ReprTests) - run_unittest(LongReprTest) - run_unittest(TestRecursiveRepr) - - if __name__ == "__main__": - test_main() + unittest.main() diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,9 +183,14 @@ Library ------- +- Issue #21650: Add an `--sort-keys` option to json.tool CLI. + - Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. +- Issue #22824: Updated reprlib output format for sets to use set literals. + Patch contributed by Berker Peksag. + - Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. Based on patch by Martin Panter. diff --git a/Modules/clinic/fcntlmodule.c.h b/Modules/clinic/fcntlmodule.c.h new file mode 100644 --- /dev/null +++ b/Modules/clinic/fcntlmodule.c.h @@ -0,0 +1,188 @@ +/*[clinic input] +preserve +[clinic start generated code]*/ + +PyDoc_STRVAR(fcntl_fcntl__doc__, +"fcntl($module, fd, code, arg=None, /)\n" +"--\n" +"\n" +"Perform the operation `code` on file descriptor fd.\n" +"\n" +"The values used for `code` are operating system dependent, and are available\n" +"as constants in the fcntl module, using the same names as used in\n" +"the relevant C header files. The argument arg is optional, and\n" +"defaults to 0; it may be an int or a string. If arg is given as a string,\n" +"the return value of fcntl is a string of that length, containing the\n" +"resulting value put in the arg buffer by the operating system. The length\n" +"of the arg string is not allowed to exceed 1024 bytes. 
If the arg given\n" +"is an integer or if none is specified, the result value is an integer\n" +"corresponding to the return value of the fcntl call in the C code."); + +#define FCNTL_FCNTL_METHODDEF \ + {"fcntl", (PyCFunction)fcntl_fcntl, METH_VARARGS, fcntl_fcntl__doc__}, + +static PyObject * +fcntl_fcntl_impl(PyModuleDef *module, int fd, int code, PyObject *arg); + +static PyObject * +fcntl_fcntl(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + PyObject *arg = NULL; + + if (!PyArg_ParseTuple(args, + "O&i|O:fcntl", + conv_descriptor, &fd, &code, &arg)) + goto exit; + return_value = fcntl_fcntl_impl(module, fd, code, arg); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_ioctl__doc__, +"ioctl($module, fd, op, arg=None, mutate_flag=True, /)\n" +"--\n" +"\n" +"Perform the operation op on file descriptor fd.\n" +"\n" +"The values used for op are operating system dependent, and are available as\n" +"constants in the fcntl or termios library modules, using the same names as\n" +"used in the relevant C header files.\n" +"\n" +"The argument `arg` is optional, and defaults to 0; it may be an int or a\n" +"buffer containing character data (most likely a string or an array).\n" +"\n" +"If the argument is a mutable buffer (such as an array) and if the\n" +"mutate_flag argument (which is only allowed in this case) is true then the\n" +"buffer is (in effect) passed to the operating system and changes made by\n" +"the OS will be reflected in the contents of the buffer after the call has\n" +"returned. The return value is the integer returned by the ioctl system\n" +"call.\n" +"\n" +"If the argument is a mutable buffer and the mutable_flag argument is not\n" +"passed or is false, the behavior is as if a string had been passed. This\n" +"behavior will change in future releases of Python.\n" +"\n" +"If the argument is an immutable buffer (most likely a string) then a copy\n" +"of the buffer is passed to the operating system and the return value is a\n" +"string of the same length containing whatever the operating system put in\n" +"the buffer. 
The length of the arg buffer in this case is not allowed to\n" +"exceed 1024 bytes.\n" +"\n" +"If the arg given is an integer or if none is specified, the result value is\n" +"an integer corresponding to the return value of the ioctl call in the C\n" +"code."); + +#define FCNTL_IOCTL_METHODDEF \ + {"ioctl", (PyCFunction)fcntl_ioctl, METH_VARARGS, fcntl_ioctl__doc__}, + +static PyObject * +fcntl_ioctl_impl(PyModuleDef *module, int fd, unsigned int code, PyObject *ob_arg, int mutate_arg); + +static PyObject * +fcntl_ioctl(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + unsigned int code; + PyObject *ob_arg = NULL; + int mutate_arg = 1; + + if (!PyArg_ParseTuple(args, + "O&I|Op:ioctl", + conv_descriptor, &fd, &code, &ob_arg, &mutate_arg)) + goto exit; + return_value = fcntl_ioctl_impl(module, fd, code, ob_arg, mutate_arg); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_flock__doc__, +"flock($module, fd, code, /)\n" +"--\n" +"\n" +"Perform the lock operation op on file descriptor fd.\n" +"\n" +"See the Unix manual page for flock(2) for details (On some systems, this\n" +"function is emulated using fcntl())."); + +#define FCNTL_FLOCK_METHODDEF \ + {"flock", (PyCFunction)fcntl_flock, METH_VARARGS, fcntl_flock__doc__}, + +static PyObject * +fcntl_flock_impl(PyModuleDef *module, int fd, int code); + +static PyObject * +fcntl_flock(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + + if (!PyArg_ParseTuple(args, + "O&i:flock", + conv_descriptor, &fd, &code)) + goto exit; + return_value = fcntl_flock_impl(module, fd, code); + +exit: + return return_value; +} + +PyDoc_STRVAR(fcntl_lockf__doc__, +"lockf($module, fd, code, lenobj=None, startobj=None, whence=0, /)\n" +"--\n" +"\n" +"A wrapper around the fcntl() locking calls.\n" +"\n" +"fd is the file descriptor of the file to lock or unlock, and operation is one\n" +"of the following values:\n" +"\n" +" LOCK_UN - unlock\n" +" LOCK_SH - acquire a shared lock\n" +" LOCK_EX - acquire an exclusive lock\n" +"\n" +"When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with\n" +"LOCK_NB to avoid blocking on lock acquisition. If LOCK_NB is used and the\n" +"lock cannot be acquired, an IOError will be raised and the exception will\n" +"have an errno attribute set to EACCES or EAGAIN (depending on the operating\n" +"system -- for portability, check for either value).\n" +"\n" +"length is the number of bytes to lock, with the default meaning to lock to\n" +"EOF. start is the byte offset, relative to whence, to that the lock\n" +"starts. 
whence is as with fileobj.seek(), specifically:\n" +"\n" +" 0 - relative to the start of the file (SEEK_SET)\n" +" 1 - relative to the current buffer position (SEEK_CUR)\n" +" 2 - relative to the end of the file (SEEK_END)"); + +#define FCNTL_LOCKF_METHODDEF \ + {"lockf", (PyCFunction)fcntl_lockf, METH_VARARGS, fcntl_lockf__doc__}, + +static PyObject * +fcntl_lockf_impl(PyModuleDef *module, int fd, int code, PyObject *lenobj, PyObject *startobj, int whence); + +static PyObject * +fcntl_lockf(PyModuleDef *module, PyObject *args) +{ + PyObject *return_value = NULL; + int fd; + int code; + PyObject *lenobj = NULL; + PyObject *startobj = NULL; + int whence = 0; + + if (!PyArg_ParseTuple(args, + "O&i|OOi:lockf", + conv_descriptor, &fd, &code, &lenobj, &startobj, &whence)) + goto exit; + return_value = fcntl_lockf_impl(module, fd, code, lenobj, startobj, whence); + +exit: + return return_value; +} +/*[clinic end generated code: output=84bdde73a92f7c61 input=a9049054013a1b77]*/ diff --git a/Modules/fcntlmodule.c b/Modules/fcntlmodule.c --- a/Modules/fcntlmodule.c +++ b/Modules/fcntlmodule.c @@ -15,6 +15,12 @@ #include #endif +/*[clinic input] +output preset file +module fcntl +[clinic start generated code]*/ +/*[clinic end generated code: output=da39a3ee5e6b4b0d input=c7356fdb126a904a]*/ + static int conv_descriptor(PyObject *object, int *target) { @@ -26,48 +32,72 @@ return 1; } +/* Must come after conv_descriptor definition. */ +#include "clinic/fcntlmodule.c.h" -/* fcntl(fd, op, [arg]) */ +/*[clinic input] +fcntl.fcntl + + fd: object(type='int', converter='conv_descriptor') + code: int + arg: object = NULL + / + +Perform the operation `code` on file descriptor fd. + +The values used for `code` are operating system dependent, and are available +as constants in the fcntl module, using the same names as used in +the relevant C header files. The argument arg is optional, and +defaults to 0; it may be an int or a string. If arg is given as a string, +the return value of fcntl is a string of that length, containing the +resulting value put in the arg buffer by the operating system. The length +of the arg string is not allowed to exceed 1024 bytes. If the arg given +is an integer or if none is specified, the result value is an integer +corresponding to the return value of the fcntl call in the C code. 
+[clinic start generated code]*/ static PyObject * -fcntl_fcntl(PyObject *self, PyObject *args) +fcntl_fcntl_impl(PyModuleDef *module, int fd, int code, PyObject *arg) +/*[clinic end generated code: output=afc5bfa74a03ef0d input=4850c13a41e86930]*/ { - int fd; - int code; - long arg; + int int_arg = 0; int ret; char *str; Py_ssize_t len; char buf[1024]; - if (PyArg_ParseTuple(args, "O&is#:fcntl", - conv_descriptor, &fd, &code, &str, &len)) { - if ((size_t)len > sizeof buf) { - PyErr_SetString(PyExc_ValueError, - "fcntl string arg too long"); - return NULL; + if (arg != NULL) { + int parse_result; + + if (PyArg_Parse(arg, "s#", &str, &len)) { + if ((size_t)len > sizeof buf) { + PyErr_SetString(PyExc_ValueError, + "fcntl string arg too long"); + return NULL; + } + memcpy(buf, str, len); + Py_BEGIN_ALLOW_THREADS + ret = fcntl(fd, code, buf); + Py_END_ALLOW_THREADS + if (ret < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + return PyBytes_FromStringAndSize(buf, len); } - memcpy(buf, str, len); - Py_BEGIN_ALLOW_THREADS - ret = fcntl(fd, code, buf); - Py_END_ALLOW_THREADS - if (ret < 0) { - PyErr_SetFromErrno(PyExc_IOError); - return NULL; + + PyErr_Clear(); + parse_result = PyArg_Parse(arg, + "l;fcntl requires a file or file descriptor," + " an integer and optionally a third integer or a string", + &int_arg); + if (!parse_result) { + return NULL; } - return PyBytes_FromStringAndSize(buf, len); } - PyErr_Clear(); - arg = 0; - if (!PyArg_ParseTuple(args, - "O&i|l;fcntl requires a file or file descriptor," - " an integer and optionally a third integer or a string", - conv_descriptor, &fd, &code, &arg)) { - return NULL; - } Py_BEGIN_ALLOW_THREADS - ret = fcntl(fd, code, arg); + ret = fcntl(fd, code, int_arg); Py_END_ALLOW_THREADS if (ret < 0) { PyErr_SetFromErrno(PyExc_IOError); @@ -76,29 +106,53 @@ return PyLong_FromLong((long)ret); } -PyDoc_STRVAR(fcntl_doc, -"fcntl(fd, op, [arg])\n\ -\n\ -Perform the operation op on file descriptor fd. The values used\n\ -for op are operating system dependent, and are available\n\ -as constants in the fcntl module, using the same names as used in\n\ -the relevant C header files. The argument arg is optional, and\n\ -defaults to 0; it may be an int or a string. If arg is given as a string,\n\ -the return value of fcntl is a string of that length, containing the\n\ -resulting value put in the arg buffer by the operating system. The length\n\ -of the arg string is not allowed to exceed 1024 bytes. If the arg given\n\ -is an integer or if none is specified, the result value is an integer\n\ -corresponding to the return value of the fcntl call in the C code."); +/*[clinic input] +fcntl.ioctl -/* ioctl(fd, op, [arg]) */ + fd: object(type='int', converter='conv_descriptor') + op as code: unsigned_int(bitwise=True) + arg as ob_arg: object = NULL + mutate_flag as mutate_arg: bool = True + / + +Perform the operation op on file descriptor fd. + +The values used for op are operating system dependent, and are available as +constants in the fcntl or termios library modules, using the same names as +used in the relevant C header files. + +The argument `arg` is optional, and defaults to 0; it may be an int or a +buffer containing character data (most likely a string or an array). 
+ +If the argument is a mutable buffer (such as an array) and if the +mutate_flag argument (which is only allowed in this case) is true then the +buffer is (in effect) passed to the operating system and changes made by +the OS will be reflected in the contents of the buffer after the call has +returned. The return value is the integer returned by the ioctl system +call. + +If the argument is a mutable buffer and the mutable_flag argument is not +passed or is false, the behavior is as if a string had been passed. This +behavior will change in future releases of Python. + +If the argument is an immutable buffer (most likely a string) then a copy +of the buffer is passed to the operating system and the return value is a +string of the same length containing whatever the operating system put in +the buffer. The length of the arg buffer in this case is not allowed to +exceed 1024 bytes. + +If the arg given is an integer or if none is specified, the result value is +an integer corresponding to the return value of the ioctl call in the C +code. +[clinic start generated code]*/ static PyObject * -fcntl_ioctl(PyObject *self, PyObject *args) +fcntl_ioctl_impl(PyModuleDef *module, int fd, unsigned int code, PyObject *ob_arg, int mutate_arg) +/*[clinic end generated code: output=ad47738c118622bf input=a55a6ee8e494c449]*/ { #define IOCTL_BUFSZ 1024 - int fd; - /* In PyArg_ParseTuple below, we use the unsigned non-checked 'I' + /* We use the unsigned non-checked 'I' format for the 'code' parameter because Python turns 0x8000000 into either a large positive number (PyLong or PyInt on 64-bit platforms) or a negative number on others (32-bit PyInt) @@ -111,101 +165,98 @@ in their unsigned long ioctl codes this will break and need special casing based on the platform being built on. 
*/ - unsigned int code; - int arg; + int arg = 0; int ret; Py_buffer pstr; char *str; Py_ssize_t len; - int mutate_arg = 1; char buf[IOCTL_BUFSZ+1]; /* argument plus NUL byte */ - if (PyArg_ParseTuple(args, "O&Iw*|i:ioctl", - conv_descriptor, &fd, &code, - &pstr, &mutate_arg)) { - char *arg; - str = pstr.buf; - len = pstr.len; + if (ob_arg != NULL) { + if (PyArg_Parse(ob_arg, "w*:ioctl", &pstr)) { + char *arg; + str = pstr.buf; + len = pstr.len; - if (mutate_arg) { - if (len <= IOCTL_BUFSZ) { - memcpy(buf, str, len); - buf[len] = '\0'; - arg = buf; + if (mutate_arg) { + if (len <= IOCTL_BUFSZ) { + memcpy(buf, str, len); + buf[len] = '\0'; + arg = buf; + } + else { + arg = str; + } } else { - arg = str; + if (len > IOCTL_BUFSZ) { + PyBuffer_Release(&pstr); + PyErr_SetString(PyExc_ValueError, + "ioctl string arg too long"); + return NULL; + } + else { + memcpy(buf, str, len); + buf[len] = '\0'; + arg = buf; + } + } + if (buf == arg) { + Py_BEGIN_ALLOW_THREADS /* think array.resize() */ + ret = ioctl(fd, code, arg); + Py_END_ALLOW_THREADS + } + else { + ret = ioctl(fd, code, arg); + } + if (mutate_arg && (len <= IOCTL_BUFSZ)) { + memcpy(str, buf, len); + } + PyBuffer_Release(&pstr); /* No further access to str below this point */ + if (ret < 0) { + PyErr_SetFromErrno(PyExc_IOError); + return NULL; + } + if (mutate_arg) { + return PyLong_FromLong(ret); + } + else { + return PyBytes_FromStringAndSize(buf, len); } } - else { + + PyErr_Clear(); + if (PyArg_Parse(ob_arg, "s*:ioctl", &pstr)) { + str = pstr.buf; + len = pstr.len; if (len > IOCTL_BUFSZ) { PyBuffer_Release(&pstr); PyErr_SetString(PyExc_ValueError, - "ioctl string arg too long"); + "ioctl string arg too long"); return NULL; } - else { - memcpy(buf, str, len); - buf[len] = '\0'; - arg = buf; + memcpy(buf, str, len); + buf[len] = '\0'; + Py_BEGIN_ALLOW_THREADS + ret = ioctl(fd, code, buf); + Py_END_ALLOW_THREADS + if (ret < 0) { + PyBuffer_Release(&pstr); + PyErr_SetFromErrno(PyExc_IOError); + return NULL; } - } - if (buf == arg) { - Py_BEGIN_ALLOW_THREADS /* think array.resize() */ - ret = ioctl(fd, code, arg); - Py_END_ALLOW_THREADS - } - else { - ret = ioctl(fd, code, arg); - } - if (mutate_arg && (len <= IOCTL_BUFSZ)) { - memcpy(str, buf, len); - } - PyBuffer_Release(&pstr); /* No further access to str below this point */ - if (ret < 0) { - PyErr_SetFromErrno(PyExc_IOError); - return NULL; - } - if (mutate_arg) { - return PyLong_FromLong(ret); - } - else { + PyBuffer_Release(&pstr); return PyBytes_FromStringAndSize(buf, len); } - } - PyErr_Clear(); - if (PyArg_ParseTuple(args, "O&Is*:ioctl", - conv_descriptor, &fd, &code, &pstr)) { - str = pstr.buf; - len = pstr.len; - if (len > IOCTL_BUFSZ) { - PyBuffer_Release(&pstr); - PyErr_SetString(PyExc_ValueError, - "ioctl string arg too long"); - return NULL; + PyErr_Clear(); + if (!PyArg_Parse(ob_arg, + "i;ioctl requires a file or file descriptor," + " an integer and optionally an integer or buffer argument", + &arg)) { + return NULL; } - memcpy(buf, str, len); - buf[len] = '\0'; - Py_BEGIN_ALLOW_THREADS - ret = ioctl(fd, code, buf); - Py_END_ALLOW_THREADS - if (ret < 0) { - PyBuffer_Release(&pstr); - PyErr_SetFromErrno(PyExc_IOError); - return NULL; - } - PyBuffer_Release(&pstr); - return PyBytes_FromStringAndSize(buf, len); - } - - PyErr_Clear(); - arg = 0; - if (!PyArg_ParseTuple(args, - "O&I|i;ioctl requires a file or file descriptor," - " an integer and optionally an integer or buffer argument", - conv_descriptor, &fd, &code, &arg)) { - return NULL; + // Fall-through to outside the 
'if' statement. } Py_BEGIN_ALLOW_THREADS ret = ioctl(fd, code, arg); @@ -218,52 +269,25 @@ #undef IOCTL_BUFSZ } -PyDoc_STRVAR(ioctl_doc, -"ioctl(fd, op[, arg[, mutate_flag]])\n\ -\n\ -Perform the operation op on file descriptor fd. The values used for op\n\ -are operating system dependent, and are available as constants in the\n\ -fcntl or termios library modules, using the same names as used in the\n\ -relevant C header files.\n\ -\n\ -The argument arg is optional, and defaults to 0; it may be an int or a\n\ -buffer containing character data (most likely a string or an array). \n\ -\n\ -If the argument is a mutable buffer (such as an array) and if the\n\ -mutate_flag argument (which is only allowed in this case) is true then the\n\ -buffer is (in effect) passed to the operating system and changes made by\n\ -the OS will be reflected in the contents of the buffer after the call has\n\ -returned. The return value is the integer returned by the ioctl system\n\ -call.\n\ -\n\ -If the argument is a mutable buffer and the mutable_flag argument is not\n\ -passed or is false, the behavior is as if a string had been passed. This\n\ -behavior will change in future releases of Python.\n\ -\n\ -If the argument is an immutable buffer (most likely a string) then a copy\n\ -of the buffer is passed to the operating system and the return value is a\n\ -string of the same length containing whatever the operating system put in\n\ -the buffer. The length of the arg buffer in this case is not allowed to\n\ -exceed 1024 bytes.\n\ -\n\ -If the arg given is an integer or if none is specified, the result value is\n\ -an integer corresponding to the return value of the ioctl call in the C\n\ -code."); +/*[clinic input] +fcntl.flock + fd: object(type='int', converter='conv_descriptor') + code: int + / -/* flock(fd, operation) */ +Perform the lock operation op on file descriptor fd. + +See the Unix manual page for flock(2) for details (On some systems, this +function is emulated using fcntl()). +[clinic start generated code]*/ static PyObject * -fcntl_flock(PyObject *self, PyObject *args) +fcntl_flock_impl(PyModuleDef *module, int fd, int code) +/*[clinic end generated code: output=c9035133a7dbfc96 input=b762aa9448d05e43]*/ { - int fd; - int code; int ret; - if (!PyArg_ParseTuple(args, "O&i:flock", - conv_descriptor, &fd, &code)) - return NULL; - #ifdef HAVE_FLOCK Py_BEGIN_ALLOW_THREADS ret = flock(fd, code); @@ -299,29 +323,49 @@ PyErr_SetFromErrno(PyExc_IOError); return NULL; } - Py_INCREF(Py_None); - return Py_None; + Py_RETURN_NONE; } -PyDoc_STRVAR(flock_doc, -"flock(fd, operation)\n\ -\n\ -Perform the lock operation op on file descriptor fd. See the Unix \n\ -manual page for flock(2) for details. (On some systems, this function is\n\ -emulated using fcntl().)"); +/*[clinic input] +fcntl.lockf -/* lockf(fd, operation) */ + fd: object(type='int', converter='conv_descriptor') + code: int + lenobj: object = NULL + startobj: object = NULL + whence: int = 0 + / + +A wrapper around the fcntl() locking calls. + +fd is the file descriptor of the file to lock or unlock, and operation is one +of the following values: + + LOCK_UN - unlock + LOCK_SH - acquire a shared lock + LOCK_EX - acquire an exclusive lock + +When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with +LOCK_NB to avoid blocking on lock acquisition. 
If LOCK_NB is used and the +lock cannot be acquired, an IOError will be raised and the exception will +have an errno attribute set to EACCES or EAGAIN (depending on the operating +system -- for portability, check for either value). + +length is the number of bytes to lock, with the default meaning to lock to +EOF. start is the byte offset, relative to whence, to that the lock +starts. whence is as with fileobj.seek(), specifically: + + 0 - relative to the start of the file (SEEK_SET) + 1 - relative to the current buffer position (SEEK_CUR) + 2 - relative to the end of the file (SEEK_END) +[clinic start generated code]*/ + static PyObject * -fcntl_lockf(PyObject *self, PyObject *args) +fcntl_lockf_impl(PyModuleDef *module, int fd, int code, PyObject *lenobj, PyObject *startobj, int whence) +/*[clinic end generated code: output=5536df2892bf3ce9 input=44856fa06db36184]*/ { - int fd, code, ret, whence = 0; - PyObject *lenobj = NULL, *startobj = NULL; - - if (!PyArg_ParseTuple(args, "O&i|OOi:lockf", - conv_descriptor, &fd, &code, - &lenobj, &startobj, &whence)) - return NULL; + int ret; #ifndef LOCK_SH #define LOCK_SH 1 /* shared lock */ @@ -374,43 +418,17 @@ PyErr_SetFromErrno(PyExc_IOError); return NULL; } - Py_INCREF(Py_None); - return Py_None; + Py_RETURN_NONE; } -PyDoc_STRVAR(lockf_doc, -"lockf (fd, operation, length=0, start=0, whence=0)\n\ -\n\ -This is essentially a wrapper around the fcntl() locking calls. fd is the\n\ -file descriptor of the file to lock or unlock, and operation is one of the\n\ -following values:\n\ -\n\ - LOCK_UN - unlock\n\ - LOCK_SH - acquire a shared lock\n\ - LOCK_EX - acquire an exclusive lock\n\ -\n\ -When operation is LOCK_SH or LOCK_EX, it can also be bitwise ORed with\n\ -LOCK_NB to avoid blocking on lock acquisition. If LOCK_NB is used and the\n\ -lock cannot be acquired, an IOError will be raised and the exception will\n\ -have an errno attribute set to EACCES or EAGAIN (depending on the operating\n\ -system -- for portability, check for either value).\n\ -\n\ -length is the number of bytes to lock, with the default meaning to lock to\n\ -EOF. start is the byte offset, relative to whence, to that the lock\n\ -starts. whence is as with fileobj.seek(), specifically:\n\ -\n\ - 0 - relative to the start of the file (SEEK_SET)\n\ - 1 - relative to the current buffer position (SEEK_CUR)\n\ - 2 - relative to the end of the file (SEEK_END)"); - /* List of functions */ static PyMethodDef fcntl_methods[] = { - {"fcntl", fcntl_fcntl, METH_VARARGS, fcntl_doc}, - {"ioctl", fcntl_ioctl, METH_VARARGS, ioctl_doc}, - {"flock", fcntl_flock, METH_VARARGS, flock_doc}, - {"lockf", fcntl_lockf, METH_VARARGS, lockf_doc}, - {NULL, NULL} /* sentinel */ + FCNTL_FCNTL_METHODDEF + FCNTL_IOCTL_METHODDEF + FCNTL_FLOCK_METHODDEF + FCNTL_LOCKF_METHODDEF + {NULL, NULL} /* sentinel */ }; diff --git a/Parser/asdl.py b/Parser/asdl.py --- a/Parser/asdl.py +++ b/Parser/asdl.py @@ -33,8 +33,7 @@ # See the EBNF at the top of the file to understand the logical connection # between the various node types. 
-builtin_types = set( - ['identifier', 'string', 'bytes', 'int', 'object', 'singleton']) +builtin_types = {'identifier', 'string', 'bytes', 'int', 'object', 'singleton'} class AST: def __repr__(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 10:29:55 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 09:29:55 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODIx?= =?utf-8?q?=3A_Fixed_fcntl=28=29_with_integer_argument_on_64-bit_big-endia?= =?utf-8?q?n?= Message-ID: <20141110092952.699.35208@psf.io> https://hg.python.org/cpython/rev/45e8aed69767 changeset: 93454:45e8aed69767 branch: 3.4 parent: 93444:63274cf1b40d user: Serhiy Storchaka date: Mon Nov 10 10:42:26 2014 +0200 summary: Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. files: Misc/NEWS | 3 +++ Modules/fcntlmodule.c | 4 ++-- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian + platforms. + - Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. diff --git a/Modules/fcntlmodule.c b/Modules/fcntlmodule.c --- a/Modules/fcntlmodule.c +++ b/Modules/fcntlmodule.c @@ -34,7 +34,7 @@ { int fd; int code; - long arg; + int arg; int ret; char *str; Py_ssize_t len; @@ -61,7 +61,7 @@ PyErr_Clear(); arg = 0; if (!PyArg_ParseTuple(args, - "O&i|l;fcntl requires a file or file descriptor," + "O&i|I;fcntl requires a file or file descriptor," " an integer and optionally a third integer or a string", conv_descriptor, &fd, &code, &arg)) { return NULL; -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 10:29:55 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 09:29:55 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322821=3A_Fixed_fcntl=28=29_with_integer_argumen?= =?utf-8?q?t_on_64-bit_big-endian?= Message-ID: <20141110092952.85202.88603@psf.io> https://hg.python.org/cpython/rev/2d203a0b7908 changeset: 93455:2d203a0b7908 parent: 93452:8111ee79d27c parent: 93454:45e8aed69767 user: Serhiy Storchaka date: Mon Nov 10 11:25:50 2014 +0200 summary: Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. files: Misc/NEWS | 3 +++ Modules/fcntlmodule.c | 6 +++--- 2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian + platforms. + - Issue #21650: Add an `--sort-keys` option to json.tool CLI. 
- Issues #814253, #9179: Group references and conditional group references now diff --git a/Modules/fcntlmodule.c b/Modules/fcntlmodule.c --- a/Modules/fcntlmodule.c +++ b/Modules/fcntlmodule.c @@ -60,7 +60,7 @@ fcntl_fcntl_impl(PyModuleDef *module, int fd, int code, PyObject *arg) /*[clinic end generated code: output=afc5bfa74a03ef0d input=4850c13a41e86930]*/ { - int int_arg = 0; + unsigned int int_arg = 0; int ret; char *str; Py_ssize_t len; @@ -88,7 +88,7 @@ PyErr_Clear(); parse_result = PyArg_Parse(arg, - "l;fcntl requires a file or file descriptor," + "I;fcntl requires a file or file descriptor," " an integer and optionally a third integer or a string", &int_arg); if (!parse_result) { @@ -97,7 +97,7 @@ } Py_BEGIN_ALLOW_THREADS - ret = fcntl(fd, code, int_arg); + ret = fcntl(fd, code, (int)int_arg); Py_END_ALLOW_THREADS if (ret < 0) { PyErr_SetFromErrno(PyExc_IOError); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 10:29:55 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 09:29:55 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyODIx?= =?utf-8?q?=3A_Fixed_fcntl=28=29_with_integer_argument_on_64-bit_big-endia?= =?utf-8?q?n?= Message-ID: <20141110092952.113476.92406@psf.io> https://hg.python.org/cpython/rev/61e99438c237 changeset: 93453:61e99438c237 branch: 2.7 parent: 93448:3a8e0a5359cf user: Serhiy Storchaka date: Mon Nov 10 10:42:06 2014 +0200 summary: Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. files: Misc/NEWS | 3 +++ Modules/fcntlmodule.c | 4 ++-- 2 files changed, 5 insertions(+), 2 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian + platforms. + - Issues #814253, #9179: Group references and conditional group references now work in lookbehind assertions in regular expressions. 
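The hazard behind issue #22821 is a width mismatch between the long that was being parsed and the int that fcntl(2) actually takes; whether such a mismatch is harmless depends on byte order. A rough illustration with the struct module (not part of the changeset, and only a sketch of the byte-order effect rather than the exact C code path):

    import struct

    # Big-endian: the significant byte of the 64-bit value 1 sits in the
    # *last* four bytes, so a 32-bit read of the first word sees zero.
    struct.unpack('>i', struct.pack('>q', 1)[:4])[0]   # 0 -- value appears lost

    # Little-endian: the significant byte comes first, so a 32-bit read
    # still yields the expected value, which is why the bug stayed hidden
    # on little-endian builds.
    struct.unpack('<i', struct.pack('<q', 1)[:4])[0]   # 1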
diff --git a/Modules/fcntlmodule.c b/Modules/fcntlmodule.c --- a/Modules/fcntlmodule.c +++ b/Modules/fcntlmodule.c @@ -34,7 +34,7 @@ { int fd; int code; - long arg; + int arg; int ret; char *str; Py_ssize_t len; @@ -61,7 +61,7 @@ PyErr_Clear(); arg = 0; if (!PyArg_ParseTuple(args, - "O&i|l;fcntl requires a file or file descriptor," + "O&i|I;fcntl requires a file or file descriptor," " an integer and optionally a third integer or a string", conv_descriptor, &fd, &code, &arg)) { return NULL; -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Mon Nov 10 10:32:00 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Mon, 10 Nov 2014 10:32:00 +0100 Subject: [Python-checkins] Daily reference leaks (55b89e5f9c37): sum=3 Message-ID: results for 55b89e5f9c37 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogocLb0X', '-x'] From python-checkins at python.org Mon Nov 10 11:47:06 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 10:47:06 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzEyNzI4?= =?utf-8?q?=3A_Different_Unicode_characters_having_the_same_uppercase_but?= Message-ID: <20141110104704.108389.60853@psf.io> https://hg.python.org/cpython/rev/47b3084dd6aa changeset: 93457:47b3084dd6aa branch: 3.4 parent: 93454:45e8aed69767 user: Serhiy Storchaka date: Mon Nov 10 12:37:16 2014 +0200 summary: Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. files: Lib/sre_compile.py | 92 +++++++++++++++++++++++++++++--- Lib/test/test_re.py | 51 ++++++++++++++++++ Misc/NEWS | 3 + 3 files changed, 135 insertions(+), 11 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -27,6 +27,46 @@ _SUCCESS_CODES = set([SUCCESS, FAILURE]) _ASSERT_CODES = set([ASSERT, ASSERT_NOT]) +# Sets of lowercase characters which have the same uppercase. +_equivalences = ( + # LATIN SMALL LETTER I, LATIN SMALL LETTER DOTLESS I + (0x69, 0x131), # i? + # LATIN SMALL LETTER S, LATIN SMALL LETTER LONG S + (0x73, 0x17f), # s? + # MICRO SIGN, GREEK SMALL LETTER MU + (0xb5, 0x3bc), # ?? + # COMBINING GREEK YPOGEGRAMMENI, GREEK SMALL LETTER IOTA, GREEK PROSGEGRAMMENI + (0x345, 0x3b9, 0x1fbe), # \u0345?? + # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS, GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA + (0x390, 0x1fd3), # ?? + # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS, GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA + (0x3b0, 0x1fe3), # ?? + # GREEK SMALL LETTER BETA, GREEK BETA SYMBOL + (0x3b2, 0x3d0), # ?? + # GREEK SMALL LETTER EPSILON, GREEK LUNATE EPSILON SYMBOL + (0x3b5, 0x3f5), # ?? + # GREEK SMALL LETTER THETA, GREEK THETA SYMBOL + (0x3b8, 0x3d1), # ?? + # GREEK SMALL LETTER KAPPA, GREEK KAPPA SYMBOL + (0x3ba, 0x3f0), # ?? + # GREEK SMALL LETTER PI, GREEK PI SYMBOL + (0x3c0, 0x3d6), # ?? + # GREEK SMALL LETTER RHO, GREEK RHO SYMBOL + (0x3c1, 0x3f1), # ?? + # GREEK SMALL LETTER FINAL SIGMA, GREEK SMALL LETTER SIGMA + (0x3c2, 0x3c3), # ?? + # GREEK SMALL LETTER PHI, GREEK PHI SYMBOL + (0x3c6, 0x3d5), # ?? + # LATIN SMALL LETTER S WITH DOT ABOVE, LATIN SMALL LETTER LONG S WITH DOT ABOVE + (0x1e61, 0x1e9b), # ?? + # LATIN SMALL LIGATURE LONG S T, LATIN SMALL LIGATURE ST + (0xfb05, 0xfb06), # ?? 
+) + +# Maps the lowercase code to lowercase codes which have the same uppercase. +_ignorecase_fixes = {i: tuple(j for j in t if i != j) + for t in _equivalences for i in t} + def _compile(code, pattern, flags): # internal: compile a (sub)pattern emit = code.append @@ -35,11 +75,29 @@ REPEATING_CODES = _REPEATING_CODES SUCCESS_CODES = _SUCCESS_CODES ASSERT_CODES = _ASSERT_CODES + if (flags & SRE_FLAG_IGNORECASE and + not (flags & SRE_FLAG_LOCALE) and + flags & SRE_FLAG_UNICODE): + fixes = _ignorecase_fixes + else: + fixes = None for op, av in pattern: if op in LITERAL_CODES: if flags & SRE_FLAG_IGNORECASE: - emit(OPCODES[OP_IGNORE[op]]) - emit(_sre.getlower(av, flags)) + lo = _sre.getlower(av, flags) + if fixes and lo in fixes: + emit(OPCODES[IN_IGNORE]) + skip = _len(code); emit(0) + if op is NOT_LITERAL: + emit(OPCODES[NEGATE]) + for k in (lo,) + fixes[lo]: + emit(OPCODES[LITERAL]) + emit(k) + emit(OPCODES[FAILURE]) + code[skip] = _len(code) - skip + else: + emit(OPCODES[OP_IGNORE[op]]) + emit(lo) else: emit(OPCODES[op]) emit(av) @@ -52,7 +110,7 @@ emit(OPCODES[op]) fixup = None skip = _len(code); emit(0) - _compile_charset(av, flags, code, fixup) + _compile_charset(av, flags, code, fixup, fixes) code[skip] = _len(code) - skip elif op is ANY: if flags & SRE_FLAG_DOTALL: @@ -166,10 +224,11 @@ else: raise ValueError("unsupported operand type", op) -def _compile_charset(charset, flags, code, fixup=None): +def _compile_charset(charset, flags, code, fixup=None, fixes=None): # compile charset subprogram emit = code.append - for op, av in _optimize_charset(charset, fixup, flags & SRE_FLAG_UNICODE): + for op, av in _optimize_charset(charset, fixup, fixes, + flags & SRE_FLAG_UNICODE): emit(OPCODES[op]) if op is NEGATE: pass @@ -193,7 +252,7 @@ raise error("internal: unsupported set operator") emit(OPCODES[FAILURE]) -def _optimize_charset(charset, fixup, isunicode): +def _optimize_charset(charset, fixup, fixes, isunicode): # internal: optimize character set out = [] tail = [] @@ -202,16 +261,27 @@ while True: try: if op is LITERAL: - i = av if fixup: - i = fixup(i) - charmap[i] = 1 + i = fixup(av) + charmap[i] = 1 + if fixes and i in fixes: + for k in fixes[i]: + charmap[k] = 1 + else: + charmap[av] = 1 elif op is RANGE: r = range(av[0], av[1]+1) if fixup: r = map(fixup, r) - for i in r: - charmap[i] = 1 + if fixup and fixes: + for i in r: + charmap[i] = 1 + if i in fixes: + for k in fixes[i]: + charmap[k] = 1 + else: + for i in r: + charmap[i] = 1 elif op is NEGATE: out.append((op, av)) else: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -619,6 +619,43 @@ self.assertEqual(re.match(r"((a)\s(abc|a))", "a a", re.I).group(1), "a a") self.assertEqual(re.match(r"((a)\s(abc|a)*)", "a aa", re.I).group(1), "a aa") + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'K', '\u212a', re.I)) + self.assertTrue(re.match(r'k', '\u212a', re.I)) + self.assertTrue(re.match(r'\u212a', 'K', re.I)) + self.assertTrue(re.match(r'\u212a', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'S', '\u017f', re.I)) + self.assertTrue(re.match(r's', '\u017f', re.I)) + self.assertTrue(re.match(r'\u017f', 'S', re.I)) + self.assertTrue(re.match(r'\u017f', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' 
+ self.assertTrue(re.match(r'\ufb05', '\ufb06', re.I)) + self.assertTrue(re.match(r'\ufb06', '\ufb05', re.I)) + + def test_ignore_case_set(self): + self.assertTrue(re.match(r'[19A]', 'A', re.I)) + self.assertTrue(re.match(r'[19a]', 'a', re.I)) + self.assertTrue(re.match(r'[19a]', 'A', re.I)) + self.assertTrue(re.match(r'[19A]', 'a', re.I)) + self.assertTrue(re.match(br'[19A]', b'A', re.I)) + self.assertTrue(re.match(br'[19a]', b'a', re.I)) + self.assertTrue(re.match(br'[19a]', b'A', re.I)) + self.assertTrue(re.match(br'[19A]', b'a', re.I)) + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'[19K]', '\u212a', re.I)) + self.assertTrue(re.match(r'[19k]', '\u212a', re.I)) + self.assertTrue(re.match(r'[19\u212a]', 'K', re.I)) + self.assertTrue(re.match(r'[19\u212a]', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'[19S]', '\u017f', re.I)) + self.assertTrue(re.match(r'[19s]', '\u017f', re.I)) + self.assertTrue(re.match(r'[19\u017f]', 'S', re.I)) + self.assertTrue(re.match(r'[19\u017f]', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' + self.assertTrue(re.match(r'[19\ufb05]', '\ufb06', re.I)) + self.assertTrue(re.match(r'[19\ufb06]', '\ufb05', re.I)) + def test_ignore_case_range(self): # Issues #3511, #17381. self.assertTrue(re.match(r'[9-a]', '_', re.I)) @@ -638,6 +675,20 @@ self.assertTrue(re.match(r'[\U00010400-\U00010427]', '\U00010428', re.I)) self.assertTrue(re.match(r'[\U00010400-\U00010427]', '\U00010400', re.I)) + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'[J-M]', '\u212a', re.I)) + self.assertTrue(re.match(r'[j-m]', '\u212a', re.I)) + self.assertTrue(re.match(r'[\u2129-\u212b]', 'K', re.I)) + self.assertTrue(re.match(r'[\u2129-\u212b]', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'[R-T]', '\u017f', re.I)) + self.assertTrue(re.match(r'[r-t]', '\u017f', re.I)) + self.assertTrue(re.match(r'[\u017e-\u0180]', 'S', re.I)) + self.assertTrue(re.match(r'[\u017e-\u0180]', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' + self.assertTrue(re.match(r'[\ufb04-\ufb05]', '\ufb06', re.I)) + self.assertTrue(re.match(r'[\ufb06-\ufb07]', '\ufb05', re.I)) + def test_category(self): self.assertEqual(re.match(r"(\s)", " ").group(1), " ") diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #12728: Different Unicode characters having the same uppercase but + different lowercase are now matched in case-insensitive regular expressions. + - Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 11:47:06 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 10:47:06 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzEyNzI4?= =?utf-8?q?=3A_Different_Unicode_characters_having_the_same_uppercase_but?= Message-ID: <20141110104703.108089.3658@psf.io> https://hg.python.org/cpython/rev/4caa695af94c changeset: 93456:4caa695af94c branch: 2.7 parent: 93453:61e99438c237 user: Serhiy Storchaka date: Mon Nov 10 12:37:02 2014 +0200 summary: Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. 
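The effect of issue #12728 can be seen directly from the test additions above; a brief interactive sketch (requires an interpreter that already contains this change, values taken from the new tests):

    import re

    '\u212a'.lower()                    # 'k'  (KELVIN SIGN)
    '\u017f'.upper()                    # 'S'  (LATIN SMALL LETTER LONG S)

    # Characters that share an uppercase form now match under
    # re.IGNORECASE, both as literals and inside character sets:
    re.match(r'K', '\u212a', re.I)      # matches
    re.match(r'\u017f', 'S', re.I)      # matches
    re.match(r'[19K]', '\u212a', re.I)  # matches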
files: Lib/sre_compile.py | 87 ++++++++++++++++++++++++++++---- Lib/test/test_re.py | 45 +++++++++++++++++ Misc/NEWS | 3 + 3 files changed, 124 insertions(+), 11 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -1,3 +1,4 @@ +# -*- coding: utf-8 -*- # # Secret Labs' Regular Expression Engine # @@ -26,6 +27,40 @@ _SUCCESS_CODES = set([SUCCESS, FAILURE]) _ASSERT_CODES = set([ASSERT, ASSERT_NOT]) +# Sets of lowercase characters which have the same uppercase. +_equivalences = ( + # LATIN SMALL LETTER I, LATIN SMALL LETTER DOTLESS I + (0x69, 0x131), # i? + # LATIN SMALL LETTER S, LATIN SMALL LETTER LONG S + (0x73, 0x17f), # s? + # MICRO SIGN, GREEK SMALL LETTER MU + (0xb5, 0x3bc), # ?? + # COMBINING GREEK YPOGEGRAMMENI, GREEK SMALL LETTER IOTA, GREEK PROSGEGRAMMENI + (0x345, 0x3b9, 0x1fbe), # \u0345?? + # GREEK SMALL LETTER BETA, GREEK BETA SYMBOL + (0x3b2, 0x3d0), # ?? + # GREEK SMALL LETTER EPSILON, GREEK LUNATE EPSILON SYMBOL + (0x3b5, 0x3f5), # ?? + # GREEK SMALL LETTER THETA, GREEK THETA SYMBOL + (0x3b8, 0x3d1), # ?? + # GREEK SMALL LETTER KAPPA, GREEK KAPPA SYMBOL + (0x3ba, 0x3f0), # ?? + # GREEK SMALL LETTER PI, GREEK PI SYMBOL + (0x3c0, 0x3d6), # ?? + # GREEK SMALL LETTER RHO, GREEK RHO SYMBOL + (0x3c1, 0x3f1), # ?? + # GREEK SMALL LETTER FINAL SIGMA, GREEK SMALL LETTER SIGMA + (0x3c2, 0x3c3), # ?? + # GREEK SMALL LETTER PHI, GREEK PHI SYMBOL + (0x3c6, 0x3d5), # ?? + # LATIN SMALL LETTER S WITH DOT ABOVE, LATIN SMALL LETTER LONG S WITH DOT ABOVE + (0x1e61, 0x1e9b), # ?? +) + +# Maps the lowercase code to lowercase codes which have the same uppercase. +_ignorecase_fixes = {i: tuple(j for j in t if i != j) + for t in _equivalences for i in t} + def _compile(code, pattern, flags): # internal: compile a (sub)pattern emit = code.append @@ -34,11 +69,29 @@ REPEATING_CODES = _REPEATING_CODES SUCCESS_CODES = _SUCCESS_CODES ASSERT_CODES = _ASSERT_CODES + if (flags & SRE_FLAG_IGNORECASE and + not (flags & SRE_FLAG_LOCALE) and + flags & SRE_FLAG_UNICODE): + fixes = _ignorecase_fixes + else: + fixes = None for op, av in pattern: if op in LITERAL_CODES: if flags & SRE_FLAG_IGNORECASE: - emit(OPCODES[OP_IGNORE[op]]) - emit(_sre.getlower(av, flags)) + lo = _sre.getlower(av, flags) + if fixes and lo in fixes: + emit(OPCODES[IN_IGNORE]) + skip = _len(code); emit(0) + if op is NOT_LITERAL: + emit(OPCODES[NEGATE]) + for k in (lo,) + fixes[lo]: + emit(OPCODES[LITERAL]) + emit(k) + emit(OPCODES[FAILURE]) + code[skip] = _len(code) - skip + else: + emit(OPCODES[OP_IGNORE[op]]) + emit(lo) else: emit(OPCODES[op]) emit(av) @@ -51,7 +104,7 @@ emit(OPCODES[op]) fixup = None skip = _len(code); emit(0) - _compile_charset(av, flags, code, fixup) + _compile_charset(av, flags, code, fixup, fixes) code[skip] = _len(code) - skip elif op is ANY: if flags & SRE_FLAG_DOTALL: @@ -172,10 +225,11 @@ else: raise ValueError, ("unsupported operand type", op) -def _compile_charset(charset, flags, code, fixup=None): +def _compile_charset(charset, flags, code, fixup=None, fixes=None): # compile charset subprogram emit = code.append - for op, av in _optimize_charset(charset, fixup, flags & SRE_FLAG_UNICODE): + for op, av in _optimize_charset(charset, fixup, fixes, + flags & SRE_FLAG_UNICODE): emit(OPCODES[op]) if op is NEGATE: pass @@ -199,7 +253,7 @@ raise error, "internal: unsupported set operator" emit(OPCODES[FAILURE]) -def _optimize_charset(charset, fixup, isunicode): +def _optimize_charset(charset, fixup, fixes, isunicode): # internal: optimize character set 
out = [] tail = [] @@ -208,16 +262,27 @@ while True: try: if op is LITERAL: - i = av if fixup: - i = fixup(i) - charmap[i] = 1 + i = fixup(av) + charmap[i] = 1 + if fixes and i in fixes: + for k in fixes[i]: + charmap[k] = 1 + else: + charmap[av] = 1 elif op is RANGE: r = range(av[0], av[1]+1) if fixup: r = map(fixup, r) - for i in r: - charmap[i] = 1 + if fixup and fixes: + for i in r: + charmap[i] = 1 + if i in fixes: + for k in fixes[i]: + charmap[k] = 1 + else: + for i in r: + charmap[i] = 1 elif op is NEGATE: out.append((op, av)) else: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -1,3 +1,4 @@ +# -*- coding: utf-8 -*- from test.test_support import verbose, run_unittest, import_module from test.test_support import precisionbigmemtest, _2G, cpython_only from test.test_support import captured_stdout, have_unicode, requires_unicode, u @@ -510,6 +511,39 @@ self.assertEqual(re.match(r"((a)\s(abc|a))", "a a", re.I).group(1), "a a") self.assertEqual(re.match(r"((a)\s(abc|a)*)", "a aa", re.I).group(1), "a aa") + if have_unicode: + assert u(r'\u212a').lower() == u'k' # '?' + self.assertTrue(re.match(ur'K', u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(ur'k', u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(u(r'\u212a'), u'K', re.U | re.I)) + self.assertTrue(re.match(u(r'\u212a'), u'k', re.U | re.I)) + assert u(r'\u017f').upper() == u'S' # '?' + self.assertTrue(re.match(ur'S', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(ur's', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(u(r'\u017f'), u'S', re.U | re.I)) + self.assertTrue(re.match(u(r'\u017f'), u's', re.U | re.I)) + + def test_ignore_case_set(self): + self.assertTrue(re.match(r'[19A]', 'A', re.I)) + self.assertTrue(re.match(r'[19a]', 'a', re.I)) + self.assertTrue(re.match(r'[19a]', 'A', re.I)) + self.assertTrue(re.match(r'[19A]', 'a', re.I)) + if have_unicode: + self.assertTrue(re.match(ur'[19A]', u'A', re.U | re.I)) + self.assertTrue(re.match(ur'[19a]', u'a', re.U | re.I)) + self.assertTrue(re.match(ur'[19a]', u'A', re.U | re.I)) + self.assertTrue(re.match(ur'[19A]', u'a', re.U | re.I)) + assert u(r'\u212a').lower() == u'k' # '?' + self.assertTrue(re.match(u(r'[19K]'), u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(u(r'[19k]'), u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(u(r'[19\u212a]'), u'K', re.U | re.I)) + self.assertTrue(re.match(u(r'[19\u212a]'), u'k', re.U | re.I)) + assert u(r'\u017f').upper() == u'S' # '?' + self.assertTrue(re.match(ur'[19S]', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(ur'[19s]', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(u(r'[19\u017f]'), u'S', re.U | re.I)) + self.assertTrue(re.match(u(r'[19\u017f]'), u's', re.U | re.I)) + def test_ignore_case_range(self): # Issues #3511, #17381. self.assertTrue(re.match(r'[9-a]', '_', re.I)) @@ -547,6 +581,17 @@ self.assertTrue(re.match(u(r'[\U00010400-\U00010427]'), u(r'\U00010400'), re.U | re.I)) + assert u(r'\u212a').lower() == u'k' # '?' + self.assertTrue(re.match(ur'[J-M]', u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(ur'[j-m]', u(r'\u212a'), re.U | re.I)) + self.assertTrue(re.match(u(r'[\u2129-\u212b]'), u'K', re.U | re.I)) + self.assertTrue(re.match(u(r'[\u2129-\u212b]'), u'k', re.U | re.I)) + assert u(r'\u017f').upper() == u'S' # '?' 
+ self.assertTrue(re.match(ur'[R-T]', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(ur'[r-t]', u(r'\u017f'), re.U | re.I)) + self.assertTrue(re.match(u(r'[\u017e-\u0180]'), u'S', re.U | re.I)) + self.assertTrue(re.match(u(r'[\u017e-\u0180]'), u's', re.U | re.I)) + def test_category(self): self.assertEqual(re.match(r"(\s)", " ").group(1), " ") diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -37,6 +37,9 @@ Library ------- +- Issue #12728: Different Unicode characters having the same uppercase but + different lowercase are now matched in case-insensitive regular expressions. + - Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 11:47:06 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 10:47:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2312728=3A_Different_Unicode_characters_having_th?= =?utf-8?q?e_same_uppercase_but?= Message-ID: <20141110104704.108367.88825@psf.io> https://hg.python.org/cpython/rev/09ec09cfe539 changeset: 93458:09ec09cfe539 parent: 93455:2d203a0b7908 parent: 93457:47b3084dd6aa user: Serhiy Storchaka date: Mon Nov 10 12:43:14 2014 +0200 summary: Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. files: Lib/sre_compile.py | 90 +++++++++++++++++++++++++++++--- Lib/test/test_re.py | 51 ++++++++++++++++++ Misc/NEWS | 3 + 3 files changed, 134 insertions(+), 10 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -26,6 +26,46 @@ _SUCCESS_CODES = {SUCCESS, FAILURE} _ASSERT_CODES = {ASSERT, ASSERT_NOT} +# Sets of lowercase characters which have the same uppercase. +_equivalences = ( + # LATIN SMALL LETTER I, LATIN SMALL LETTER DOTLESS I + (0x69, 0x131), # i? + # LATIN SMALL LETTER S, LATIN SMALL LETTER LONG S + (0x73, 0x17f), # s? + # MICRO SIGN, GREEK SMALL LETTER MU + (0xb5, 0x3bc), # ?? + # COMBINING GREEK YPOGEGRAMMENI, GREEK SMALL LETTER IOTA, GREEK PROSGEGRAMMENI + (0x345, 0x3b9, 0x1fbe), # \u0345?? + # GREEK SMALL LETTER IOTA WITH DIALYTIKA AND TONOS, GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA + (0x390, 0x1fd3), # ?? + # GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND TONOS, GREEK SMALL LETTER UPSILON WITH DIALYTIKA AND OXIA + (0x3b0, 0x1fe3), # ?? + # GREEK SMALL LETTER BETA, GREEK BETA SYMBOL + (0x3b2, 0x3d0), # ?? + # GREEK SMALL LETTER EPSILON, GREEK LUNATE EPSILON SYMBOL + (0x3b5, 0x3f5), # ?? + # GREEK SMALL LETTER THETA, GREEK THETA SYMBOL + (0x3b8, 0x3d1), # ?? + # GREEK SMALL LETTER KAPPA, GREEK KAPPA SYMBOL + (0x3ba, 0x3f0), # ?? + # GREEK SMALL LETTER PI, GREEK PI SYMBOL + (0x3c0, 0x3d6), # ?? + # GREEK SMALL LETTER RHO, GREEK RHO SYMBOL + (0x3c1, 0x3f1), # ?? + # GREEK SMALL LETTER FINAL SIGMA, GREEK SMALL LETTER SIGMA + (0x3c2, 0x3c3), # ?? + # GREEK SMALL LETTER PHI, GREEK PHI SYMBOL + (0x3c6, 0x3d5), # ?? + # LATIN SMALL LETTER S WITH DOT ABOVE, LATIN SMALL LETTER LONG S WITH DOT ABOVE + (0x1e61, 0x1e9b), # ?? + # LATIN SMALL LIGATURE LONG S T, LATIN SMALL LIGATURE ST + (0xfb05, 0xfb06), # ?? +) + +# Maps the lowercase code to lowercase codes which have the same uppercase. 
+_ignorecase_fixes = {i: tuple(j for j in t if i != j) + for t in _equivalences for i in t} + def _compile(code, pattern, flags): # internal: compile a (sub)pattern emit = code.append @@ -34,11 +74,29 @@ REPEATING_CODES = _REPEATING_CODES SUCCESS_CODES = _SUCCESS_CODES ASSERT_CODES = _ASSERT_CODES + if (flags & SRE_FLAG_IGNORECASE and + not (flags & SRE_FLAG_LOCALE) and + flags & SRE_FLAG_UNICODE): + fixes = _ignorecase_fixes + else: + fixes = None for op, av in pattern: if op in LITERAL_CODES: if flags & SRE_FLAG_IGNORECASE: - emit(OP_IGNORE[op]) - emit(_sre.getlower(av, flags)) + lo = _sre.getlower(av, flags) + if fixes and lo in fixes: + emit(IN_IGNORE) + skip = _len(code); emit(0) + if op is NOT_LITERAL: + emit(NEGATE) + for k in (lo,) + fixes[lo]: + emit(LITERAL) + emit(k) + emit(FAILURE) + code[skip] = _len(code) - skip + else: + emit(OP_IGNORE[op]) + emit(lo) else: emit(op) emit(av) @@ -51,7 +109,7 @@ emit(op) fixup = None skip = _len(code); emit(0) - _compile_charset(av, flags, code, fixup) + _compile_charset(av, flags, code, fixup, fixes) code[skip] = _len(code) - skip elif op is ANY: if flags & SRE_FLAG_DOTALL: @@ -165,10 +223,10 @@ else: raise ValueError("unsupported operand type", op) -def _compile_charset(charset, flags, code, fixup=None): +def _compile_charset(charset, flags, code, fixup=None, fixes=None): # compile charset subprogram emit = code.append - for op, av in _optimize_charset(charset, fixup): + for op, av in _optimize_charset(charset, fixup, fixes): emit(op) if op is NEGATE: pass @@ -192,7 +250,7 @@ raise error("internal: unsupported set operator") emit(FAILURE) -def _optimize_charset(charset, fixup): +def _optimize_charset(charset, fixup, fixes): # internal: optimize character set out = [] tail = [] @@ -202,14 +260,26 @@ try: if op is LITERAL: if fixup: - av = fixup(av) - charmap[av] = 1 + lo = fixup(av) + charmap[lo] = 1 + if fixes and lo in fixes: + for k in fixes[lo]: + charmap[k] = 1 + else: + charmap[av] = 1 elif op is RANGE: r = range(av[0], av[1]+1) if fixup: r = map(fixup, r) - for i in r: - charmap[i] = 1 + if fixup and fixes: + for i in r: + charmap[i] = 1 + if i in fixes: + for k in fixes[i]: + charmap[k] = 1 + else: + for i in r: + charmap[i] = 1 elif op is NEGATE: out.append((op, av)) else: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -637,6 +637,43 @@ self.assertEqual(re.match(r"((a)\s(abc|a))", "a a", re.I).group(1), "a a") self.assertEqual(re.match(r"((a)\s(abc|a)*)", "a aa", re.I).group(1), "a aa") + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'K', '\u212a', re.I)) + self.assertTrue(re.match(r'k', '\u212a', re.I)) + self.assertTrue(re.match(r'\u212a', 'K', re.I)) + self.assertTrue(re.match(r'\u212a', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'S', '\u017f', re.I)) + self.assertTrue(re.match(r's', '\u017f', re.I)) + self.assertTrue(re.match(r'\u017f', 'S', re.I)) + self.assertTrue(re.match(r'\u017f', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' 
+ self.assertTrue(re.match(r'\ufb05', '\ufb06', re.I)) + self.assertTrue(re.match(r'\ufb06', '\ufb05', re.I)) + + def test_ignore_case_set(self): + self.assertTrue(re.match(r'[19A]', 'A', re.I)) + self.assertTrue(re.match(r'[19a]', 'a', re.I)) + self.assertTrue(re.match(r'[19a]', 'A', re.I)) + self.assertTrue(re.match(r'[19A]', 'a', re.I)) + self.assertTrue(re.match(br'[19A]', b'A', re.I)) + self.assertTrue(re.match(br'[19a]', b'a', re.I)) + self.assertTrue(re.match(br'[19a]', b'A', re.I)) + self.assertTrue(re.match(br'[19A]', b'a', re.I)) + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'[19K]', '\u212a', re.I)) + self.assertTrue(re.match(r'[19k]', '\u212a', re.I)) + self.assertTrue(re.match(r'[19\u212a]', 'K', re.I)) + self.assertTrue(re.match(r'[19\u212a]', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'[19S]', '\u017f', re.I)) + self.assertTrue(re.match(r'[19s]', '\u017f', re.I)) + self.assertTrue(re.match(r'[19\u017f]', 'S', re.I)) + self.assertTrue(re.match(r'[19\u017f]', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' + self.assertTrue(re.match(r'[19\ufb05]', '\ufb06', re.I)) + self.assertTrue(re.match(r'[19\ufb06]', '\ufb05', re.I)) + def test_ignore_case_range(self): # Issues #3511, #17381. self.assertTrue(re.match(r'[9-a]', '_', re.I)) @@ -656,6 +693,20 @@ self.assertTrue(re.match(r'[\U00010400-\U00010427]', '\U00010428', re.I)) self.assertTrue(re.match(r'[\U00010400-\U00010427]', '\U00010400', re.I)) + assert '\u212a'.lower() == 'k' # '?' + self.assertTrue(re.match(r'[J-M]', '\u212a', re.I)) + self.assertTrue(re.match(r'[j-m]', '\u212a', re.I)) + self.assertTrue(re.match(r'[\u2129-\u212b]', 'K', re.I)) + self.assertTrue(re.match(r'[\u2129-\u212b]', 'k', re.I)) + assert '\u017f'.upper() == 'S' # '?' + self.assertTrue(re.match(r'[R-T]', '\u017f', re.I)) + self.assertTrue(re.match(r'[r-t]', '\u017f', re.I)) + self.assertTrue(re.match(r'[\u017e-\u0180]', 'S', re.I)) + self.assertTrue(re.match(r'[\u017e-\u0180]', 's', re.I)) + assert '\ufb05'.upper() == '\ufb06'.upper() == 'ST' # '?', '?' + self.assertTrue(re.match(r'[\ufb04-\ufb05]', '\ufb06', re.I)) + self.assertTrue(re.match(r'[\ufb06-\ufb07]', '\ufb05', re.I)) + def test_category(self): self.assertEqual(re.match(r"(\s)", " ").group(1), " ") diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #12728: Different Unicode characters having the same uppercase but + different lowercase are now matched in case-insensitive regular expressions. + - Issue #22821: Fixed fcntl() with integer argument on 64-bit big-endian platforms. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 12:27:36 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 11:27:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Got_rid_of_the_array_module_dependency_in_the_re_module?= =?utf-8?q?=2E?= Message-ID: <20141110112731.127953.23406@psf.io> https://hg.python.org/cpython/rev/3c3cf26e6f7d changeset: 93460:3c3cf26e6f7d parent: 93458:09ec09cfe539 parent: 93459:03d6661c13a0 user: Serhiy Storchaka date: Mon Nov 10 13:25:14 2014 +0200 summary: Got rid of the array module dependency in the re module. The re module could be used during building before array is built. 
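The one-line replacement works because a memoryview cast to 'I' exposes the same sequence of native unsigned ints that array.array('I', ...) produced, without importing an extension module at build time. A small equivalence check (illustrative only, assumes the usual 4-byte unsigned int):

    import array

    b = bytes(range(8))                      # any block whose length is a
                                             # multiple of the word size
    old = array.array('I', b).tolist()       # previous implementation
    new = memoryview(b).cast('I').tolist()   # new implementation
    assert old == new and len(new) == 2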
files: Lib/sre_compile.py | 3 +-- 1 files changed, 1 insertions(+), 2 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -382,8 +382,7 @@ def _bytes_to_codes(b): # Convert block indices to word array - import array - a = array.array('I', b) + a = memoryview(b).cast('I') assert a.itemsize == _sre.CODESIZE assert len(a) * a.itemsize == len(b) return a.tolist() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 12:27:36 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 11:27:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Got_rid_of_the?= =?utf-8?q?_array_module_dependency_in_the_re_module=2E?= Message-ID: <20141110112731.85200.57061@psf.io> https://hg.python.org/cpython/rev/03d6661c13a0 changeset: 93459:03d6661c13a0 branch: 3.4 parent: 93457:47b3084dd6aa user: Serhiy Storchaka date: Mon Nov 10 13:24:47 2014 +0200 summary: Got rid of the array module dependency in the re module. The re module could be used during building before array is built. files: Lib/sre_compile.py | 3 +-- 1 files changed, 1 insertions(+), 2 deletions(-) diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -410,8 +410,7 @@ def _bytes_to_codes(b): # Convert block indices to word array - import array - a = array.array('I', b) + a = memoryview(b).cast('I') assert a.itemsize == _sre.CODESIZE assert len(a) * a.itemsize == len(b) return a.tolist() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 12:51:31 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 11:51:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322578=3A_Added_at?= =?utf-8?q?tributes_to_the_re=2Eerror_class=2E?= Message-ID: <20141110115106.85194.63069@psf.io> https://hg.python.org/cpython/rev/292c4d853662 changeset: 93461:292c4d853662 user: Serhiy Storchaka date: Mon Nov 10 13:49:00 2014 +0200 summary: Issue #22578: Added attributes to the re.error class. files: Doc/library/re.rst | 27 +++++- Lib/sre_constants.py | 30 ++++++- Lib/sre_parse.py | 141 ++++++++++++++++++------------ Lib/test/test_re.py | 36 +++++++ Misc/NEWS | 2 + 5 files changed, 174 insertions(+), 62 deletions(-) diff --git a/Doc/library/re.rst b/Doc/library/re.rst --- a/Doc/library/re.rst +++ b/Doc/library/re.rst @@ -733,13 +733,36 @@ Clear the regular expression cache. -.. exception:: error +.. exception:: error(msg, pattern=None, pos=None) Exception raised when a string passed to one of the functions here is not a valid regular expression (for example, it might contain unmatched parentheses) or when some other error occurs during compilation or matching. It is never an - error if a string contains no match for a pattern. + error if a string contains no match for a pattern. The error instance has + the following additional attributes: + .. attribute:: msg + + The unformatted error message. + + .. attribute:: pattern + + The regular expression pattern. + + .. attribute:: pos + + The index of *pattern* where compilation failed. + + .. attribute:: lineno + + The line corresponding to *pos*. + + .. attribute:: colno + + The column corresponding to *pos*. + + .. versionchanged:: 3.5 + Added additional attributes. .. _re-objects: diff --git a/Lib/sre_constants.py b/Lib/sre_constants.py --- a/Lib/sre_constants.py +++ b/Lib/sre_constants.py @@ -21,7 +21,35 @@ # should this really be here? 
class error(Exception): - pass + def __init__(self, msg, pattern=None, pos=None): + self.msg = msg + self.pattern = pattern + self.pos = pos + if pattern is not None and pos is not None: + msg = '%s at position %d' % (msg, pos) + if isinstance(pattern, str): + newline = '\n' + else: + newline = b'\n' + self.lineno = pattern.count(newline, 0, pos) + 1 + self.colno = pos - pattern.rfind(newline, 0, pos) + if newline in pattern: + msg = '%s (line %d, column %d)' % (msg, self.lineno, self.colno) + else: + self.lineno = self.colno = None + super().__init__(msg) + +def linecol(doc, pos): + if isinstance(pattern, str): + newline = '\n' + else: + newline = b'\n' + lineno = pattern.count(newline, 0, pos) + 1 + if lineno == 1: + colno = pos + 1 + else: + colno = pos - doc.rindex(newline, 0, pos) + return lineno, colno class _NamedIntConstant(int): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -81,8 +81,8 @@ if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: - raise error("redefinition of group name %s as group %d; " - "was group %d" % (repr(name), gid, ogid)) + raise error("redefinition of group name %r as group %d; " + "was group %d" % (name, gid, ogid)) self.groupdict[name] = gid return gid def closegroup(self, gid, p): @@ -206,24 +206,25 @@ class Tokenizer: def __init__(self, string): self.istext = isinstance(string, str) + self.string = string if not self.istext: string = str(string, 'latin1') - self.string = string + self.decoded_string = string self.index = 0 self.__next() def __next(self): index = self.index try: - char = self.string[index] + char = self.decoded_string[index] except IndexError: self.next = None return if char == "\\": index += 1 try: - char += self.string[index] + char += self.decoded_string[index] except IndexError: - raise error("bogus escape (end of line)") + raise self.error("bogus escape (end of line)") from None self.index = index + 1 self.next = char def match(self, char): @@ -250,15 +251,19 @@ c = self.next self.__next() if c is None: - raise error("unterminated name") + raise self.error("unterminated name") if c == terminator: break result += c return result def tell(self): - return self.index, self.next + return self.index - len(self.next or '') def seek(self, index): - self.index, self.next = index + self.index = index + self.__next() + + def error(self, msg, offset=0): + return error(msg, self.string, self.tell() - offset) # The following three functions are not used in this module anymore, but we keep # them here (with DeprecationWarnings) for backwards compatibility. 
@@ -322,8 +327,8 @@ escape += source.getwhile(2, OCTDIGITS) c = int(escape[1:], 8) if c > 0o377: - raise error('octal escape value %r outside of ' - 'range 0-0o377' % escape) + raise source.error('octal escape value %r outside of ' + 'range 0-0o377' % escape, len(escape)) return LITERAL, c elif c in DIGITS: raise ValueError @@ -331,7 +336,7 @@ return LITERAL, ord(escape[1]) except ValueError: pass - raise error("bogus escape: %s" % repr(escape)) + raise source.error("bogus escape: %r" % escape, len(escape)) def _escape(source, escape, state): # handle escape code in expression @@ -377,21 +382,23 @@ escape += source.get() c = int(escape[1:], 8) if c > 0o377: - raise error('octal escape value %r outside of ' - 'range 0-0o377' % escape) + raise source.error('octal escape value %r outside of ' + 'range 0-0o377' % escape, + len(escape)) return LITERAL, c # not an octal escape, so this is a group reference group = int(escape[1:]) if group < state.groups: if not state.checkgroup(group): - raise error("cannot refer to open group") + raise source.error("cannot refer to open group", + len(escape)) return GROUPREF, group raise ValueError if len(escape) == 2: return LITERAL, ord(escape[1]) except ValueError: pass - raise error("bogus escape: %s" % repr(escape)) + raise source.error("bogus escape: %r" % escape, len(escape)) def _parse_sub(source, state, nested=True): # parse an alternation: a|b|c @@ -404,7 +411,7 @@ if not sourcematch("|"): break if nested and source.next is not None and source.next != ")": - raise error("pattern not properly closed") + raise source.error("pattern not properly closed") if len(items) == 1: return items[0] @@ -449,11 +456,11 @@ if source.match("|"): item_no = _parse(source, state) if source.next == "|": - raise error("conditional backref with more than two branches") + raise source.error("conditional backref with more than two branches") else: item_no = None if source.next is not None and source.next != ")": - raise error("pattern not properly closed") + raise source.error("pattern not properly closed") subpattern = SubPattern(state) subpattern.append((GROUPREF_EXISTS, (condgroup, item_yes, item_no))) return subpattern @@ -510,7 +517,7 @@ while True: this = sourceget() if this is None: - raise error("unexpected end of regular expression") + raise source.error("unexpected end of regular expression") if this == "]" and set != start: break elif this[0] == "\\": @@ -521,7 +528,7 @@ # potential range this = sourceget() if this is None: - raise error("unexpected end of regular expression") + raise source.error("unexpected end of regular expression") if this == "]": if code1[0] is IN: code1 = code1[1][0] @@ -533,11 +540,11 @@ else: code2 = LITERAL, _ord(this) if code1[0] != LITERAL or code2[0] != LITERAL: - raise error("bad character range") + raise source.error("bad character range", len(this)) lo = code1[1] hi = code2[1] if hi < lo: - raise error("bad character range") + raise source.error("bad character range", len(this)) setappend((RANGE, (lo, hi))) else: if code1[0] is IN: @@ -555,6 +562,7 @@ elif this in REPEAT_CHARS: # repeat previous item + here = source.tell() if this == "?": min, max = 0, 1 elif this == "*": @@ -566,7 +574,6 @@ if source.next == "}": subpatternappend((LITERAL, _ord(this))) continue - here = source.tell() min, max = 0, MAXREPEAT lo = hi = "" while source.next in DIGITS: @@ -589,18 +596,21 @@ if max >= MAXREPEAT: raise OverflowError("the repetition number is too large") if max < min: - raise error("bad repeat interval") + raise source.error("bad repeat 
interval", + source.tell() - here) else: - raise error("not supported") + raise source.error("not supported", len(this)) # figure out which item to repeat if subpattern: item = subpattern[-1:] else: item = None if not item or (_len(item) == 1 and item[0][0] == AT): - raise error("nothing to repeat") + raise source.error("nothing to repeat", + source.tell() - here + len(this)) if item[0][0] in _REPEATCODES: - raise error("multiple repeat") + raise source.error("multiple repeat", + source.tell() - here + len(this)) if sourcematch("?"): subpattern[-1] = (MIN_REPEAT, (min, max, item)) else: @@ -618,7 +628,7 @@ # options char = sourceget() if char is None: - raise error("unexpected end of pattern") + raise self.error("unexpected end of pattern") if char == "P": # python extensions if sourcematch("<"): @@ -626,28 +636,32 @@ name = source.getuntil(">") group = 1 if not name: - raise error("missing group name") + raise source.error("missing group name", 1) if not name.isidentifier(): - raise error("bad character in group name %r" % name) + raise source.error("bad character in group name " + "%r" % name, + len(name) + 1) elif sourcematch("="): # named backreference name = source.getuntil(")") if not name: - raise error("missing group name") + raise source.error("missing group name", 1) if not name.isidentifier(): - raise error("bad character in backref group name " - "%r" % name) + raise source.error("bad character in backref " + "group name %r" % name, + len(name) + 1) gid = state.groupdict.get(name) if gid is None: msg = "unknown group name: {0!r}".format(name) - raise error(msg) + raise source.error(msg, len(name) + 1) subpatternappend((GROUPREF, gid)) continue else: char = sourceget() if char is None: - raise error("unexpected end of pattern") - raise error("unknown specifier: ?P%s" % char) + raise source.error("unexpected end of pattern") + raise source.error("unknown specifier: ?P%s" % char, + len(char)) elif char == ":": # non-capturing group group = 2 @@ -655,7 +669,7 @@ # comment while True: if source.next is None: - raise error("unbalanced parenthesis") + raise source.error("unbalanced parenthesis") if sourceget() == ")": break continue @@ -665,11 +679,11 @@ if char == "<": char = sourceget() if char is None or char not in "=!": - raise error("syntax error") + raise source.error("syntax error") dir = -1 # lookbehind p = _parse_sub(source, state) if not sourcematch(")"): - raise error("unbalanced parenthesis") + raise source.error("unbalanced parenthesis") if char == "=": subpatternappend((ASSERT, (dir, p))) else: @@ -680,23 +694,26 @@ condname = source.getuntil(")") group = 2 if not condname: - raise error("missing group name") + raise source.error("missing group name", 1) if condname.isidentifier(): condgroup = state.groupdict.get(condname) if condgroup is None: msg = "unknown group name: {0!r}".format(condname) - raise error(msg) + raise source.error(msg, len(condname) + 1) else: try: condgroup = int(condname) if condgroup < 0: raise ValueError except ValueError: - raise error("bad character in group name") + raise source.error("bad character in group name", + len(condname) + 1) if not condgroup: - raise error("bad group number") + raise source.error("bad group number", + len(condname) + 1) if condgroup >= MAXGROUPS: - raise error("the group number is too large") + raise source.error("the group number is too large", + len(condname) + 1) elif char in FLAGS: # flags state.flags |= FLAGS[char] @@ -704,20 +721,23 @@ state.flags |= FLAGS[sourceget()] verbose = state.flags & SRE_FLAG_VERBOSE 
else: - raise error("unexpected end of pattern " + char) + raise source.error("unexpected end of pattern") if group: # parse group contents if group == 2: # anonymous group group = None else: - group = state.opengroup(name) + try: + group = state.opengroup(name) + except error as err: + raise source.error(err.msg, len(name) + 1) if condgroup: p = _parse_sub_cond(source, state, condgroup) else: p = _parse_sub(source, state) if not sourcematch(")"): - raise error("unbalanced parenthesis") + raise source.error("unbalanced parenthesis") if group is not None: state.closegroup(group, p) subpatternappend((SUBPATTERN, (group, p))) @@ -725,10 +745,10 @@ while True: char = sourceget() if char is None: - raise error("unexpected end of pattern") + raise source.error("unexpected end of pattern") if char == ")": break - raise error("unknown extension") + raise source.error("unknown extension", len(char)) elif this == "^": subpatternappend((AT, AT_BEGINNING)) @@ -737,7 +757,7 @@ subpattern.append((AT, AT_END)) else: - raise error("parser error") + raise source.error("parser error", len(this)) return subpattern @@ -768,9 +788,10 @@ if source.next is not None: if source.next == ")": - raise error("unbalanced parenthesis") + raise source.error("unbalanced parenthesis") else: - raise error("bogus characters at end of regular expression") + raise source.error("bogus characters at end of regular expression", + len(tail)) if flags & SRE_FLAG_DEBUG: p.dump() @@ -809,16 +830,18 @@ if s.match("<"): name = s.getuntil(">") if not name: - raise error("missing group name") + raise s.error("missing group name", 1) try: index = int(name) if index < 0: - raise error("negative group number") + raise s.error("negative group number", len(name) + 1) if index >= MAXGROUPS: - raise error("the group number is too large") + raise s.error("the group number is too large", + len(name) + 1) except ValueError: if not name.isidentifier(): - raise error("bad character in group name") + raise s.error("bad character in group name", + len(name) + 1) try: index = pattern.groupindex[name] except KeyError: @@ -841,8 +864,8 @@ isoctal = True c = int(this[1:], 8) if c > 0o377: - raise error('octal escape value %r outside of ' - 'range 0-0o377' % this) + raise s.error('octal escape value %r outside of ' + 'range 0-0o377' % this, len(this)) lappend(chr(c)) if not isoctal: addgroup(int(this[1:])) diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -1419,6 +1419,42 @@ self.assertIsNone(re.match(b'(?Li)\xc5', b'\xe5')) self.assertIsNone(re.match(b'(?Li)\xe5', b'\xc5')) + def test_error(self): + with self.assertRaises(re.error) as cm: + re.compile('(\u20ac))') + err = cm.exception + self.assertIsInstance(err.pattern, str) + self.assertEqual(err.pattern, '(\u20ac))') + self.assertEqual(err.pos, 3) + self.assertEqual(err.lineno, 1) + self.assertEqual(err.colno, 4) + self.assertIn(err.msg, str(err)) + self.assertIn(' at position 3', str(err)) + self.assertNotIn(' at position 3', err.msg) + # Bytes pattern + with self.assertRaises(re.error) as cm: + re.compile(b'(\xa4))') + err = cm.exception + self.assertIsInstance(err.pattern, bytes) + self.assertEqual(err.pattern, b'(\xa4))') + self.assertEqual(err.pos, 3) + # Multiline pattern + with self.assertRaises(re.error) as cm: + re.compile(""" + ( + abc + ) + ) + ( + """, re.VERBOSE) + err = cm.exception + self.assertEqual(err.pos, 77) + self.assertEqual(err.lineno, 5) + self.assertEqual(err.colno, 17) + self.assertIn(err.msg, str(err)) + 
self.assertIn(' at position 77', str(err)) + self.assertIn('(line 5, column 17)', str(err)) + class PatternReprTests(unittest.TestCase): def check(self, pattern, expected): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,8 @@ Library ------- +- Issue #22578: Added attributes to the re.error class. + - Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 13:36:00 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 12:36:00 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Fixed_IDLE_tests_after_cha?= =?utf-8?q?nging_re_error_messages_=28issue_=2322578=29=2E?= Message-ID: <20141110123544.85216.39224@psf.io> https://hg.python.org/cpython/rev/07f082b200a7 changeset: 93462:07f082b200a7 user: Serhiy Storchaka date: Mon Nov 10 14:18:03 2014 +0200 summary: Fixed IDLE tests after changing re error messages (issue #22578). files: Lib/idlelib/idle_test/test_searchengine.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/idlelib/idle_test/test_searchengine.py b/Lib/idlelib/idle_test/test_searchengine.py --- a/Lib/idlelib/idle_test/test_searchengine.py +++ b/Lib/idlelib/idle_test/test_searchengine.py @@ -178,7 +178,7 @@ engine.revar.set(1) Equal(engine.getprog(), None) self.assertEqual(Mbox.showerror.message, - 'Error: nothing to repeat\nPattern: +') + 'Error: nothing to repeat at position 0\nPattern: +') def test_report_error(self): showerror = Mbox.showerror -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 13:40:35 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 10 Nov 2014 12:40:35 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Fixed_AttributeError_when_?= =?utf-8?q?the_regular_expression_starts_from_illegal_escape=2E?= Message-ID: <20141110124022.108371.29124@psf.io> https://hg.python.org/cpython/rev/7972304b9f92 changeset: 93463:7972304b9f92 user: Serhiy Storchaka date: Mon Nov 10 14:38:16 2014 +0200 summary: Fixed AttributeError when the regular expression starts from illegal escape. files: Lib/sre_parse.py | 1 + Lib/test/test_re.py | 14 ++++++++++++++ 2 files changed, 15 insertions(+), 0 deletions(-) diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -211,6 +211,7 @@ string = str(string, 'latin1') self.decoded_string = string self.index = 0 + self.next = None self.__next() def __next(self): index = self.index diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -531,6 +531,20 @@ self.assertEqual(re.search(br"\d\D\w\W\s\S", b"1aa! a", re.LOCALE).group(0), b"1aa! 
a") + def test_other_escapes(self): + self.assertRaises(re.error, re.compile, "\\") + self.assertEqual(re.match(r"\(", '(').group(), '(') + self.assertIsNone(re.match(r"\(", ')')) + self.assertEqual(re.match(r"\\", '\\').group(), '\\') + self.assertEqual(re.match(r"\y", 'y').group(), 'y') + self.assertIsNone(re.match(r"\y", 'z')) + self.assertEqual(re.match(r"[\]]", ']').group(), ']') + self.assertIsNone(re.match(r"[\]]", '[')) + self.assertEqual(re.match(r"[a\-c]", '-').group(), '-') + self.assertIsNone(re.match(r"[a\-c]", 'b')) + self.assertEqual(re.match(r"[\^a]+", 'a^').group(), 'a^') + self.assertIsNone(re.match(r"[\^a]+", 'b')) + def test_string_boundaries(self): # See http://bugs.python.org/issue10713 self.assertEqual(re.search(r"\b(abc)\b", "abc").group(1), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 16:45:22 2014 From: python-checkins at python.org (georg.brandl) Date: Mon, 10 Nov 2014 15:45:22 +0000 Subject: [Python-checkins] =?utf-8?q?devguide=3A_update_my_entries_in_expe?= =?utf-8?q?rts_list?= Message-ID: <20141110154516.85210.35714@psf.io> https://hg.python.org/devguide/rev/ee636682d869 changeset: 724:ee636682d869 user: Georg Brandl date: Mon Nov 10 16:45:12 2014 +0100 summary: update my entries in experts list files: experts.rst | 10 +++++----- 1 files changed, 5 insertions(+), 5 deletions(-) diff --git a/experts.rst b/experts.rst --- a/experts.rst +++ b/experts.rst @@ -54,7 +54,7 @@ aifc r.david.murray argparse bethard array -ast benjamin.peterson +ast benjamin.peterson, georg.brandl asynchat josiahcarlson, giampaolo.rodola*, stutzbach asyncio gvanrossum, haypo, pitrou, yselivanov, giampaolo.rodola asyncore josiahcarlson, giampaolo.rodola*, stutzbach @@ -165,7 +165,7 @@ ossaudiodev parser benjamin.peterson pathlib pitrou* -pdb georg.brandl* +pdb georg.brandl pickle alexandre.vassalotti, pitrou pickletools alexandre.vassalotti pipes @@ -210,7 +210,7 @@ ssl janssen, pitrou, giampaolo.rodola, christian.heimes, dstufft, alex stat christian.heimes statistics steven.daprano -string georg.brandl* +string georg.brandl stringprep struct mark.dickinson, meador.inge subprocess astrand (inactive) @@ -229,7 +229,7 @@ textwrap georg.brandl threading pitrou time belopolsky -timeit georg.brandl +timeit tkinter gpolo, serhiy.storchaka token georg.brandl tokenize meador.inge @@ -249,7 +249,7 @@ warnings wave weakref fdrake, pitrou -webbrowser georg.brandl +webbrowser winreg stutzbach winsound effbot (inactive) wsgiref pje -- Repository URL: https://hg.python.org/devguide From python-checkins at python.org Mon Nov 10 22:15:45 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 10 Nov 2014 21:15:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODM5?= =?utf-8?q?=3A_Fix_Snapshot=2Estatistics=28=29_link=2E?= Message-ID: <20141110211538.71575.8153@psf.io> https://hg.python.org/cpython/rev/387bbada31e8 changeset: 93464:387bbada31e8 branch: 3.4 parent: 93459:03d6661c13a0 user: Berker Peksag date: Mon Nov 10 23:15:32 2014 +0200 summary: Issue #22839: Fix Snapshot.statistics() link. files: Doc/library/tracemalloc.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/tracemalloc.rst b/Doc/library/tracemalloc.rst --- a/Doc/library/tracemalloc.rst +++ b/Doc/library/tracemalloc.rst @@ -435,7 +435,7 @@ Compute the differences with an old snapshot. Get statistics as a sorted list of :class:`StatisticDiff` instances grouped by *group_by*. 
- See the :meth:`statistics` method for *group_by* and *cumulative* + See the :meth:`Snapshot.statistics` method for *group_by* and *cumulative* parameters. The result is sorted from the biggest to the smallest by: absolute value -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 10 22:15:45 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 10 Nov 2014 21:15:45 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322839=3A_Fix_Snapshot=2Estatistics=28=29_link?= =?utf-8?q?=2E?= Message-ID: <20141110211538.17280.93046@psf.io> https://hg.python.org/cpython/rev/524a004e93dd changeset: 93465:524a004e93dd parent: 93463:7972304b9f92 parent: 93464:387bbada31e8 user: Berker Peksag date: Mon Nov 10 23:15:56 2014 +0200 summary: Issue #22839: Fix Snapshot.statistics() link. files: Doc/library/tracemalloc.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/tracemalloc.rst b/Doc/library/tracemalloc.rst --- a/Doc/library/tracemalloc.rst +++ b/Doc/library/tracemalloc.rst @@ -435,7 +435,7 @@ Compute the differences with an old snapshot. Get statistics as a sorted list of :class:`StatisticDiff` instances grouped by *group_by*. - See the :meth:`statistics` method for *group_by* and *cumulative* + See the :meth:`Snapshot.statistics` method for *group_by* and *cumulative* parameters. The result is sorted from the biggest to the smallest by: absolute value -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 08:48:03 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 07:48:03 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_default_-=3E_default?= =?utf-8?q?=29=3A_Merge_heads?= Message-ID: <20141111074756.21125.54968@psf.io> https://hg.python.org/cpython/rev/81d1481bc094 changeset: 93467:81d1481bc094 parent: 93466:2b27ffe611f3 parent: 93465:524a004e93dd user: Serhiy Storchaka date: Tue Nov 11 09:45:55 2014 +0200 summary: Merge heads files: Doc/library/tracemalloc.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/tracemalloc.rst b/Doc/library/tracemalloc.rst --- a/Doc/library/tracemalloc.rst +++ b/Doc/library/tracemalloc.rst @@ -435,7 +435,7 @@ Compute the differences with an old snapshot. Get statistics as a sorted list of :class:`StatisticDiff` instances grouped by *group_by*. - See the :meth:`statistics` method for *group_by* and *cumulative* + See the :meth:`Snapshot.statistics` method for *group_by* and *cumulative* parameters. The result is sorted from the biggest to the smallest by: absolute value -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 08:48:03 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 07:48:03 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Fixed_error_position_for_t?= =?utf-8?q?he_backslash_at_the_end_of_regex_pattern=2E?= Message-ID: <20141111074756.80126.2430@psf.io> https://hg.python.org/cpython/rev/2b27ffe611f3 changeset: 93466:2b27ffe611f3 parent: 93463:7972304b9f92 user: Serhiy Storchaka date: Mon Nov 10 18:28:53 2014 +0200 summary: Fixed error position for the backslash at the end of regex pattern. 
files: Lib/sre_parse.py | 3 ++- 1 files changed, 2 insertions(+), 1 deletions(-) diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -225,7 +225,8 @@ try: char += self.decoded_string[index] except IndexError: - raise self.error("bogus escape (end of line)") from None + raise error("bogus escape (end of line)", + self.string, len(self.string) - 1) from None self.index = index + 1 self.next = char def match(self, char): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 09:06:13 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 08:06:13 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyODQ1?= =?utf-8?q?=3A_Improved_formatting_of_dis_documentation=2E?= Message-ID: <20141111080603.19409.84200@psf.io> https://hg.python.org/cpython/rev/0a32764004ab changeset: 93470:0a32764004ab branch: 2.7 parent: 93456:4caa695af94c user: Serhiy Storchaka date: Tue Nov 11 10:02:57 2014 +0200 summary: Issue #22845: Improved formatting of dis documentation. files: Doc/library/dis.rst | 10 +++++----- 1 files changed, 5 insertions(+), 5 deletions(-) diff --git a/Doc/library/dis.rst b/Doc/library/dis.rst --- a/Doc/library/dis.rst +++ b/Doc/library/dis.rst @@ -446,7 +446,7 @@ Implements the expression statement for the interactive mode. TOS is removed from the stack and printed. In non-interactive mode, an expression statement is - terminated with ``POP_STACK``. + terminated with :opcode:`POP_TOP`. .. opcode:: PRINT_ITEM () @@ -481,7 +481,7 @@ .. opcode:: CONTINUE_LOOP (target) Continues a loop due to a :keyword:`continue` statement. *target* is the - address to jump to (which should be a ``FOR_ITER`` instruction). + address to jump to (which should be a :opcode:`FOR_ITER` instruction). .. opcode:: LIST_APPEND (i) @@ -838,21 +838,21 @@ .. opcode:: CALL_FUNCTION_VAR (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the variable argument list, followed by keyword and positional arguments. .. opcode:: CALL_FUNCTION_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by explicit keyword and positional arguments. .. opcode:: CALL_FUNCTION_VAR_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by the variable-arguments tuple, followed by explicit keyword and positional arguments. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 09:06:13 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 08:06:13 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODQ1?= =?utf-8?q?=3A_Improved_formatting_of_dis_documentation=2E?= Message-ID: <20141111080602.118395.97109@psf.io> https://hg.python.org/cpython/rev/d676f2725699 changeset: 93468:d676f2725699 branch: 3.4 parent: 93464:387bbada31e8 user: Serhiy Storchaka date: Tue Nov 11 10:02:11 2014 +0200 summary: Issue #22845: Improved formatting of dis documentation. 
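As background for the documentation reformatting in the diff below, here is a minimal usage sketch (not part of the commit). It exercises dis.dis() both with its default output and with the *file* keyword whose addition in 3.4 the versionchanged notes record; the sample function is purely illustrative.

    import dis
    import io

    def add(a, b):
        return a + b

    dis.dis(add)                   # disassembly is written to sys.stdout

    buf = io.StringIO()
    dis.dis(add, file=buf)         # 3.4+: redirect the disassembly elsewhere
    print(buf.getvalue().splitlines()[0])
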
files: Doc/library/dis.rst | 47 ++++++++++++++++---------------- 1 files changed, 24 insertions(+), 23 deletions(-) diff --git a/Doc/library/dis.rst b/Doc/library/dis.rst --- a/Doc/library/dis.rst +++ b/Doc/library/dis.rst @@ -133,7 +133,7 @@ .. versionadded:: 3.2 .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: dis(x=None, *, file=None) @@ -147,11 +147,11 @@ disassembled. If no object is provided, this function disassembles the last traceback. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: distb(tb=None, *, file=None) @@ -160,11 +160,11 @@ traceback if none was passed. The instruction causing the exception is indicated. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: disassemble(code, lasti=-1, *, file=None) @@ -184,11 +184,11 @@ The parameter interpretation recognizes local and global variable names, constant values, branch targets, and compare operators. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: get_instructions(x, *, first_line=None) @@ -502,7 +502,7 @@ Implements the expression statement for the interactive mode. TOS is removed from the stack and printed. In non-interactive mode, an expression statement is - terminated with ``POP_STACK``. + terminated with :opcode:`POP_TOP`. .. opcode:: BREAK_LOOP @@ -513,7 +513,7 @@ .. opcode:: CONTINUE_LOOP (target) Continues a loop due to a :keyword:`continue` statement. *target* is the - address to jump to (which should be a ``FOR_ITER`` instruction). + address to jump to (which should be a :opcode:`FOR_ITER` instruction). .. opcode:: SET_ADD (i) @@ -531,7 +531,8 @@ Calls ``dict.setitem(TOS1[-i], TOS, TOS1)``. Used to implement dict comprehensions. -For all of the SET_ADD, LIST_APPEND and MAP_ADD instructions, while the +For all of the :opcode:`SET_ADD`, :opcode:`LIST_APPEND` and :opcode:`MAP_ADD` +instructions, while the added value or key/value pair is popped off, the container object remains on the stack so that it is available for further iterations of the loop. @@ -584,7 +585,7 @@ .. opcode:: LOAD_BUILD_CLASS Pushes :func:`builtins.__build_class__` onto the stack. It is later called - by ``CALL_FUNCTION`` to construct a class. + by :opcode:`CALL_FUNCTION` to construct a class. .. opcode:: SETUP_WITH (delta) @@ -615,7 +616,7 @@ If the stack represents an exception, *and* the function call returns a 'true' value, this information is "zapped" and replaced with a single - ``WHY_SILENCED`` to prevent ``END_FINALLY`` from re-raising the exception. + ``WHY_SILENCED`` to prevent :opcode:`END_FINALLY` from re-raising the exception. (But non-local gotos will still be resumed.) .. XXX explain the WHY stuff! @@ -627,8 +628,8 @@ .. opcode:: STORE_NAME (namei) Implements ``name = TOS``. *namei* is the index of *name* in the attribute - :attr:`co_names` of the code object. 
The compiler tries to use ``STORE_FAST`` - or ``STORE_GLOBAL`` if possible. + :attr:`co_names` of the code object. The compiler tries to use :opcode:`STORE_FAST` + or :opcode:`STORE_GLOBAL` if possible. .. opcode:: DELETE_NAME (namei) @@ -668,12 +669,12 @@ .. opcode:: STORE_GLOBAL (namei) - Works as ``STORE_NAME``, but stores the name as a global. + Works as :opcode:`STORE_NAME`, but stores the name as a global. .. opcode:: DELETE_GLOBAL (namei) - Works as ``DELETE_NAME``, but deletes a global name. + Works as :opcode:`DELETE_NAME`, but deletes a global name. .. opcode:: LOAD_CONST (consti) @@ -694,12 +695,12 @@ .. opcode:: BUILD_LIST (count) - Works as ``BUILD_TUPLE``, but creates a list. + Works as :opcode:`BUILD_TUPLE`, but creates a list. .. opcode:: BUILD_SET (count) - Works as ``BUILD_TUPLE``, but creates a set. + Works as :opcode:`BUILD_TUPLE`, but creates a set. .. opcode:: BUILD_MAP (count) @@ -724,7 +725,7 @@ Imports the module ``co_names[namei]``. TOS and TOS1 are popped and provide the *fromlist* and *level* arguments of :func:`__import__`. The module object is pushed onto the stack. The current namespace is not affected: - for a proper import statement, a subsequent ``STORE_FAST`` instruction + for a proper import statement, a subsequent :opcode:`STORE_FAST` instruction modifies the namespace. @@ -732,7 +733,7 @@ Loads the attribute ``co_names[namei]`` from the module found in TOS. The resulting object is pushed onto the stack, to be subsequently stored by a - ``STORE_FAST`` instruction. + :opcode:`STORE_FAST` instruction. .. opcode:: JUMP_FORWARD (delta) @@ -911,21 +912,21 @@ .. opcode:: CALL_FUNCTION_VAR (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the variable argument list, followed by keyword and positional arguments. .. opcode:: CALL_FUNCTION_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by explicit keyword and positional arguments. .. opcode:: CALL_FUNCTION_VAR_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by the variable-arguments tuple, followed by explicit keyword and positional arguments. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 09:06:13 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 08:06:13 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322845=3A_Improved_formatting_of_dis_documentati?= =?utf-8?b?b24u?= Message-ID: <20141111080603.19397.29997@psf.io> https://hg.python.org/cpython/rev/ac0334665459 changeset: 93469:ac0334665459 parent: 93467:81d1481bc094 parent: 93468:d676f2725699 user: Serhiy Storchaka date: Tue Nov 11 10:02:46 2014 +0200 summary: Issue #22845: Improved formatting of dis documentation. files: Doc/library/dis.rst | 47 ++++++++++++++++---------------- 1 files changed, 24 insertions(+), 23 deletions(-) diff --git a/Doc/library/dis.rst b/Doc/library/dis.rst --- a/Doc/library/dis.rst +++ b/Doc/library/dis.rst @@ -133,7 +133,7 @@ .. versionadded:: 3.2 .. 
versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: dis(x=None, *, file=None) @@ -147,11 +147,11 @@ disassembled. If no object is provided, this function disassembles the last traceback. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: distb(tb=None, *, file=None) @@ -160,11 +160,11 @@ traceback if none was passed. The instruction causing the exception is indicated. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: disassemble(code, lasti=-1, *, file=None) @@ -184,11 +184,11 @@ The parameter interpretation recognizes local and global variable names, constant values, branch targets, and compare operators. - The disassembly is written as text to the supplied ``file`` argument if + The disassembly is written as text to the supplied *file* argument if provided and to ``sys.stdout`` otherwise. .. versionchanged:: 3.4 - Added ``file`` parameter + Added *file* parameter. .. function:: get_instructions(x, *, first_line=None) @@ -512,7 +512,7 @@ Implements the expression statement for the interactive mode. TOS is removed from the stack and printed. In non-interactive mode, an expression statement is - terminated with ``POP_STACK``. + terminated with :opcode:`POP_TOP`. .. opcode:: BREAK_LOOP @@ -523,7 +523,7 @@ .. opcode:: CONTINUE_LOOP (target) Continues a loop due to a :keyword:`continue` statement. *target* is the - address to jump to (which should be a ``FOR_ITER`` instruction). + address to jump to (which should be a :opcode:`FOR_ITER` instruction). .. opcode:: SET_ADD (i) @@ -541,7 +541,8 @@ Calls ``dict.setitem(TOS1[-i], TOS, TOS1)``. Used to implement dict comprehensions. -For all of the SET_ADD, LIST_APPEND and MAP_ADD instructions, while the +For all of the :opcode:`SET_ADD`, :opcode:`LIST_APPEND` and :opcode:`MAP_ADD` +instructions, while the added value or key/value pair is popped off, the container object remains on the stack so that it is available for further iterations of the loop. @@ -594,7 +595,7 @@ .. opcode:: LOAD_BUILD_CLASS Pushes :func:`builtins.__build_class__` onto the stack. It is later called - by ``CALL_FUNCTION`` to construct a class. + by :opcode:`CALL_FUNCTION` to construct a class. .. opcode:: SETUP_WITH (delta) @@ -625,7 +626,7 @@ If the stack represents an exception, *and* the function call returns a 'true' value, this information is "zapped" and replaced with a single - ``WHY_SILENCED`` to prevent ``END_FINALLY`` from re-raising the exception. + ``WHY_SILENCED`` to prevent :opcode:`END_FINALLY` from re-raising the exception. (But non-local gotos will still be resumed.) .. XXX explain the WHY stuff! @@ -637,8 +638,8 @@ .. opcode:: STORE_NAME (namei) Implements ``name = TOS``. *namei* is the index of *name* in the attribute - :attr:`co_names` of the code object. The compiler tries to use ``STORE_FAST`` - or ``STORE_GLOBAL`` if possible. + :attr:`co_names` of the code object. The compiler tries to use :opcode:`STORE_FAST` + or :opcode:`STORE_GLOBAL` if possible. .. opcode:: DELETE_NAME (namei) @@ -678,12 +679,12 @@ .. 
opcode:: STORE_GLOBAL (namei) - Works as ``STORE_NAME``, but stores the name as a global. + Works as :opcode:`STORE_NAME`, but stores the name as a global. .. opcode:: DELETE_GLOBAL (namei) - Works as ``DELETE_NAME``, but deletes a global name. + Works as :opcode:`DELETE_NAME`, but deletes a global name. .. opcode:: LOAD_CONST (consti) @@ -704,12 +705,12 @@ .. opcode:: BUILD_LIST (count) - Works as ``BUILD_TUPLE``, but creates a list. + Works as :opcode:`BUILD_TUPLE`, but creates a list. .. opcode:: BUILD_SET (count) - Works as ``BUILD_TUPLE``, but creates a set. + Works as :opcode:`BUILD_TUPLE`, but creates a set. .. opcode:: BUILD_MAP (count) @@ -734,7 +735,7 @@ Imports the module ``co_names[namei]``. TOS and TOS1 are popped and provide the *fromlist* and *level* arguments of :func:`__import__`. The module object is pushed onto the stack. The current namespace is not affected: - for a proper import statement, a subsequent ``STORE_FAST`` instruction + for a proper import statement, a subsequent :opcode:`STORE_FAST` instruction modifies the namespace. @@ -742,7 +743,7 @@ Loads the attribute ``co_names[namei]`` from the module found in TOS. The resulting object is pushed onto the stack, to be subsequently stored by a - ``STORE_FAST`` instruction. + :opcode:`STORE_FAST` instruction. .. opcode:: JUMP_FORWARD (delta) @@ -921,21 +922,21 @@ .. opcode:: CALL_FUNCTION_VAR (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the variable argument list, followed by keyword and positional arguments. .. opcode:: CALL_FUNCTION_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top element + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by explicit keyword and positional arguments. .. opcode:: CALL_FUNCTION_VAR_KW (argc) - Calls a function. *argc* is interpreted as in ``CALL_FUNCTION``. The top + Calls a function. *argc* is interpreted as in :opcode:`CALL_FUNCTION`. The top element on the stack contains the keyword arguments dictionary, followed by the variable-arguments tuple, followed by explicit keyword and positional arguments. -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Tue Nov 11 09:08:55 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Tue, 11 Nov 2014 09:08:55 +0100 Subject: [Python-checkins] Daily reference leaks (524a004e93dd): sum=3 Message-ID: results for 524a004e93dd on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogVqLPfR', '-x'] From python-checkins at python.org Tue Nov 11 16:24:40 2014 From: python-checkins at python.org (donald.stufft) Date: Tue, 11 Nov 2014 15:24:40 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Implement_PEP_?= =?utf-8?q?477_-_Backport_ensurepip_=28PEP_453=29_to_2=2E7?= Message-ID: <20141111152417.80124.60518@psf.io> https://hg.python.org/cpython/rev/592a5414fabd changeset: 93471:592a5414fabd branch: 2.7 user: Donald Stufft date: Tue Nov 11 10:24:11 2014 -0500 summary: Implement PEP 477 - Backport ensurepip (PEP 453) to 2.7 * Backports ensurepip to the 2.7 branch * Backports some of the improved documentation to the 2.7 branch. 
* Adds a private backport of the 3.x mock library as test._mock_backport to enable saner testing of ensurepip. Key Differences from 3.x: * Ensurepip does not have any Makefile integration, specifically it is not ran by default in the Makefile. * There is no venv module in 2.7, so downstream distributors can completely disable ensurepip, ideally with a message redirecting to the correct way to install pip. * To match the ``python`` command in 2.7, ensurepip will install the unversioned ``pip`` command as well. * No-op and hide --default-pip and add --no-default-pip to restore the 3.x behavor on 2.7. files: .hgeol | 1 + Doc/library/distribution.rst | 13 + Doc/library/ensurepip.rst | 130 + Doc/library/index.rst | 1 + Doc/library/python.rst | 1 - Doc/whatsnew/2.7.rst | 59 + Lib/ensurepip/__init__.py | 227 + Lib/ensurepip/__main__.py | 4 + Lib/ensurepip/_bundled/pip-1.5.6-py2.py3-none-any.whl | Bin Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl | Bin Lib/ensurepip/_uninstall.py | 30 + Lib/test/_mock_backport.py | 2352 ++++++++++ Lib/test/test_ensurepip.py | 352 + Makefile.pre.in | 1 + Tools/scripts/checkpip.py | 31 + 15 files changed, 3201 insertions(+), 1 deletions(-) diff --git a/.hgeol b/.hgeol --- a/.hgeol +++ b/.hgeol @@ -26,6 +26,7 @@ **.psd = BIN **.tar = BIN **.wav = BIN +**.whl = BIN **.xar = BIN **.zip = BIN diff --git a/Doc/library/distribution.rst b/Doc/library/distribution.rst new file mode 100644 --- /dev/null +++ b/Doc/library/distribution.rst @@ -0,0 +1,13 @@ +*********************************** +Software Packaging and Distribution +*********************************** + +These libraries help you with publishing and installing Python software. +While these modules are designed to work in conjunction with the +`Python Package Index `__, they can also be used +with a local index server, or without any index server at all. + +.. toctree:: + + distutils.rst + ensurepip.rst diff --git a/Doc/library/ensurepip.rst b/Doc/library/ensurepip.rst new file mode 100644 --- /dev/null +++ b/Doc/library/ensurepip.rst @@ -0,0 +1,130 @@ +:mod:`ensurepip` --- Bootstrapping the ``pip`` installer +======================================================== + +.. module:: ensurepip + :synopsis: Bootstrapping the ``pip`` installer into an existing Python + installation or virtual environment. + +.. versionadded:: 2.7.9 + +The :mod:`ensurepip` package provides support for bootstrapping the ``pip`` +installer into an existing Python installation or virtual environment. This +bootstrapping approach reflects the fact that ``pip`` is an independent +project with its own release cycle, and the latest available stable version +is bundled with maintenance and feature releases of the CPython reference +interpreter. + +In most cases, end users of Python shouldn't need to invoke this module +directly (as ``pip`` should be bootstrapped by default), but it may be +needed if installing ``pip`` was skipped when installing Python (or +when creating a virtual environment) or after explicitly uninstalling ``pip``. + +.. note:: + + This module *does not* access the internet. All of the components + needed to bootstrap ``pip`` are included as internal parts of the + package. + +.. seealso:: + + :ref:`installing-index` + The end user guide for installing Python packages + + :pep:`453`: Explicit bootstrapping of pip in Python installations + The original rationale and specification for this module. 
+ + :pep:`477`: Backport ensurepip (PEP 453) to Python 2.7 + The rationale and specification for backporting PEP 453 to Python 2.7. + + +Command line interface +---------------------- + +The command line interface is invoked using the interpreter's ``-m`` switch. + +The simplest possible invocation is:: + + python -m ensurepip + +This invocation will install ``pip`` if it is not already installed, +but otherwise does nothing. To ensure the installed version of ``pip`` +is at least as recent as the one bundled with ``ensurepip``, pass the +``--upgrade`` option:: + + python -m ensurepip --upgrade + +By default, ``pip`` is installed into the current virtual environment +(if one is active) or into the system site packages (if there is no +active virtual environment). The installation location can be controlled +through two additional command line options: + +* ``--root ``: Installs ``pip`` relative to the given root directory + rather than the root of the currently active virtual environment (if any) + or the default root for the current Python installation. +* ``--user``: Installs ``pip`` into the user site packages directory rather + than globally for the current Python installation (this option is not + permitted inside an active virtual environment). + +By default, the scripts ``pip``, ``pipX``, and ``pipX.Y`` will be installed +(where X.Y stands for the version of Python used to invoke ``ensurepip``). The +scripts installed can be controlled through two additional command line +options: + +* ``--altinstall``: if an alternate installation is requested, the ``pip`` and + ``pipX`` script will *not* be installed. + +* ``--no-default-pip``: if a non-default installation is request, the ``pip`` + script will *not* be installed. + + +Module API +---------- + +:mod:`ensurepip` exposes two functions for programmatic use: + +.. function:: version() + + Returns a string specifying the bundled version of pip that will be + installed when bootstrapping an environment. + +.. function:: bootstrap(root=None, upgrade=False, user=False, \ + altinstall=False, default_pip=True, \ + verbosity=0) + + Bootstraps ``pip`` into the current or designated environment. + + *root* specifies an alternative root directory to install relative to. + If *root* is None, then installation uses the default install location + for the current environment. + + *upgrade* indicates whether or not to upgrade an existing installation + of an earlier version of ``pip`` to the bundled version. + + *user* indicates whether to use the user scheme rather than installing + globally. + + By default, the scripts ``pip``, ``pipX``, and ``pipX.Y`` will be installed + (where X.Y stands for the current version of Python). + + If *altinstall* is set, then ``pip`` and ``pipX`` will *not* be installed. + + If *default_pip* is set to ``False``, then ``pip`` will *not* be installed. + + Setting both *altinstall* and *default_pip* will trigger + :exc:`ValueError`. + + *verbosity* controls the level of output to :data:`sys.stdout` from the + bootstrapping operation. + + .. note:: + + The bootstrapping process has side effects on both ``sys.path`` and + ``os.environ``. Invoking the command line interface in a subprocess + instead allows these side effects to be avoided. + + .. note:: + + The bootstrapping process may install additional modules required by + ``pip``, but other software should not assume those dependencies will + always be present by default (as the dependencies may be removed in a + future version of ``pip``). 
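As an editorial aside for readers of this digest (not part of the patch), a minimal sketch of the module API documented above. It uses only the calls the new ensurepip.rst describes; because bootstrap() alters sys.path and os.environ, the subprocess form of the command line interface is shown as the side-effect-free alternative the docs recommend.

    import subprocess
    import sys

    import ensurepip

    print(ensurepip.version())     # bundled pip version, "1.5.6" in this patch

    # Programmatic equivalent of "python -m ensurepip --user --upgrade":
    ensurepip.bootstrap(user=True, upgrade=True, verbosity=1)

    # Side-effect-free alternative: run the CLI in a child process instead.
    subprocess.check_call([sys.executable, "-m", "ensurepip", "--upgrade"])
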
diff --git a/Doc/library/index.rst b/Doc/library/index.rst --- a/Doc/library/index.rst +++ b/Doc/library/index.rst @@ -63,6 +63,7 @@ tk.rst development.rst debug.rst + distribution.rst python.rst custominterp.rst restricted.rst diff --git a/Doc/library/python.rst b/Doc/library/python.rst --- a/Doc/library/python.rst +++ b/Doc/library/python.rst @@ -28,4 +28,3 @@ site.rst user.rst fpectl.rst - distutils.rst diff --git a/Doc/whatsnew/2.7.rst b/Doc/whatsnew/2.7.rst --- a/Doc/whatsnew/2.7.rst +++ b/Doc/whatsnew/2.7.rst @@ -2575,6 +2575,65 @@ Gaynor; :issue:`21305`.) +PEP 477: Backport ensurepip (PEP 453) to Python 2.7 +--------------------------------------------------- + +:pep:`477` approves the inclusion of the :pep:`453` ensurepip module and the +improved documentation that was enabled by it in the Python 2.7 maintenance +releases, appearing first in the the Python 2.7.9 release. + + +Bootstrapping pip By Default +~~~~~~~~~~~~~~~~~~~~~~~~~~~~ + +The new :mod:`ensurepip` module (defined in :pep:`453`) provides a standard +cross-platform mechanism to bootstrap the pip installer into Python +installations. The version of ``pip`` included with Python 2.7.9 is ``pip`` +1.5.6, and future 2.7.x maintenance releases will update the bundled version to +the latest version of ``pip`` that is available at the time of creating the +release candidate. + +By default, the commands ``pip``, ``pipX`` and ``pipX.Y`` will be installed on +all platforms (where X.Y stands for the version of the Python installation), +along with the ``pip`` Python package and its dependencies. + +On Windows and Mac OS X, the CPython installers now default to installing +``pip`` along with CPython itself (users may opt out of installing it +during the installation process). Window users will need to opt in to the +automatic ``PATH`` modifications to have ``pip`` available from the command +line by default, otherwise it can still be accessed through the Python +launcher for Windows as ``py -m pip``. + +As `discussed in the PEP`__, platform packagers may choose not to install +these commands by default, as long as, when invoked, they provide clear and +simple directions on how to install them on that platform (usually using +the system package manager). + +__ https://www.python.org/dev/peps/pep-0477/#disabling-ensurepip-by-downstream-distributors + + +Documentation Changes +~~~~~~~~~~~~~~~~~~~~~ + +As part of this change, the :ref:`installing-index` and +:ref:`distributing-index` sections of the documentation have been +completely redesigned as short getting started and FAQ documents. Most +packaging documentation has now been moved out to the Python Packaging +Authority maintained `Python Packaging User Guide +`__ and the documentation of the individual +projects. + +However, as this migration is currently still incomplete, the legacy +versions of those guides remaining available as :ref:`install-index` +and :ref:`distutils-index`. + +.. seealso:: + + :pep:`453` -- Explicit bootstrapping of pip in Python installations + PEP written by Donald Stufft and Nick Coghlan, implemented by + Donald Stufft, Nick Coghlan, Martin von L?wis and Ned Deily. + + .. ====================================================================== .. 
_acks27: diff --git a/Lib/ensurepip/__init__.py b/Lib/ensurepip/__init__.py new file mode 100644 --- /dev/null +++ b/Lib/ensurepip/__init__.py @@ -0,0 +1,227 @@ +#!/usr/bin/env python2 +from __future__ import print_function + +import os +import os.path +import pkgutil +import shutil +import sys +import tempfile + + +__all__ = ["version", "bootstrap"] + + +_SETUPTOOLS_VERSION = "3.6" + +_PIP_VERSION = "1.5.6" + +# pip currently requires ssl support, so we try to provide a nicer +# error message when that is missing (http://bugs.python.org/issue19744) +_MISSING_SSL_MESSAGE = ("pip {} requires SSL/TLS".format(_PIP_VERSION)) +try: + import ssl +except ImportError: + ssl = None + + def _require_ssl_for_pip(): + raise RuntimeError(_MISSING_SSL_MESSAGE) +else: + def _require_ssl_for_pip(): + pass + +_PROJECTS = [ + ("setuptools", _SETUPTOOLS_VERSION), + ("pip", _PIP_VERSION), +] + + +def _run_pip(args, additional_paths=None): + # Add our bundled software to the sys.path so we can import it + if additional_paths is not None: + sys.path = additional_paths + sys.path + + # Install the bundled software + import pip + pip.main(args) + + +def version(): + """ + Returns a string specifying the bundled version of pip. + """ + return _PIP_VERSION + + +def _disable_pip_configuration_settings(): + # We deliberately ignore all pip environment variables + # when invoking pip + # See http://bugs.python.org/issue19734 for details + keys_to_remove = [k for k in os.environ if k.startswith("PIP_")] + for k in keys_to_remove: + del os.environ[k] + # We also ignore the settings in the default pip configuration file + # See http://bugs.python.org/issue20053 for details + os.environ['PIP_CONFIG_FILE'] = os.devnull + + +def bootstrap(root=None, upgrade=False, user=False, + altinstall=False, default_pip=True, + verbosity=0): + """ + Bootstrap pip into the current Python installation (or the given root + directory). + + Note that calling this function will alter both sys.path and os.environ. 
+ """ + if altinstall and default_pip: + raise ValueError("Cannot use altinstall and default_pip together") + + _require_ssl_for_pip() + _disable_pip_configuration_settings() + + # By default, installing pip and setuptools installs all of the + # following scripts (X.Y == running Python version): + # + # pip, pipX, pipX.Y, easy_install, easy_install-X.Y + # + # pip 1.5+ allows ensurepip to request that some of those be left out + if altinstall: + # omit pip, pipX and easy_install + os.environ["ENSUREPIP_OPTIONS"] = "altinstall" + elif not default_pip: + # omit pip and easy_install + os.environ["ENSUREPIP_OPTIONS"] = "install" + + tmpdir = tempfile.mkdtemp() + try: + # Put our bundled wheels into a temporary directory and construct the + # additional paths that need added to sys.path + additional_paths = [] + for project, version in _PROJECTS: + wheel_name = "{}-{}-py2.py3-none-any.whl".format(project, version) + whl = pkgutil.get_data( + "ensurepip", + "_bundled/{}".format(wheel_name), + ) + with open(os.path.join(tmpdir, wheel_name), "wb") as fp: + fp.write(whl) + + additional_paths.append(os.path.join(tmpdir, wheel_name)) + + # Construct the arguments to be passed to the pip command + args = ["install", "--no-index", "--find-links", tmpdir] + if root: + args += ["--root", root] + if upgrade: + args += ["--upgrade"] + if user: + args += ["--user"] + if verbosity: + args += ["-" + "v" * verbosity] + + _run_pip(args + [p[0] for p in _PROJECTS], additional_paths) + finally: + shutil.rmtree(tmpdir, ignore_errors=True) + + +def _uninstall_helper(verbosity=0): + """Helper to support a clean default uninstall process on Windows + + Note that calling this function may alter os.environ. + """ + # Nothing to do if pip was never installed, or has been removed + try: + import pip + except ImportError: + return + + # If the pip version doesn't match the bundled one, leave it alone + if pip.__version__ != _PIP_VERSION: + msg = ("ensurepip will only uninstall a matching version " + "({!r} installed, {!r} bundled)") + print(msg.format(pip.__version__, _PIP_VERSION), file=sys.stderr) + return + + _require_ssl_for_pip() + _disable_pip_configuration_settings() + + # Construct the arguments to be passed to the pip command + args = ["uninstall", "-y"] + if verbosity: + args += ["-" + "v" * verbosity] + + _run_pip(args + [p[0] for p in reversed(_PROJECTS)]) + + +def _main(argv=None): + if ssl is None: + print("Ignoring ensurepip failure: {}".format(_MISSING_SSL_MESSAGE), + file=sys.stderr) + return + + import argparse + parser = argparse.ArgumentParser(prog="python -m ensurepip") + parser.add_argument( + "--version", + action="version", + version="pip {}".format(version()), + help="Show the version of pip that is bundled with this Python.", + ) + parser.add_argument( + "-v", "--verbose", + action="count", + default=0, + dest="verbosity", + help=("Give more output. 
Option is additive, and can be used up to 3 " + "times."), + ) + parser.add_argument( + "-U", "--upgrade", + action="store_true", + default=False, + help="Upgrade pip and dependencies, even if already installed.", + ) + parser.add_argument( + "--user", + action="store_true", + default=False, + help="Install using the user scheme.", + ) + parser.add_argument( + "--root", + default=None, + help="Install everything relative to this alternate root directory.", + ) + parser.add_argument( + "--altinstall", + action="store_true", + default=False, + help=("Make an alternate install, installing only the X.Y versioned" + "scripts (Default: pipX, pipX.Y, easy_install-X.Y)"), + ) + parser.add_argument( + "--default-pip", + action="store_true", + default=True, + dest="default_pip", + help=argparse.SUPPRESS, + ) + parser.add_argument( + "--no-default-pip", + action="store_false", + dest="default_pip", + help=("Make a non default install, installing only the X and X.Y " + "versioned scripts."), + ) + + args = parser.parse_args(argv) + + bootstrap( + root=args.root, + upgrade=args.upgrade, + user=args.user, + verbosity=args.verbosity, + altinstall=args.altinstall, + default_pip=args.default_pip, + ) diff --git a/Lib/ensurepip/__main__.py b/Lib/ensurepip/__main__.py new file mode 100644 --- /dev/null +++ b/Lib/ensurepip/__main__.py @@ -0,0 +1,4 @@ +import ensurepip + +if __name__ == "__main__": + ensurepip._main() diff --git a/Lib/ensurepip/_bundled/pip-1.5.6-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/pip-1.5.6-py2.py3-none-any.whl new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..097ab43430d4c1302b0be353a8c16407c370693b GIT binary patch [stripped] diff --git a/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..f0ffcfce5bb385e393a8385413f7a6092c51b33e GIT binary patch [stripped] diff --git a/Lib/ensurepip/_uninstall.py b/Lib/ensurepip/_uninstall.py new file mode 100644 --- /dev/null +++ b/Lib/ensurepip/_uninstall.py @@ -0,0 +1,30 @@ +"""Basic pip uninstallation support, helper for the Windows uninstaller""" + +import argparse +import ensurepip + + +def _main(argv=None): + parser = argparse.ArgumentParser(prog="python -m ensurepip._uninstall") + parser.add_argument( + "--version", + action="version", + version="pip {}".format(ensurepip.version()), + help="Show the version of pip this will attempt to uninstall.", + ) + parser.add_argument( + "-v", "--verbose", + action="count", + default=0, + dest="verbosity", + help=("Give more output. Option is additive, and can be used up to 3 " + "times."), + ) + + args = parser.parse_args(argv) + + ensurepip._uninstall_helper(verbosity=args.verbosity) + + +if __name__ == "__main__": + _main() diff --git a/Lib/test/_mock_backport.py b/Lib/test/_mock_backport.py new file mode 100644 --- /dev/null +++ b/Lib/test/_mock_backport.py @@ -0,0 +1,2352 @@ +# mock.py +# Test tools for mocking and patching. 
+# Maintained by Michael Foord +# Backport for other versions of Python available from +# http://pypi.python.org/pypi/mock + +__all__ = ( + 'Mock', + 'MagicMock', + 'patch', + 'sentinel', + 'DEFAULT', + 'ANY', + 'call', + 'create_autospec', + 'FILTER_DIR', + 'NonCallableMock', + 'NonCallableMagicMock', + 'mock_open', + 'PropertyMock', +) + + +__version__ = '1.0' + + +import inspect +import pprint +import sys + +from types import ModuleType +from functools import wraps, partial + + +_builtins = {name for name in __builtins__ if not name.startswith('_')} + +BaseExceptions = (BaseException,) +if 'java' in sys.platform: + # jython + import java + BaseExceptions = (BaseException, java.lang.Throwable) + + +FILTER_DIR = True + +# Workaround for issue #12370 +# Without this, the __class__ properties wouldn't be set correctly +_safe_super = super + +def _is_instance_mock(obj): + # can't use isinstance on Mock objects because they override __class__ + # The base class for all mocks is NonCallableMock + return issubclass(type(obj), NonCallableMock) + + +def _is_exception(obj): + return ( + isinstance(obj, BaseExceptions) or + isinstance(obj, type) and issubclass(obj, BaseExceptions) + ) + + +class _slotted(object): + __slots__ = ['a'] + + +DescriptorTypes = ( + type(_slotted.a), + property, +) + + +def _get_signature_object(func, as_instance, eat_self): + """ + Given an arbitrary, possibly callable object, try to create a suitable + signature object. + Return a (reduced func, signature) tuple, or None. + """ + if isinstance(func, type) and not as_instance: + # If it's a type and should be modelled as a type, use __init__. + try: + func = func.__init__ + except AttributeError: + return None + # Skip the `self` argument in __init__ + eat_self = True + elif not isinstance(func, FunctionTypes): + # If we really want to model an instance of the passed type, + # __call__ should be looked up, not __init__. + try: + func = func.__call__ + except AttributeError: + return None + if eat_self: + sig_func = partial(func, None) + else: + sig_func = func + try: + return func, inspect.signature(sig_func) + except ValueError: + # Certain callable types are not supported by inspect.signature() + return None + + +def _check_signature(func, mock, skipfirst, instance=False): + sig = _get_signature_object(func, instance, skipfirst) + if sig is None: + return + func, sig = sig + def checksig(_mock_self, *args, **kwargs): + sig.bind(*args, **kwargs) + _copy_func_details(func, checksig) + type(mock)._mock_check_sig = checksig + + +def _copy_func_details(func, funcopy): + funcopy.__name__ = func.__name__ + funcopy.__doc__ = func.__doc__ + try: + funcopy.__text_signature__ = func.__text_signature__ + except AttributeError: + pass + # we explicitly don't copy func.__dict__ into this copy as it would + # expose original attributes that should be mocked + try: + funcopy.__module__ = func.__module__ + except AttributeError: + pass + try: + funcopy.__defaults__ = func.__defaults__ + except AttributeError: + pass + try: + funcopy.__kwdefaults__ = func.__kwdefaults__ + except AttributeError: + pass + + +def _callable(obj): + if isinstance(obj, type): + return True + if getattr(obj, '__call__', None) is not None: + return True + return False + + +def _is_list(obj): + # checks for list or tuples + # XXXX badly named! + return type(obj) in (list, tuple) + + +def _instance_callable(obj): + """Given an object, return True if the object is callable. 
+ For classes, return True if instances would be callable.""" + if not isinstance(obj, type): + # already an instance + return getattr(obj, '__call__', None) is not None + + # *could* be broken by a class overriding __mro__ or __dict__ via + # a metaclass + for base in (obj,) + obj.__mro__: + if base.__dict__.get('__call__') is not None: + return True + return False + + +def _set_signature(mock, original, instance=False): + # creates a function with signature (*args, **kwargs) that delegates to a + # mock. It still does signature checking by calling a lambda with the same + # signature as the original. + if not _callable(original): + return + + skipfirst = isinstance(original, type) + result = _get_signature_object(original, instance, skipfirst) + if result is None: + return + func, sig = result + def checksig(*args, **kwargs): + sig.bind(*args, **kwargs) + _copy_func_details(func, checksig) + + name = original.__name__ + if not name.isidentifier(): + name = 'funcopy' + context = {'_checksig_': checksig, 'mock': mock} + src = """def %s(*args, **kwargs): + _checksig_(*args, **kwargs) + return mock(*args, **kwargs)""" % name + exec (src, context) + funcopy = context[name] + _setup_func(funcopy, mock) + return funcopy + + +def _setup_func(funcopy, mock): + funcopy.mock = mock + + # can't use isinstance with mocks + if not _is_instance_mock(mock): + return + + def assert_called_with(*args, **kwargs): + return mock.assert_called_with(*args, **kwargs) + def assert_called_once_with(*args, **kwargs): + return mock.assert_called_once_with(*args, **kwargs) + def assert_has_calls(*args, **kwargs): + return mock.assert_has_calls(*args, **kwargs) + def assert_any_call(*args, **kwargs): + return mock.assert_any_call(*args, **kwargs) + def reset_mock(): + funcopy.method_calls = _CallList() + funcopy.mock_calls = _CallList() + mock.reset_mock() + ret = funcopy.return_value + if _is_instance_mock(ret) and not ret is mock: + ret.reset_mock() + + funcopy.called = False + funcopy.call_count = 0 + funcopy.call_args = None + funcopy.call_args_list = _CallList() + funcopy.method_calls = _CallList() + funcopy.mock_calls = _CallList() + + funcopy.return_value = mock.return_value + funcopy.side_effect = mock.side_effect + funcopy._mock_children = mock._mock_children + + funcopy.assert_called_with = assert_called_with + funcopy.assert_called_once_with = assert_called_once_with + funcopy.assert_has_calls = assert_has_calls + funcopy.assert_any_call = assert_any_call + funcopy.reset_mock = reset_mock + + mock._mock_delegate = funcopy + + +def _is_magic(name): + return '__%s__' % name[2:-2] == name + + +class _SentinelObject(object): + "A unique, named, sentinel object." 
+ def __init__(self, name): + self.name = name + + def __repr__(self): + return 'sentinel.%s' % self.name + + +class _Sentinel(object): + """Access attributes to return a named object, usable as a sentinel.""" + def __init__(self): + self._sentinels = {} + + def __getattr__(self, name): + if name == '__bases__': + # Without this help(unittest.mock) raises an exception + raise AttributeError + return self._sentinels.setdefault(name, _SentinelObject(name)) + + +sentinel = _Sentinel() + +DEFAULT = sentinel.DEFAULT +_missing = sentinel.MISSING +_deleted = sentinel.DELETED + + +def _copy(value): + if type(value) in (dict, list, tuple, set): + return type(value)(value) + return value + + +_allowed_names = set( + [ + 'return_value', '_mock_return_value', 'side_effect', + '_mock_side_effect', '_mock_parent', '_mock_new_parent', + '_mock_name', '_mock_new_name' + ] +) + + +def _delegating_property(name): + _allowed_names.add(name) + _the_name = '_mock_' + name + def _get(self, name=name, _the_name=_the_name): + sig = self._mock_delegate + if sig is None: + return getattr(self, _the_name) + return getattr(sig, name) + def _set(self, value, name=name, _the_name=_the_name): + sig = self._mock_delegate + if sig is None: + self.__dict__[_the_name] = value + else: + setattr(sig, name, value) + + return property(_get, _set) + + + +class _CallList(list): + + def __contains__(self, value): + if not isinstance(value, list): + return list.__contains__(self, value) + len_value = len(value) + len_self = len(self) + if len_value > len_self: + return False + + for i in range(0, len_self - len_value + 1): + sub_list = self[i:i+len_value] + if sub_list == value: + return True + return False + + def __repr__(self): + return pprint.pformat(list(self)) + + +def _check_and_set_parent(parent, value, name, new_name): + if not _is_instance_mock(value): + return False + if ((value._mock_name or value._mock_new_name) or + (value._mock_parent is not None) or + (value._mock_new_parent is not None)): + return False + + _parent = parent + while _parent is not None: + # setting a mock (value) as a child or return value of itself + # should not modify the mock + if _parent is value: + return False + _parent = _parent._mock_new_parent + + if new_name: + value._mock_new_parent = parent + value._mock_new_name = new_name + if name: + value._mock_parent = parent + value._mock_name = name + return True + +# Internal class to identify if we wrapped an iterator object or not. 
+class _MockIter(object): + def __init__(self, obj): + self.obj = iter(obj) + def __iter__(self): + return self + def __next__(self): + return next(self.obj) + +class Base(object): + _mock_return_value = DEFAULT + _mock_side_effect = None + def __init__(self, *args, **kwargs): + pass + + + +class NonCallableMock(Base): + """A non-callable version of `Mock`""" + + def __new__(cls, *args, **kw): + # every instance has its own class + # so we can create magic methods on the + # class without stomping on other mocks + new = type(cls.__name__, (cls,), {'__doc__': cls.__doc__}) + instance = object.__new__(new) + return instance + + + def __init__( + self, spec=None, wraps=None, name=None, spec_set=None, + parent=None, _spec_state=None, _new_name='', _new_parent=None, + _spec_as_instance=False, _eat_self=None, unsafe=False, **kwargs + ): + if _new_parent is None: + _new_parent = parent + + __dict__ = self.__dict__ + __dict__['_mock_parent'] = parent + __dict__['_mock_name'] = name + __dict__['_mock_new_name'] = _new_name + __dict__['_mock_new_parent'] = _new_parent + + if spec_set is not None: + spec = spec_set + spec_set = True + if _eat_self is None: + _eat_self = parent is not None + + self._mock_add_spec(spec, spec_set, _spec_as_instance, _eat_self) + + __dict__['_mock_children'] = {} + __dict__['_mock_wraps'] = wraps + __dict__['_mock_delegate'] = None + + __dict__['_mock_called'] = False + __dict__['_mock_call_args'] = None + __dict__['_mock_call_count'] = 0 + __dict__['_mock_call_args_list'] = _CallList() + __dict__['_mock_mock_calls'] = _CallList() + + __dict__['method_calls'] = _CallList() + __dict__['_mock_unsafe'] = unsafe + + if kwargs: + self.configure_mock(**kwargs) + + _safe_super(NonCallableMock, self).__init__( + spec, wraps, name, spec_set, parent, + _spec_state + ) + + + def attach_mock(self, mock, attribute): + """ + Attach a mock as an attribute of this one, replacing its name and + parent. Calls to the attached mock will be recorded in the + `method_calls` and `mock_calls` attributes of this one.""" + mock._mock_parent = None + mock._mock_new_parent = None + mock._mock_name = '' + mock._mock_new_name = None + + setattr(self, attribute, mock) + + + def mock_add_spec(self, spec, spec_set=False): + """Add a spec to a mock. `spec` can either be an object or a + list of strings. Only attributes on the `spec` can be fetched as + attributes from the mock. 
+ + If `spec_set` is True then only attributes on the spec can be set.""" + self._mock_add_spec(spec, spec_set) + + + def _mock_add_spec(self, spec, spec_set, _spec_as_instance=False, + _eat_self=False): + _spec_class = None + _spec_signature = None + + if spec is not None and not _is_list(spec): + if isinstance(spec, type): + _spec_class = spec + else: + _spec_class = _get_class(spec) + res = _get_signature_object(spec, + _spec_as_instance, _eat_self) + _spec_signature = res and res[1] + + spec = dir(spec) + + __dict__ = self.__dict__ + __dict__['_spec_class'] = _spec_class + __dict__['_spec_set'] = spec_set + __dict__['_spec_signature'] = _spec_signature + __dict__['_mock_methods'] = spec + + + def __get_return_value(self): + ret = self._mock_return_value + if self._mock_delegate is not None: + ret = self._mock_delegate.return_value + + if ret is DEFAULT: + ret = self._get_child_mock( + _new_parent=self, _new_name='()' + ) + self.return_value = ret + return ret + + + def __set_return_value(self, value): + if self._mock_delegate is not None: + self._mock_delegate.return_value = value + else: + self._mock_return_value = value + _check_and_set_parent(self, value, None, '()') + + __return_value_doc = "The value to be returned when the mock is called." + return_value = property(__get_return_value, __set_return_value, + __return_value_doc) + + + @property + def __class__(self): + if self._spec_class is None: + return type(self) + return self._spec_class + + called = _delegating_property('called') + call_count = _delegating_property('call_count') + call_args = _delegating_property('call_args') + call_args_list = _delegating_property('call_args_list') + mock_calls = _delegating_property('mock_calls') + + + def __get_side_effect(self): + delegated = self._mock_delegate + if delegated is None: + return self._mock_side_effect + sf = delegated.side_effect + if sf is not None and not callable(sf) and not isinstance(sf, _MockIter): + sf = _MockIter(sf) + delegated.side_effect = sf + return sf + + def __set_side_effect(self, value): + value = _try_iter(value) + delegated = self._mock_delegate + if delegated is None: + self._mock_side_effect = value + else: + delegated.side_effect = value + + side_effect = property(__get_side_effect, __set_side_effect) + + + def reset_mock(self): + "Restore the mock object to its initial state." + self.called = False + self.call_args = None + self.call_count = 0 + self.mock_calls = _CallList() + self.call_args_list = _CallList() + self.method_calls = _CallList() + + for child in self._mock_children.values(): + if isinstance(child, _SpecState): + continue + child.reset_mock() + + ret = self._mock_return_value + if _is_instance_mock(ret) and ret is not self: + ret.reset_mock() + + + def configure_mock(self, **kwargs): + """Set attributes on the mock through keyword arguments. 
+ + Attributes plus return values and side effects can be set on child + mocks using standard dot notation and unpacking a dictionary in the + method call: + + >>> attrs = {'method.return_value': 3, 'other.side_effect': KeyError} + >>> mock.configure_mock(**attrs)""" + for arg, val in sorted(kwargs.items(), + # we sort on the number of dots so that + # attributes are set before we set attributes on + # attributes + key=lambda entry: entry[0].count('.')): + args = arg.split('.') + final = args.pop() + obj = self + for entry in args: + obj = getattr(obj, entry) + setattr(obj, final, val) + + + def __getattr__(self, name): + if name in {'_mock_methods', '_mock_unsafe'}: + raise AttributeError(name) + elif self._mock_methods is not None: + if name not in self._mock_methods or name in _all_magics: + raise AttributeError("Mock object has no attribute %r" % name) + elif _is_magic(name): + raise AttributeError(name) + if not self._mock_unsafe: + if name.startswith(('assert', 'assret')): + raise AttributeError(name) + + result = self._mock_children.get(name) + if result is _deleted: + raise AttributeError(name) + elif result is None: + wraps = None + if self._mock_wraps is not None: + # XXXX should we get the attribute without triggering code + # execution? + wraps = getattr(self._mock_wraps, name) + + result = self._get_child_mock( + parent=self, name=name, wraps=wraps, _new_name=name, + _new_parent=self + ) + self._mock_children[name] = result + + elif isinstance(result, _SpecState): + result = create_autospec( + result.spec, result.spec_set, result.instance, + result.parent, result.name + ) + self._mock_children[name] = result + + return result + + + def __repr__(self): + _name_list = [self._mock_new_name] + _parent = self._mock_new_parent + last = self + + dot = '.' + if _name_list == ['()']: + dot = '' + seen = set() + while _parent is not None: + last = _parent + + _name_list.append(_parent._mock_new_name + dot) + dot = '.' + if _parent._mock_new_name == '()': + dot = '' + + _parent = _parent._mock_new_parent + + # use ids here so as not to call __hash__ on the mocks + if id(_parent) in seen: + break + seen.add(id(_parent)) + + _name_list = list(reversed(_name_list)) + _first = last._mock_name or 'mock' + if len(_name_list) > 1: + if _name_list[1] not in ('()', '().'): + _first += '.' 
+ _name_list[0] = _first + name = ''.join(_name_list) + + name_string = '' + if name not in ('mock', 'mock.'): + name_string = ' name=%r' % name + + spec_string = '' + if self._spec_class is not None: + spec_string = ' spec=%r' + if self._spec_set: + spec_string = ' spec_set=%r' + spec_string = spec_string % self._spec_class.__name__ + return "<%s%s%s id='%s'>" % ( + type(self).__name__, + name_string, + spec_string, + id(self) + ) + + + def __dir__(self): + """Filter the output of `dir(mock)` to only useful members.""" + if not FILTER_DIR: + return object.__dir__(self) + + extras = self._mock_methods or [] + from_type = dir(type(self)) + from_dict = list(self.__dict__) + + from_type = [e for e in from_type if not e.startswith('_')] + from_dict = [e for e in from_dict if not e.startswith('_') or + _is_magic(e)] + return sorted(set(extras + from_type + from_dict + + list(self._mock_children))) + + + def __setattr__(self, name, value): + if name in _allowed_names: + # property setters go through here + return object.__setattr__(self, name, value) + elif (self._spec_set and self._mock_methods is not None and + name not in self._mock_methods and + name not in self.__dict__): + raise AttributeError("Mock object has no attribute '%s'" % name) + elif name in _unsupported_magics: + msg = 'Attempting to set unsupported magic method %r.' % name + raise AttributeError(msg) + elif name in _all_magics: + if self._mock_methods is not None and name not in self._mock_methods: + raise AttributeError("Mock object has no attribute '%s'" % name) + + if not _is_instance_mock(value): + setattr(type(self), name, _get_method(name, value)) + original = value + value = lambda *args, **kw: original(self, *args, **kw) + else: + # only set _new_name and not name so that mock_calls is tracked + # but not method calls + _check_and_set_parent(self, value, None, name) + setattr(type(self), name, value) + self._mock_children[name] = value + elif name == '__class__': + self._spec_class = value + return + else: + if _check_and_set_parent(self, value, name, name): + self._mock_children[name] = value + return object.__setattr__(self, name, value) + + + def __delattr__(self, name): + if name in _all_magics and name in type(self).__dict__: + delattr(type(self), name) + if name not in self.__dict__: + # for magic methods that are still MagicProxy objects and + # not set on the instance itself + return + + if name in self.__dict__: + object.__delattr__(self, name) + + obj = self._mock_children.get(name, _missing) + if obj is _deleted: + raise AttributeError(name) + if obj is not _missing: + del self._mock_children[name] + self._mock_children[name] = _deleted + + + def _format_mock_call_signature(self, args, kwargs): + name = self._mock_name or 'mock' + return _format_call_signature(name, args, kwargs) + + + def _format_mock_failure_message(self, args, kwargs): + message = 'Expected call: %s\nActual call: %s' + expected_string = self._format_mock_call_signature(args, kwargs) + call_args = self.call_args + if len(call_args) == 3: + call_args = call_args[1:] + actual_string = self._format_mock_call_signature(*call_args) + return message % (expected_string, actual_string) + + + def _call_matcher(self, _call): + """ + Given a call (or simply a (args, kwargs) tuple), return a + comparison key suitable for matching with other calls. + This is a best effort method which relies on the spec's signature, + if available, or falls back on the arguments themselves. 
+ """ + sig = self._spec_signature + if sig is not None: + if len(_call) == 2: + name = '' + args, kwargs = _call + else: + name, args, kwargs = _call + try: + return name, sig.bind(*args, **kwargs) + except TypeError as e: + return e.with_traceback(None) + else: + return _call + + def assert_not_called(_mock_self): + """assert that the mock was never called. + """ + self = _mock_self + if self.call_count != 0: + msg = ("Expected '%s' to not have been called. Called %s times." % + (self._mock_name or 'mock', self.call_count)) + raise AssertionError(msg) + + def assert_called_with(_mock_self, *args, **kwargs): + """assert that the mock was called with the specified arguments. + + Raises an AssertionError if the args and keyword args passed in are + different to the last call to the mock.""" + self = _mock_self + if self.call_args is None: + expected = self._format_mock_call_signature(args, kwargs) + raise AssertionError('Expected call: %s\nNot called' % (expected,)) + + def _error_message(): + msg = self._format_mock_failure_message(args, kwargs) + return msg + expected = self._call_matcher((args, kwargs)) + actual = self._call_matcher(self.call_args) + if expected != actual: + raise AssertionError(_error_message()) + + + def assert_called_once_with(_mock_self, *args, **kwargs): + """assert that the mock was called exactly once and with the specified + arguments.""" + self = _mock_self + if not self.call_count == 1: + msg = ("Expected '%s' to be called once. Called %s times." % + (self._mock_name or 'mock', self.call_count)) + raise AssertionError(msg) + return self.assert_called_with(*args, **kwargs) + + + def assert_has_calls(self, calls, any_order=False): + """assert the mock has been called with the specified calls. + The `mock_calls` list is checked for the calls. + + If `any_order` is False (the default) then the calls must be + sequential. There can be extra calls before or after the + specified calls. + + If `any_order` is True then the calls can be in any order, but + they must all appear in `mock_calls`.""" + expected = [self._call_matcher(c) for c in calls] + all_calls = _CallList(self._call_matcher(c) for c in self.mock_calls) + if not any_order: + if expected not in all_calls: + raise AssertionError( + 'Calls not found.\nExpected: %r\n' + 'Actual: %r' % (calls, self.mock_calls) + ) + return + + all_calls = list(all_calls) + + not_found = [] + for kall in expected: + try: + all_calls.remove(kall) + except ValueError: + not_found.append(kall) + if not_found: + raise AssertionError( + '%r not all found in call list' % (tuple(not_found),) + ) + + + def assert_any_call(self, *args, **kwargs): + """assert the mock has been called with the specified arguments. + + The assert passes if the mock has *ever* been called, unlike + `assert_called_with` and `assert_called_once_with` that only pass if + the call is the most recent one.""" + expected = self._call_matcher((args, kwargs)) + actual = [self._call_matcher(c) for c in self.call_args_list] + if expected not in actual: + expected_string = self._format_mock_call_signature(args, kwargs) + raise AssertionError( + '%s call not found' % expected_string + ) + + + def _get_child_mock(self, **kw): + """Create the child mocks for attributes and return value. + By default child mocks will be the same type as the parent. + Subclasses of Mock may want to override this to customize the way + child mocks are made. 
+ + For non-callable mocks the callable variant will be used (rather than + any custom subclass).""" + _type = type(self) + if not issubclass(_type, CallableMixin): + if issubclass(_type, NonCallableMagicMock): + klass = MagicMock + elif issubclass(_type, NonCallableMock) : + klass = Mock + else: + klass = _type.__mro__[1] + return klass(**kw) + + + +def _try_iter(obj): + if obj is None: + return obj + if _is_exception(obj): + return obj + if _callable(obj): + return obj + try: + return iter(obj) + except TypeError: + # XXXX backwards compatibility + # but this will blow up on first call - so maybe we should fail early? + return obj + + + +class CallableMixin(Base): + + def __init__(self, spec=None, side_effect=None, return_value=DEFAULT, + wraps=None, name=None, spec_set=None, parent=None, + _spec_state=None, _new_name='', _new_parent=None, **kwargs): + self.__dict__['_mock_return_value'] = return_value + + _safe_super(CallableMixin, self).__init__( + spec, wraps, name, spec_set, parent, + _spec_state, _new_name, _new_parent, **kwargs + ) + + self.side_effect = side_effect + + + def _mock_check_sig(self, *args, **kwargs): + # stub method that can be replaced with one with a specific signature + pass + + + def __call__(_mock_self, *args, **kwargs): + # can't use self in-case a function / method we are mocking uses self + # in the signature + _mock_self._mock_check_sig(*args, **kwargs) + return _mock_self._mock_call(*args, **kwargs) + + + def _mock_call(_mock_self, *args, **kwargs): + self = _mock_self + self.called = True + self.call_count += 1 + _new_name = self._mock_new_name + _new_parent = self._mock_new_parent + + _call = _Call((args, kwargs), two=True) + self.call_args = _call + self.call_args_list.append(_call) + self.mock_calls.append(_Call(('', args, kwargs))) + + seen = set() + skip_next_dot = _new_name == '()' + do_method_calls = self._mock_parent is not None + name = self._mock_name + while _new_parent is not None: + this_mock_call = _Call((_new_name, args, kwargs)) + if _new_parent._mock_new_name: + dot = '.' + if skip_next_dot: + dot = '' + + skip_next_dot = False + if _new_parent._mock_new_name == '()': + skip_next_dot = True + + _new_name = _new_parent._mock_new_name + dot + _new_name + + if do_method_calls: + if _new_name == name: + this_method_call = this_mock_call + else: + this_method_call = _Call((name, args, kwargs)) + _new_parent.method_calls.append(this_method_call) + + do_method_calls = _new_parent._mock_parent is not None + if do_method_calls: + name = _new_parent._mock_name + '.' + name + + _new_parent.mock_calls.append(this_mock_call) + _new_parent = _new_parent._mock_new_parent + + # use ids here so as not to call __hash__ on the mocks + _new_parent_id = id(_new_parent) + if _new_parent_id in seen: + break + seen.add(_new_parent_id) + + ret_val = DEFAULT + effect = self.side_effect + if effect is not None: + if _is_exception(effect): + raise effect + + if not _callable(effect): + result = next(effect) + if _is_exception(result): + raise result + if result is DEFAULT: + result = self.return_value + return result + + ret_val = effect(*args, **kwargs) + + if (self._mock_wraps is not None and + self._mock_return_value is DEFAULT): + return self._mock_wraps(*args, **kwargs) + if ret_val is DEFAULT: + ret_val = self.return_value + return ret_val + + + +class Mock(CallableMixin, NonCallableMock): + """ + Create a new `Mock` object. 
`Mock` takes several optional arguments + that specify the behaviour of the Mock object: + + * `spec`: This can be either a list of strings or an existing object (a + class or instance) that acts as the specification for the mock object. If + you pass in an object then a list of strings is formed by calling dir on + the object (excluding unsupported magic attributes and methods). Accessing + any attribute not in this list will raise an `AttributeError`. + + If `spec` is an object (rather than a list of strings) then + `mock.__class__` returns the class of the spec object. This allows mocks + to pass `isinstance` tests. + + * `spec_set`: A stricter variant of `spec`. If used, attempting to *set* + or get an attribute on the mock that isn't on the object passed as + `spec_set` will raise an `AttributeError`. + + * `side_effect`: A function to be called whenever the Mock is called. See + the `side_effect` attribute. Useful for raising exceptions or + dynamically changing return values. The function is called with the same + arguments as the mock, and unless it returns `DEFAULT`, the return + value of this function is used as the return value. + + If `side_effect` is an iterable then each call to the mock will return + the next value from the iterable. If any of the members of the iterable + are exceptions they will be raised instead of returned. + + * `return_value`: The value returned when the mock is called. By default + this is a new Mock (created on first access). See the + `return_value` attribute. + + * `wraps`: Item for the mock object to wrap. If `wraps` is not None then + calling the Mock will pass the call through to the wrapped object + (returning the real result). Attribute access on the mock will return a + Mock object that wraps the corresponding attribute of the wrapped object + (so attempting to access an attribute that doesn't exist will raise an + `AttributeError`). + + If the mock has an explicit `return_value` set then calls are not passed + to the wrapped object and the `return_value` is returned instead. + + * `name`: If the mock has a name then it will be used in the repr of the + mock. This can be useful for debugging. The name is propagated to child + mocks. + + Mocks can also be called with arbitrary keyword arguments. These will be + used to set attributes on the mock after it is created. 
+ """ + + + +def _dot_lookup(thing, comp, import_path): + try: + return getattr(thing, comp) + except AttributeError: + __import__(import_path) + return getattr(thing, comp) + + +def _importer(target): + components = target.split('.') + import_path = components.pop(0) + thing = __import__(import_path) + + for comp in components: + import_path += ".%s" % comp + thing = _dot_lookup(thing, comp, import_path) + return thing + + +def _is_started(patcher): + # XXXX horrible + return hasattr(patcher, 'is_local') + + +class _patch(object): + + attribute_name = None + _active_patches = [] + + def __init__( + self, getter, attribute, new, spec, create, + spec_set, autospec, new_callable, kwargs + ): + if new_callable is not None: + if new is not DEFAULT: + raise ValueError( + "Cannot use 'new' and 'new_callable' together" + ) + if autospec is not None: + raise ValueError( + "Cannot use 'autospec' and 'new_callable' together" + ) + + self.getter = getter + self.attribute = attribute + self.new = new + self.new_callable = new_callable + self.spec = spec + self.create = create + self.has_local = False + self.spec_set = spec_set + self.autospec = autospec + self.kwargs = kwargs + self.additional_patchers = [] + + + def copy(self): + patcher = _patch( + self.getter, self.attribute, self.new, self.spec, + self.create, self.spec_set, + self.autospec, self.new_callable, self.kwargs + ) + patcher.attribute_name = self.attribute_name + patcher.additional_patchers = [ + p.copy() for p in self.additional_patchers + ] + return patcher + + + def __call__(self, func): + if isinstance(func, type): + return self.decorate_class(func) + return self.decorate_callable(func) + + + def decorate_class(self, klass): + for attr in dir(klass): + if not attr.startswith(patch.TEST_PREFIX): + continue + + attr_value = getattr(klass, attr) + if not hasattr(attr_value, "__call__"): + continue + + patcher = self.copy() + setattr(klass, attr, patcher(attr_value)) + return klass + + + def decorate_callable(self, func): + if hasattr(func, 'patchings'): + func.patchings.append(self) + return func + + @wraps(func) + def patched(*args, **keywargs): + extra_args = [] + entered_patchers = [] + + exc_info = tuple() + try: + for patching in patched.patchings: + arg = patching.__enter__() + entered_patchers.append(patching) + if patching.attribute_name is not None: + keywargs.update(arg) + elif patching.new is DEFAULT: + extra_args.append(arg) + + args += tuple(extra_args) + return func(*args, **keywargs) + except: + if (patching not in entered_patchers and + _is_started(patching)): + # the patcher may have been started, but an exception + # raised whilst entering one of its additional_patchers + entered_patchers.append(patching) + # Pass the exception to __exit__ + exc_info = sys.exc_info() + # re-raise the exception + raise + finally: + for patching in reversed(entered_patchers): + patching.__exit__(*exc_info) + + patched.patchings = [self] + return patched + + + def get_original(self): + target = self.getter() + name = self.attribute + + original = DEFAULT + local = False + + try: + original = target.__dict__[name] + except (AttributeError, KeyError): + original = getattr(target, name, DEFAULT) + else: + local = True + + if name in _builtins and isinstance(target, ModuleType): + self.create = True + + if not self.create and original is DEFAULT: + raise AttributeError( + "%s does not have the attribute %r" % (target, name) + ) + return original, local + + + def __enter__(self): + """Perform the patch.""" + new, spec, spec_set = self.new, 
self.spec, self.spec_set + autospec, kwargs = self.autospec, self.kwargs + new_callable = self.new_callable + self.target = self.getter() + + # normalise False to None + if spec is False: + spec = None + if spec_set is False: + spec_set = None + if autospec is False: + autospec = None + + if spec is not None and autospec is not None: + raise TypeError("Can't specify spec and autospec") + if ((spec is not None or autospec is not None) and + spec_set not in (True, None)): + raise TypeError("Can't provide explicit spec_set *and* spec or autospec") + + original, local = self.get_original() + + if new is DEFAULT and autospec is None: + inherit = False + if spec is True: + # set spec to the object we are replacing + spec = original + if spec_set is True: + spec_set = original + spec = None + elif spec is not None: + if spec_set is True: + spec_set = spec + spec = None + elif spec_set is True: + spec_set = original + + if spec is not None or spec_set is not None: + if original is DEFAULT: + raise TypeError("Can't use 'spec' with create=True") + if isinstance(original, type): + # If we're patching out a class and there is a spec + inherit = True + + Klass = MagicMock + _kwargs = {} + if new_callable is not None: + Klass = new_callable + elif spec is not None or spec_set is not None: + this_spec = spec + if spec_set is not None: + this_spec = spec_set + if _is_list(this_spec): + not_callable = '__call__' not in this_spec + else: + not_callable = not callable(this_spec) + if not_callable: + Klass = NonCallableMagicMock + + if spec is not None: + _kwargs['spec'] = spec + if spec_set is not None: + _kwargs['spec_set'] = spec_set + + # add a name to mocks + if (isinstance(Klass, type) and + issubclass(Klass, NonCallableMock) and self.attribute): + _kwargs['name'] = self.attribute + + _kwargs.update(kwargs) + new = Klass(**_kwargs) + + if inherit and _is_instance_mock(new): + # we can only tell if the instance should be callable if the + # spec is not a list + this_spec = spec + if spec_set is not None: + this_spec = spec_set + if (not _is_list(this_spec) and not + _instance_callable(this_spec)): + Klass = NonCallableMagicMock + + _kwargs.pop('name') + new.return_value = Klass(_new_parent=new, _new_name='()', + **_kwargs) + elif autospec is not None: + # spec is ignored, new *must* be default, spec_set is treated + # as a boolean. Should we check spec is not None and that spec_set + # is a bool? + if new is not DEFAULT: + raise TypeError( + "autospec creates the mock for you. Can't specify " + "autospec and new." 
+ ) + if original is DEFAULT: + raise TypeError("Can't use 'autospec' with create=True") + spec_set = bool(spec_set) + if autospec is True: + autospec = original + + new = create_autospec(autospec, spec_set=spec_set, + _name=self.attribute, **kwargs) + elif kwargs: + # can't set keyword args when we aren't creating the mock + # XXXX If new is a Mock we could call new.configure_mock(**kwargs) + raise TypeError("Can't pass kwargs to a mock we aren't creating") + + new_attr = new + + self.temp_original = original + self.is_local = local + setattr(self.target, self.attribute, new_attr) + if self.attribute_name is not None: + extra_args = {} + if self.new is DEFAULT: + extra_args[self.attribute_name] = new + for patching in self.additional_patchers: + arg = patching.__enter__() + if patching.new is DEFAULT: + extra_args.update(arg) + return extra_args + + return new + + + def __exit__(self, *exc_info): + """Undo the patch.""" + if not _is_started(self): + raise RuntimeError('stop called on unstarted patcher') + + if self.is_local and self.temp_original is not DEFAULT: + setattr(self.target, self.attribute, self.temp_original) + else: + delattr(self.target, self.attribute) + if not self.create and not hasattr(self.target, self.attribute): + # needed for proxy objects like django settings + setattr(self.target, self.attribute, self.temp_original) + + del self.temp_original + del self.is_local + del self.target + for patcher in reversed(self.additional_patchers): + if _is_started(patcher): + patcher.__exit__(*exc_info) + + + def start(self): + """Activate a patch, returning any created mock.""" + result = self.__enter__() + self._active_patches.append(self) + return result + + + def stop(self): + """Stop an active patch.""" + try: + self._active_patches.remove(self) + except ValueError: + # If the patch hasn't been started this will fail + pass + + return self.__exit__() + + + +def _get_target(target): + try: + target, attribute = target.rsplit('.', 1) + except (TypeError, ValueError): + raise TypeError("Need a valid target to patch. You supplied: %r" % + (target,)) + getter = lambda: _importer(target) + return getter, attribute + + +def _patch_object( + target, attribute, new=DEFAULT, spec=None, + create=False, spec_set=None, autospec=None, + new_callable=None, **kwargs + ): + """ + patch the named member (`attribute`) on an object (`target`) with a mock + object. + + `patch.object` can be used as a decorator, class decorator or a context + manager. Arguments `new`, `spec`, `create`, `spec_set`, + `autospec` and `new_callable` have the same meaning as for `patch`. Like + `patch`, `patch.object` takes arbitrary keyword arguments for configuring + the mock object it creates. + + When used as a class decorator `patch.object` honours `patch.TEST_PREFIX` + for choosing which methods to wrap. + """ + getter = lambda: target + return _patch( + getter, attribute, new, spec, create, + spec_set, autospec, new_callable, kwargs + ) + + +def _patch_multiple(target, spec=None, create=False, spec_set=None, + autospec=None, new_callable=None, **kwargs): + """Perform multiple patches in a single call. It takes the object to be + patched (either as an object or a string to fetch the object by importing) + and keyword arguments for the patches:: + + with patch.multiple(settings, FIRST_PATCH='one', SECOND_PATCH='two'): + ... + + Use `DEFAULT` as the value if you want `patch.multiple` to create + mocks for you. 
In this case the created mocks are passed into a decorated + function by keyword, and a dictionary is returned when `patch.multiple` is + used as a context manager. + + `patch.multiple` can be used as a decorator, class decorator or a context + manager. The arguments `spec`, `spec_set`, `create`, + `autospec` and `new_callable` have the same meaning as for `patch`. These + arguments will be applied to *all* patches done by `patch.multiple`. + + When used as a class decorator `patch.multiple` honours `patch.TEST_PREFIX` + for choosing which methods to wrap. + """ + if type(target) is str: + getter = lambda: _importer(target) + else: + getter = lambda: target + + if not kwargs: + raise ValueError( + 'Must supply at least one keyword argument with patch.multiple' + ) + # need to wrap in a list for python 3, where items is a view + items = list(kwargs.items()) + attribute, new = items[0] + patcher = _patch( + getter, attribute, new, spec, create, spec_set, + autospec, new_callable, {} + ) + patcher.attribute_name = attribute + for attribute, new in items[1:]: + this_patcher = _patch( + getter, attribute, new, spec, create, spec_set, + autospec, new_callable, {} + ) + this_patcher.attribute_name = attribute + patcher.additional_patchers.append(this_patcher) + return patcher + + +def patch( + target, new=DEFAULT, spec=None, create=False, + spec_set=None, autospec=None, new_callable=None, **kwargs + ): + """ + `patch` acts as a function decorator, class decorator or a context + manager. Inside the body of the function or with statement, the `target` + is patched with a `new` object. When the function/with statement exits + the patch is undone. + + If `new` is omitted, then the target is replaced with a + `MagicMock`. If `patch` is used as a decorator and `new` is + omitted, the created mock is passed in as an extra argument to the + decorated function. If `patch` is used as a context manager the created + mock is returned by the context manager. + + `target` should be a string in the form `'package.module.ClassName'`. The + `target` is imported and the specified object replaced with the `new` + object, so the `target` must be importable from the environment you are + calling `patch` from. The target is imported when the decorated function + is executed, not at decoration time. + + The `spec` and `spec_set` keyword arguments are passed to the `MagicMock` + if patch is creating one for you. + + In addition you can pass `spec=True` or `spec_set=True`, which causes + patch to pass in the object being mocked as the spec/spec_set object. + + `new_callable` allows you to specify a different class, or callable object, + that will be called to create the `new` object. By default `MagicMock` is + used. + + A more powerful form of `spec` is `autospec`. If you set `autospec=True` + then the mock with be created with a spec from the object being replaced. + All attributes of the mock will also have the spec of the corresponding + attribute of the object being replaced. Methods and functions being + mocked will have their arguments checked and will raise a `TypeError` if + they are called with the wrong signature. For mocks replacing a class, + their return value (the 'instance') will have the same spec as the class. + + Instead of `autospec=True` you can pass `autospec=some_object` to use an + arbitrary object as the spec instead of the one being replaced. + + By default `patch` will fail to replace attributes that don't exist. 
If + you pass in `create=True`, and the attribute doesn't exist, patch will + create the attribute for you when the patched function is called, and + delete it again afterwards. This is useful for writing tests against + attributes that your production code creates at runtime. It is off by + default because it can be dangerous. With it switched on you can write + passing tests against APIs that don't actually exist! + + Patch can be used as a `TestCase` class decorator. It works by + decorating each test method in the class. This reduces the boilerplate + code when your test methods share a common patchings set. `patch` finds + tests by looking for method names that start with `patch.TEST_PREFIX`. + By default this is `test`, which matches the way `unittest` finds tests. + You can specify an alternative prefix by setting `patch.TEST_PREFIX`. + + Patch can be used as a context manager, with the with statement. Here the + patching applies to the indented block after the with statement. If you + use "as" then the patched object will be bound to the name after the + "as"; very useful if `patch` is creating a mock object for you. + + `patch` takes arbitrary keyword arguments. These will be passed to + the `Mock` (or `new_callable`) on construction. + + `patch.dict(...)`, `patch.multiple(...)` and `patch.object(...)` are + available for alternate use-cases. + """ + getter, attribute = _get_target(target) + return _patch( + getter, attribute, new, spec, create, + spec_set, autospec, new_callable, kwargs + ) + + +class _patch_dict(object): + """ + Patch a dictionary, or dictionary like object, and restore the dictionary + to its original state after the test. + + `in_dict` can be a dictionary or a mapping like container. If it is a + mapping then it must at least support getting, setting and deleting items + plus iterating over keys. + + `in_dict` can also be a string specifying the name of the dictionary, which + will then be fetched by importing it. + + `values` can be a dictionary of values to set in the dictionary. `values` + can also be an iterable of `(key, value)` pairs. + + If `clear` is True then the dictionary will be cleared before the new + values are set. + + `patch.dict` can also be called with arbitrary keyword arguments to set + values in the dictionary:: + + with patch.dict('sys.modules', mymodule=Mock(), other_module=Mock()): + ... + + `patch.dict` can be used as a context manager, decorator or class + decorator. When used as a class decorator `patch.dict` honours + `patch.TEST_PREFIX` for choosing which methods to wrap. + """ + + def __init__(self, in_dict, values=(), clear=False, **kwargs): + if isinstance(in_dict, str): + in_dict = _importer(in_dict) + self.in_dict = in_dict + # support any argument supported by dict(...) 
constructor + self.values = dict(values) + self.values.update(kwargs) + self.clear = clear + self._original = None + + + def __call__(self, f): + if isinstance(f, type): + return self.decorate_class(f) + @wraps(f) + def _inner(*args, **kw): + self._patch_dict() + try: + return f(*args, **kw) + finally: + self._unpatch_dict() + + return _inner + + + def decorate_class(self, klass): + for attr in dir(klass): + attr_value = getattr(klass, attr) + if (attr.startswith(patch.TEST_PREFIX) and + hasattr(attr_value, "__call__")): + decorator = _patch_dict(self.in_dict, self.values, self.clear) + decorated = decorator(attr_value) + setattr(klass, attr, decorated) + return klass + + + def __enter__(self): + """Patch the dict.""" + self._patch_dict() + + + def _patch_dict(self): + values = self.values + in_dict = self.in_dict + clear = self.clear + + try: + original = in_dict.copy() + except AttributeError: + # dict like object with no copy method + # must support iteration over keys + original = {} + for key in in_dict: + original[key] = in_dict[key] + self._original = original + + if clear: + _clear_dict(in_dict) + + try: + in_dict.update(values) + except AttributeError: + # dict like object with no update method + for key in values: + in_dict[key] = values[key] + + + def _unpatch_dict(self): + in_dict = self.in_dict + original = self._original + + _clear_dict(in_dict) + + try: + in_dict.update(original) + except AttributeError: + for key in original: + in_dict[key] = original[key] + + + def __exit__(self, *args): + """Unpatch the dict.""" + self._unpatch_dict() + return False + + start = __enter__ + stop = __exit__ + + +def _clear_dict(in_dict): + try: + in_dict.clear() + except AttributeError: + keys = list(in_dict) + for key in keys: + del in_dict[key] + + +def _patch_stopall(): + """Stop all active patches. 
LIFO to unroll nested patches.""" + for patch in reversed(_patch._active_patches): + patch.stop() + + +patch.object = _patch_object +patch.dict = _patch_dict +patch.multiple = _patch_multiple +patch.stopall = _patch_stopall +patch.TEST_PREFIX = 'test' + +magic_methods = ( + "lt le gt ge eq ne " + "getitem setitem delitem " + "len contains iter " + "hash str sizeof " + "enter exit " + "divmod neg pos abs invert " + "complex int float index " + "trunc floor ceil " + "bool next " +) + +numerics = ( + "add sub mul div floordiv mod lshift rshift and xor or pow truediv" +) +inplace = ' '.join('i%s' % n for n in numerics.split()) +right = ' '.join('r%s' % n for n in numerics.split()) + +# not including __prepare__, __instancecheck__, __subclasscheck__ +# (as they are metaclass methods) +# __del__ is not supported at all as it causes problems if it exists + +_non_defaults = set('__%s__' % method for method in [ + 'get', 'set', 'delete', 'reversed', 'missing', 'reduce', 'reduce_ex', + 'getinitargs', 'getnewargs', 'getstate', 'setstate', 'getformat', + 'setformat', 'repr', 'dir', 'subclasses', 'format', +]) + + +def _get_method(name, func): + "Turns a callable object (like a mock) into a real function" + def method(self, *args, **kw): + return func(self, *args, **kw) + method.__name__ = name + return method + + +_magics = set( + '__%s__' % method for method in + ' '.join([magic_methods, numerics, inplace, right]).split() +) + +_all_magics = _magics | _non_defaults + +_unsupported_magics = set([ + '__getattr__', '__setattr__', + '__init__', '__new__', '__prepare__' + '__instancecheck__', '__subclasscheck__', + '__del__' +]) + +_calculate_return_value = { + '__hash__': lambda self: object.__hash__(self), + '__str__': lambda self: object.__str__(self), + '__sizeof__': lambda self: object.__sizeof__(self), +} + +_return_values = { + '__lt__': NotImplemented, + '__gt__': NotImplemented, + '__le__': NotImplemented, + '__ge__': NotImplemented, + '__int__': 1, + '__contains__': False, + '__len__': 0, + '__exit__': False, + '__complex__': 1j, + '__float__': 1.0, + '__bool__': True, + '__index__': 1, +} + + +def _get_eq(self): + def __eq__(other): + ret_val = self.__eq__._mock_return_value + if ret_val is not DEFAULT: + return ret_val + return self is other + return __eq__ + +def _get_ne(self): + def __ne__(other): + if self.__ne__._mock_return_value is not DEFAULT: + return DEFAULT + return self is not other + return __ne__ + +def _get_iter(self): + def __iter__(): + ret_val = self.__iter__._mock_return_value + if ret_val is DEFAULT: + return iter([]) + # if ret_val was already an iterator, then calling iter on it should + # return the iterator unchanged + return iter(ret_val) + return __iter__ + +_side_effect_methods = { + '__eq__': _get_eq, + '__ne__': _get_ne, + '__iter__': _get_iter, +} + + + +def _set_return_value(mock, method, name): + fixed = _return_values.get(name, DEFAULT) + if fixed is not DEFAULT: + method.return_value = fixed + return + + return_calulator = _calculate_return_value.get(name) + if return_calulator is not None: + try: + return_value = return_calulator(mock) + except AttributeError: + # XXXX why do we return AttributeError here? + # set it as a side_effect instead? 
+ return_value = AttributeError(name) + method.return_value = return_value + return + + side_effector = _side_effect_methods.get(name) + if side_effector is not None: + method.side_effect = side_effector(mock) + + + +class MagicMixin(object): + def __init__(self, *args, **kw): + _safe_super(MagicMixin, self).__init__(*args, **kw) + self._mock_set_magics() + + + def _mock_set_magics(self): + these_magics = _magics + + if self._mock_methods is not None: + these_magics = _magics.intersection(self._mock_methods) + + remove_magics = set() + remove_magics = _magics - these_magics + + for entry in remove_magics: + if entry in type(self).__dict__: + # remove unneeded magic methods + delattr(self, entry) + + # don't overwrite existing attributes if called a second time + these_magics = these_magics - set(type(self).__dict__) + + _type = type(self) + for entry in these_magics: + setattr(_type, entry, MagicProxy(entry, self)) + + + +class NonCallableMagicMock(MagicMixin, NonCallableMock): + """A version of `MagicMock` that isn't callable.""" + def mock_add_spec(self, spec, spec_set=False): + """Add a spec to a mock. `spec` can either be an object or a + list of strings. Only attributes on the `spec` can be fetched as + attributes from the mock. + + If `spec_set` is True then only attributes on the spec can be set.""" + self._mock_add_spec(spec, spec_set) + self._mock_set_magics() + + + +class MagicMock(MagicMixin, Mock): + """ + MagicMock is a subclass of Mock with default implementations + of most of the magic methods. You can use MagicMock without having to + configure the magic methods yourself. + + If you use the `spec` or `spec_set` arguments then *only* magic + methods that exist in the spec will be created. + + Attributes and the return value of a `MagicMock` will also be `MagicMocks`. + """ + def mock_add_spec(self, spec, spec_set=False): + """Add a spec to a mock. `spec` can either be an object or a + list of strings. Only attributes on the `spec` can be fetched as + attributes from the mock. + + If `spec_set` is True then only attributes on the spec can be set.""" + self._mock_add_spec(spec, spec_set) + self._mock_set_magics() + + + +class MagicProxy(object): + def __init__(self, name, parent): + self.name = name + self.parent = parent + + def __call__(self, *args, **kwargs): + m = self.create_mock() + return m(*args, **kwargs) + + def create_mock(self): + entry = self.name + parent = self.parent + m = parent._get_child_mock(name=entry, _new_name=entry, + _new_parent=parent) + setattr(parent, entry, m) + _set_return_value(parent, m, entry) + return m + + def __get__(self, obj, _type=None): + return self.create_mock() + + + +class _ANY(object): + "A helper object that compares equal to everything." + + def __eq__(self, other): + return True + + def __ne__(self, other): + return False + + def __repr__(self): + return '' + +ANY = _ANY() + + + +def _format_call_signature(name, args, kwargs): + message = '%s(%%s)' % name + formatted_args = '' + args_string = ', '.join([repr(arg) for arg in args]) + kwargs_string = ', '.join([ + '%s=%r' % (key, value) for key, value in sorted(kwargs.items()) + ]) + if args_string: + formatted_args = args_string + if kwargs_string: + if formatted_args: + formatted_args += ', ' + formatted_args += kwargs_string + + return message % formatted_args + + + +class _Call(tuple): + """ + A tuple for holding the results of a call to a mock, either in the form + `(args, kwargs)` or `(name, args, kwargs)`. 
+ + If args or kwargs are empty then a call tuple will compare equal to + a tuple without those values. This makes comparisons less verbose:: + + _Call(('name', (), {})) == ('name',) + _Call(('name', (1,), {})) == ('name', (1,)) + _Call(((), {'a': 'b'})) == ({'a': 'b'},) + + The `_Call` object provides a useful shortcut for comparing with call:: + + _Call(((1, 2), {'a': 3})) == call(1, 2, a=3) + _Call(('foo', (1, 2), {'a': 3})) == call.foo(1, 2, a=3) + + If the _Call has no name then it will match any name. + """ + def __new__(cls, value=(), name=None, parent=None, two=False, + from_kall=True): + name = '' + args = () + kwargs = {} + _len = len(value) + if _len == 3: + name, args, kwargs = value + elif _len == 2: + first, second = value + if isinstance(first, str): + name = first + if isinstance(second, tuple): + args = second + else: + kwargs = second + else: + args, kwargs = first, second + elif _len == 1: + value, = value + if isinstance(value, str): + name = value + elif isinstance(value, tuple): + args = value + else: + kwargs = value + + if two: + return tuple.__new__(cls, (args, kwargs)) + + return tuple.__new__(cls, (name, args, kwargs)) + + + def __init__(self, value=(), name=None, parent=None, two=False, + from_kall=True): + self.name = name + self.parent = parent + self.from_kall = from_kall + + + def __eq__(self, other): + if other is ANY: + return True + try: + len_other = len(other) + except TypeError: + return False + + self_name = '' + if len(self) == 2: + self_args, self_kwargs = self + else: + self_name, self_args, self_kwargs = self + + other_name = '' + if len_other == 0: + other_args, other_kwargs = (), {} + elif len_other == 3: + other_name, other_args, other_kwargs = other + elif len_other == 1: + value, = other + if isinstance(value, tuple): + other_args = value + other_kwargs = {} + elif isinstance(value, str): + other_name = value + other_args, other_kwargs = (), {} + else: + other_args = () + other_kwargs = value + else: + # len 2 + # could be (name, args) or (name, kwargs) or (args, kwargs) + first, second = other + if isinstance(first, str): + other_name = first + if isinstance(second, tuple): + other_args, other_kwargs = second, {} + else: + other_args, other_kwargs = (), second + else: + other_args, other_kwargs = first, second + + if self_name and other_name != self_name: + return False + + # this order is important for ANY to work! 
+ return (other_args, other_kwargs) == (self_args, self_kwargs) + + + def __ne__(self, other): + return not self.__eq__(other) + + + def __call__(self, *args, **kwargs): + if self.name is None: + return _Call(('', args, kwargs), name='()') + + name = self.name + '()' + return _Call((self.name, args, kwargs), name=name, parent=self) + + + def __getattr__(self, attr): + if self.name is None: + return _Call(name=attr, from_kall=False) + name = '%s.%s' % (self.name, attr) + return _Call(name=name, parent=self, from_kall=False) + + + def count(self, *args, **kwargs): + return self.__getattr__('count')(*args, **kwargs) + + def index(self, *args, **kwargs): + return self.__getattr__('index')(*args, **kwargs) + + def __repr__(self): + if not self.from_kall: + name = self.name or 'call' + if name.startswith('()'): + name = 'call%s' % name + return name + + if len(self) == 2: + name = 'call' + args, kwargs = self + else: + name, args, kwargs = self + if not name: + name = 'call' + elif not name.startswith('()'): + name = 'call.%s' % name + else: + name = 'call%s' % name + return _format_call_signature(name, args, kwargs) + + + def call_list(self): + """For a call object that represents multiple calls, `call_list` + returns a list of all the intermediate calls as well as the + final call.""" + vals = [] + thing = self + while thing is not None: + if thing.from_kall: + vals.append(thing) + thing = thing.parent + return _CallList(reversed(vals)) + + +call = _Call(from_kall=False) + + + +def create_autospec(spec, spec_set=False, instance=False, _parent=None, + _name=None, **kwargs): + """Create a mock object using another object as a spec. Attributes on the + mock will use the corresponding attribute on the `spec` object as their + spec. + + Functions or methods being mocked will have their arguments checked + to check that they are called with the correct signature. + + If `spec_set` is True then attempting to set attributes that don't exist + on the spec object will raise an `AttributeError`. + + If a class is used as a spec then the return value of the mock (the + instance of the class) will have the same spec. You can use a class as the + spec for an instance object by passing `instance=True`. The returned mock + will only be callable if instances of the mock are callable. 
+ + `create_autospec` also takes arbitrary keyword arguments that are passed to + the constructor of the created mock.""" + if _is_list(spec): + # can't pass a list instance to the mock constructor as it will be + # interpreted as a list of strings + spec = type(spec) + + is_type = isinstance(spec, type) + + _kwargs = {'spec': spec} + if spec_set: + _kwargs = {'spec_set': spec} + elif spec is None: + # None we mock with a normal mock without a spec + _kwargs = {} + if _kwargs and instance: + _kwargs['_spec_as_instance'] = True + + _kwargs.update(kwargs) + + Klass = MagicMock + if type(spec) in DescriptorTypes: + # descriptors don't have a spec + # because we don't know what type they return + _kwargs = {} + elif not _callable(spec): + Klass = NonCallableMagicMock + elif is_type and instance and not _instance_callable(spec): + Klass = NonCallableMagicMock + + _name = _kwargs.pop('name', _name) + + _new_name = _name + if _parent is None: + # for a top level object no _new_name should be set + _new_name = '' + + mock = Klass(parent=_parent, _new_parent=_parent, _new_name=_new_name, + name=_name, **_kwargs) + + if isinstance(spec, FunctionTypes): + # should only happen at the top level because we don't + # recurse for functions + mock = _set_signature(mock, spec) + else: + _check_signature(spec, mock, is_type, instance) + + if _parent is not None and not instance: + _parent._mock_children[_name] = mock + + if is_type and not instance and 'return_value' not in kwargs: + mock.return_value = create_autospec(spec, spec_set, instance=True, + _name='()', _parent=mock) + + for entry in dir(spec): + if _is_magic(entry): + # MagicMock already does the useful magic methods for us + continue + + # XXXX do we need a better way of getting attributes without + # triggering code execution (?) Probably not - we need the actual + # object to mock it so we would rather trigger a property than mock + # the property descriptor. Likewise we want to mock out dynamically + # provided attributes. + # XXXX what about attributes that raise exceptions other than + # AttributeError on being fetched? + # we could be resilient against it, or catch and propagate the + # exception when the attribute is fetched from the mock + try: + original = getattr(spec, entry) + except AttributeError: + continue + + kwargs = {'spec': original} + if spec_set: + kwargs = {'spec_set': original} + + if not isinstance(original, FunctionTypes): + new = _SpecState(original, spec_set, mock, entry, instance) + mock._mock_children[entry] = new + else: + parent = mock + if isinstance(spec, FunctionTypes): + parent = mock.mock + + skipfirst = _must_skip(spec, entry, is_type) + kwargs['_eat_self'] = skipfirst + new = MagicMock(parent=parent, name=entry, _new_name=entry, + _new_parent=parent, + **kwargs) + mock._mock_children[entry] = new + _check_signature(original, new, skipfirst=skipfirst) + + # so functions created with _set_signature become instance attributes, + # *plus* their underlying mock exists in _mock_children of the parent + # mock. Adding to _mock_children may be unnecessary where we are also + # setting as an instance attribute? + if isinstance(new, FunctionTypes): + setattr(mock, entry, new) + + return mock + + +def _must_skip(spec, entry, is_type): + """ + Return whether we should skip the first argument on spec's `entry` + attribute. 
+ """ + if not isinstance(spec, type): + if entry in getattr(spec, '__dict__', {}): + # instance attribute - shouldn't skip + return False + spec = spec.__class__ + + for klass in spec.__mro__: + result = klass.__dict__.get(entry, DEFAULT) + if result is DEFAULT: + continue + if isinstance(result, (staticmethod, classmethod)): + return False + elif isinstance(getattr(result, '__get__', None), MethodWrapperTypes): + # Normal method => skip if looked up on type + # (if looked up on instance, self is already skipped) + return is_type + else: + return False + + # shouldn't get here unless function is a dynamically provided attribute + # XXXX untested behaviour + return is_type + + +def _get_class(obj): + try: + return obj.__class__ + except AttributeError: + # it is possible for objects to have no __class__ + return type(obj) + + +class _SpecState(object): + + def __init__(self, spec, spec_set=False, parent=None, + name=None, ids=None, instance=False): + self.spec = spec + self.ids = ids + self.spec_set = spec_set + self.parent = parent + self.instance = instance + self.name = name + + +FunctionTypes = ( + # python function + type(create_autospec), + # instance method + type(ANY.__eq__), +) + +MethodWrapperTypes = ( + type(ANY.__eq__.__get__), +) + + +file_spec = None + +def _iterate_read_data(read_data): + # Helper for mock_open: + # Retrieve lines from read_data via a generator so that separate calls to + # readline, read, and readlines are properly interleaved + data_as_list = ['{}\n'.format(l) for l in read_data.split('\n')] + + if data_as_list[-1] == '\n': + # If the last line ended in a newline, the list comprehension will have an + # extra entry that's just a newline. Remove this. + data_as_list = data_as_list[:-1] + else: + # If there wasn't an extra newline by itself, then the file being + # emulated doesn't have a newline to end the last line remove the + # newline that our naive format() added + data_as_list[-1] = data_as_list[-1][:-1] + + for line in data_as_list: + yield line + +def mock_open(mock=None, read_data=''): + """ + A helper function to create a mock to replace the use of `open`. It works + for `open` called directly or used as a context manager. + + The `mock` argument is the mock object to configure. If `None` (the + default) then a `MagicMock` will be created for you, with the API limited + to methods or attributes available on standard file handles. + + `read_data` is a string for the `read` methoddline`, and `readlines` of the + file handle to return. This is an empty string by default. 
+ """ + def _readlines_side_effect(*args, **kwargs): + if handle.readlines.return_value is not None: + return handle.readlines.return_value + return list(_data) + + def _read_side_effect(*args, **kwargs): + if handle.read.return_value is not None: + return handle.read.return_value + return ''.join(_data) + + def _readline_side_effect(): + if handle.readline.return_value is not None: + while True: + yield handle.readline.return_value + for line in _data: + yield line + + + global file_spec + if file_spec is None: + import _io + file_spec = list(set(dir(_io.TextIOWrapper)).union(set(dir(_io.BytesIO)))) + + if mock is None: + mock = MagicMock(name='open', spec=open) + + handle = MagicMock(spec=file_spec) + handle.__enter__.return_value = handle + + _data = _iterate_read_data(read_data) + + handle.write.return_value = None + handle.read.return_value = None + handle.readline.return_value = None + handle.readlines.return_value = None + + handle.read.side_effect = _read_side_effect + handle.readline.side_effect = _readline_side_effect() + handle.readlines.side_effect = _readlines_side_effect + + mock.return_value = handle + return mock + + +class PropertyMock(Mock): + """ + A mock intended to be used as a property, or other descriptor, on a class. + `PropertyMock` provides `__get__` and `__set__` methods so you can specify + a return value when it is fetched. + + Fetching a `PropertyMock` instance from an object calls the mock, with + no args. Setting it calls the mock with the value being set. + """ + def _get_child_mock(self, **kwargs): + return MagicMock(**kwargs) + + def __get__(self, obj, obj_type): + return self() + def __set__(self, obj, val): + self(val) diff --git a/Lib/test/test_ensurepip.py b/Lib/test/test_ensurepip.py new file mode 100644 --- /dev/null +++ b/Lib/test/test_ensurepip.py @@ -0,0 +1,352 @@ +import unittest +import os +import os.path +import contextlib +import sys +import test._mock_backport as mock +import test.test_support + +import ensurepip +import ensurepip._uninstall + +# pip currently requires ssl support, so we ensure we handle +# it being missing (http://bugs.python.org/issue19744) +ensurepip_no_ssl = test.test_support.import_fresh_module("ensurepip", + blocked=["ssl"]) +try: + import ssl +except ImportError: + ssl = None + + def requires_usable_pip(f): + deco = unittest.skip(ensurepip._MISSING_SSL_MESSAGE) + return deco(f) +else: + def requires_usable_pip(f): + return f + + +class TestEnsurePipVersion(unittest.TestCase): + + def test_returns_version(self): + self.assertEqual(ensurepip._PIP_VERSION, ensurepip.version()) + + +class EnsurepipMixin: + + def setUp(self): + run_pip_patch = mock.patch("ensurepip._run_pip") + self.run_pip = run_pip_patch.start() + self.addCleanup(run_pip_patch.stop) + + # Avoid side effects on the actual os module + real_devnull = os.devnull + os_patch = mock.patch("ensurepip.os") + patched_os = os_patch.start() + self.addCleanup(os_patch.stop) + patched_os.devnull = real_devnull + patched_os.path = os.path + self.os_environ = patched_os.environ = os.environ.copy() + + +class TestBootstrap(EnsurepipMixin, unittest.TestCase): + + @requires_usable_pip + def test_basic_bootstrapping(self): + ensurepip.bootstrap() + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "setuptools", "pip", + ], + mock.ANY, + ) + + additional_paths = self.run_pip.call_args[0][1] + self.assertEqual(len(additional_paths), 2) + + @requires_usable_pip + def test_bootstrapping_with_root(self): + 
ensurepip.bootstrap(root="/foo/bar/") + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "--root", "/foo/bar/", + "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_user(self): + ensurepip.bootstrap(user=True) + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "--user", "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_upgrade(self): + ensurepip.bootstrap(upgrade=True) + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "--upgrade", "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_verbosity_1(self): + ensurepip.bootstrap(verbosity=1) + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "-v", "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_verbosity_2(self): + ensurepip.bootstrap(verbosity=2) + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "-vv", "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_verbosity_3(self): + ensurepip.bootstrap(verbosity=3) + + self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "-vvv", "setuptools", "pip", + ], + mock.ANY, + ) + + @requires_usable_pip + def test_bootstrapping_with_regular_install(self): + ensurepip.bootstrap() + self.assertEqual(self.os_environ["ENSUREPIP_OPTIONS"], "install") + + @requires_usable_pip + def test_bootstrapping_with_alt_install(self): + ensurepip.bootstrap(altinstall=True) + self.assertEqual(self.os_environ["ENSUREPIP_OPTIONS"], "altinstall") + + @requires_usable_pip + def test_bootstrapping_with_default_pip(self): + ensurepip.bootstrap(default_pip=True) + self.assertNotIn("ENSUREPIP_OPTIONS", self.os_environ) + + def test_altinstall_default_pip_conflict(self): + with self.assertRaises(ValueError): + ensurepip.bootstrap(altinstall=True, default_pip=True) + self.assertFalse(self.run_pip.called) + + @requires_usable_pip + def test_pip_environment_variables_removed(self): + # ensurepip deliberately ignores all pip environment variables + # See http://bugs.python.org/issue19734 for details + self.os_environ["PIP_THIS_SHOULD_GO_AWAY"] = "test fodder" + ensurepip.bootstrap() + self.assertNotIn("PIP_THIS_SHOULD_GO_AWAY", self.os_environ) + + @requires_usable_pip + def test_pip_config_file_disabled(self): + # ensurepip deliberately ignores the pip config file + # See http://bugs.python.org/issue20053 for details + ensurepip.bootstrap() + self.assertEqual(self.os_environ["PIP_CONFIG_FILE"], os.devnull) + + + at contextlib.contextmanager +def fake_pip(version=ensurepip._PIP_VERSION): + if version is None: + pip = None + else: + class FakePip(): + __version__ = version + pip = FakePip() + sentinel = object() + orig_pip = sys.modules.get("pip", sentinel) + sys.modules["pip"] = pip + try: + yield pip + finally: + if orig_pip is sentinel: + del sys.modules["pip"] + else: + sys.modules["pip"] = orig_pip + + +class TestUninstall(EnsurepipMixin, unittest.TestCase): + + def test_uninstall_skipped_when_not_installed(self): + with fake_pip(None): + ensurepip._uninstall_helper() + self.assertFalse(self.run_pip.called) + + def test_uninstall_skipped_with_warning_for_wrong_version(self): + with fake_pip("not a valid version"): + with 
test.test_support.captured_stderr() as stderr: + ensurepip._uninstall_helper() + warning = stderr.getvalue().strip() + self.assertIn("only uninstall a matching version", warning) + self.assertFalse(self.run_pip.called) + + @requires_usable_pip + def test_uninstall(self): + with fake_pip(): + ensurepip._uninstall_helper() + + self.run_pip.assert_called_once_with( + ["uninstall", "-y", "pip", "setuptools"] + ) + + @requires_usable_pip + def test_uninstall_with_verbosity_1(self): + with fake_pip(): + ensurepip._uninstall_helper(verbosity=1) + + self.run_pip.assert_called_once_with( + ["uninstall", "-y", "-v", "pip", "setuptools"] + ) + + @requires_usable_pip + def test_uninstall_with_verbosity_2(self): + with fake_pip(): + ensurepip._uninstall_helper(verbosity=2) + + self.run_pip.assert_called_once_with( + ["uninstall", "-y", "-vv", "pip", "setuptools"] + ) + + @requires_usable_pip + def test_uninstall_with_verbosity_3(self): + with fake_pip(): + ensurepip._uninstall_helper(verbosity=3) + + self.run_pip.assert_called_once_with( + ["uninstall", "-y", "-vvv", "pip", "setuptools"] + ) + + @requires_usable_pip + def test_pip_environment_variables_removed(self): + # ensurepip deliberately ignores all pip environment variables + # See http://bugs.python.org/issue19734 for details + self.os_environ["PIP_THIS_SHOULD_GO_AWAY"] = "test fodder" + with fake_pip(): + ensurepip._uninstall_helper() + self.assertNotIn("PIP_THIS_SHOULD_GO_AWAY", self.os_environ) + + @requires_usable_pip + def test_pip_config_file_disabled(self): + # ensurepip deliberately ignores the pip config file + # See http://bugs.python.org/issue20053 for details + with fake_pip(): + ensurepip._uninstall_helper() + self.assertEqual(self.os_environ["PIP_CONFIG_FILE"], os.devnull) + + +class TestMissingSSL(EnsurepipMixin, unittest.TestCase): + + def setUp(self): + sys.modules["ensurepip"] = ensurepip_no_ssl + + @self.addCleanup + def restore_module(): + sys.modules["ensurepip"] = ensurepip + super(TestMissingSSL, self).setUp() + + def test_bootstrap_requires_ssl(self): + self.os_environ["PIP_THIS_SHOULD_STAY"] = "test fodder" + with self.assertRaisesRegexp(RuntimeError, "requires SSL/TLS"): + ensurepip_no_ssl.bootstrap() + self.assertFalse(self.run_pip.called) + self.assertIn("PIP_THIS_SHOULD_STAY", self.os_environ) + + def test_uninstall_requires_ssl(self): + self.os_environ["PIP_THIS_SHOULD_STAY"] = "test fodder" + with self.assertRaisesRegexp(RuntimeError, "requires SSL/TLS"): + with fake_pip(): + ensurepip_no_ssl._uninstall_helper() + self.assertFalse(self.run_pip.called) + self.assertIn("PIP_THIS_SHOULD_STAY", self.os_environ) + + def test_main_exits_early_with_warning(self): + with test.test_support.captured_stderr() as stderr: + ensurepip_no_ssl._main(["--version"]) + warning = stderr.getvalue().strip() + self.assertTrue(warning.endswith("requires SSL/TLS"), warning) + self.assertFalse(self.run_pip.called) + +# Basic testing of the main functions and their argument parsing + +EXPECTED_VERSION_OUTPUT = "pip " + ensurepip._PIP_VERSION + + +class TestBootstrappingMainFunction(EnsurepipMixin, unittest.TestCase): + + @requires_usable_pip + def test_bootstrap_version(self): + with test.test_support.captured_stderr() as stderr: + with self.assertRaises(SystemExit): + ensurepip._main(["--version"]) + result = stderr.getvalue().strip() + self.assertEqual(result, EXPECTED_VERSION_OUTPUT) + self.assertFalse(self.run_pip.called) + + @requires_usable_pip + def test_basic_bootstrapping(self): + ensurepip._main([]) + + 
self.run_pip.assert_called_once_with( + [ + "install", "--no-index", "--find-links", + mock.ANY, "setuptools", "pip", + ], + mock.ANY, + ) + + additional_paths = self.run_pip.call_args[0][1] + self.assertEqual(len(additional_paths), 2) + + +class TestUninstallationMainFunction(EnsurepipMixin, unittest.TestCase): + + def test_uninstall_version(self): + with test.test_support.captured_stderr() as stderr: + with self.assertRaises(SystemExit): + ensurepip._uninstall._main(["--version"]) + result = stderr.getvalue().strip() + self.assertEqual(result, EXPECTED_VERSION_OUTPUT) + self.assertFalse(self.run_pip.called) + + @requires_usable_pip + def test_basic_uninstall(self): + with fake_pip(): + ensurepip._uninstall._main([]) + + self.run_pip.assert_called_once_with( + ["uninstall", "-y", "pip", "setuptools"] + ) + + +if __name__ == "__main__": + test.test_support.run_unittest(__name__) diff --git a/Makefile.pre.in b/Makefile.pre.in --- a/Makefile.pre.in +++ b/Makefile.pre.in @@ -947,6 +947,7 @@ test/tracedmodules \ encodings compiler hotshot \ email email/mime email/test email/test/data \ + ensurepip ensurepip/_bundled \ json json/tests \ sqlite3 sqlite3/test \ logging bsddb bsddb/test csv importlib wsgiref \ diff --git a/Tools/scripts/checkpip.py b/Tools/scripts/checkpip.py new file mode 100644 --- /dev/null +++ b/Tools/scripts/checkpip.py @@ -0,0 +1,31 @@ +#!/usr/bin/env python2 +""" +Checks that the version of the projects bundled in ensurepip are the latest +versions available. +""" +import ensurepip +import json +import urllib2 +import sys + + +def main(): + outofdate = False + + for project, version in ensurepip._PROJECTS: + data = json.loads(urllib2.urlopen( + "https://pypi.python.org/pypi/{}/json".format(project), + ).read().decode("utf8")) + upstream_version = data["info"]["version"] + + if version != upstream_version: + outofdate = True + print("The latest version of {} on PyPI is {}, but ensurepip " + "has {}".format(project, upstream_version, version)) + + if outofdate: + sys.exit(1) + + +if __name__ == "__main__": + main() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 16:54:16 2014 From: python-checkins at python.org (donald.stufft) Date: Tue, 11 Nov 2014 15:54:16 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Upgrade_setupt?= =?utf-8?q?ools_to_7=2E0?= Message-ID: <20141111155404.118387.9654@psf.io> https://hg.python.org/cpython/rev/ed696903ad48 changeset: 93472:ed696903ad48 branch: 2.7 user: Donald Stufft date: Tue Nov 11 10:53:50 2014 -0500 summary: Upgrade setuptools to 7.0 files: Lib/ensurepip/__init__.py | 2 +- Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl | Bin Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl | Bin 3 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/ensurepip/__init__.py b/Lib/ensurepip/__init__.py --- a/Lib/ensurepip/__init__.py +++ b/Lib/ensurepip/__init__.py @@ -12,7 +12,7 @@ __all__ = ["version", "bootstrap"] -_SETUPTOOLS_VERSION = "3.6" +_SETUPTOOLS_VERSION = "7.0" _PIP_VERSION = "1.5.6" diff --git a/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl deleted file mode 100644 index f0ffcfce5bb385e393a8385413f7a6092c51b33e..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 GIT binary patch [stripped] diff --git a/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl new file mode 100644 index 
e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..fa1d1054da1dab98f8906555d31a9fda271b3a85 GIT binary patch [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 17:02:02 2014 From: python-checkins at python.org (donald.stufft) Date: Tue, 11 Nov 2014 16:02:02 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Upgrade_setupt?= =?utf-8?q?ools_to_7=2E0?= Message-ID: <20141111160115.9575.48252@psf.io> https://hg.python.org/cpython/rev/33908f14c0eb changeset: 93473:33908f14c0eb branch: 3.4 parent: 93468:d676f2725699 user: Donald Stufft date: Tue Nov 11 11:01:09 2014 -0500 summary: Upgrade setuptools to 7.0 files: Lib/ensurepip/__init__.py | 2 +- Lib/ensurepip/_bundled/setuptools-2.1-py2.py3-none-any.whl | Bin Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl | Bin 3 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/ensurepip/__init__.py b/Lib/ensurepip/__init__.py --- a/Lib/ensurepip/__init__.py +++ b/Lib/ensurepip/__init__.py @@ -8,7 +8,7 @@ __all__ = ["version", "bootstrap"] -_SETUPTOOLS_VERSION = "2.1" +_SETUPTOOLS_VERSION = "7.0" _PIP_VERSION = "1.5.6" diff --git a/Lib/ensurepip/_bundled/setuptools-2.1-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-2.1-py2.py3-none-any.whl deleted file mode 100644 index ed77b59e632f32d09a3ae52adaa7f3e6659d8b48..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 GIT binary patch [stripped] diff --git a/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..fa1d1054da1dab98f8906555d31a9fda271b3a85 GIT binary patch [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 17:08:59 2014 From: python-checkins at python.org (donald.stufft) Date: Tue, 11 Nov 2014 16:08:59 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_-_Upgrade_setuptools_to_7=2E0?= Message-ID: <20141111160701.118383.98440@psf.io> https://hg.python.org/cpython/rev/d25c58a420d6 changeset: 93474:d25c58a420d6 parent: 93469:ac0334665459 parent: 93473:33908f14c0eb user: Donald Stufft date: Tue Nov 11 11:06:49 2014 -0500 summary: Merge - Upgrade setuptools to 7.0 files: Lib/ensurepip/__init__.py | 2 +- Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl | Bin Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl | Bin 3 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/ensurepip/__init__.py b/Lib/ensurepip/__init__.py --- a/Lib/ensurepip/__init__.py +++ b/Lib/ensurepip/__init__.py @@ -8,7 +8,7 @@ __all__ = ["version", "bootstrap"] -_SETUPTOOLS_VERSION = "3.6" +_SETUPTOOLS_VERSION = "7.0" _PIP_VERSION = "1.5.6" diff --git a/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-3.6-py2.py3-none-any.whl deleted file mode 100644 index f0ffcfce5bb385e393a8385413f7a6092c51b33e..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 GIT binary patch [stripped] diff --git a/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl b/Lib/ensurepip/_bundled/setuptools-7.0-py2.py3-none-any.whl new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..fa1d1054da1dab98f8906555d31a9fda271b3a85 GIT binary patch [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 18:33:24 2014 From: python-checkins at python.org (donald.stufft) Date: Tue, 11 Nov 2014 17:33:24 +0000 Subject: 
[Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogRGVmaW5lIGEgX19o?= =?utf-8?q?ash=5F=5F_to_quiet_down_a_-3_warning?= Message-ID: <20141111173302.118381.24834@psf.io> https://hg.python.org/cpython/rev/e4c32152b25b changeset: 93475:e4c32152b25b branch: 2.7 parent: 93472:ed696903ad48 user: Donald Stufft date: Tue Nov 11 12:32:57 2014 -0500 summary: Define a __hash__ to quiet down a -3 warning files: Lib/test/_mock_backport.py | 5 +++++ 1 files changed, 5 insertions(+), 0 deletions(-) diff --git a/Lib/test/_mock_backport.py b/Lib/test/_mock_backport.py --- a/Lib/test/_mock_backport.py +++ b/Lib/test/_mock_backport.py @@ -1873,6 +1873,8 @@ class _ANY(object): "A helper object that compares equal to everything." + __hash__ = object.__hash__ + def __eq__(self, other): return True @@ -1923,6 +1925,9 @@ If the _Call has no name then it will match any name. """ + + __hash__ = object.__hash__ + def __new__(cls, value=(), name=None, parent=None, two=False, from_kall=True): name = '' -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 11 20:16:13 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 11 Nov 2014 19:16:13 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Minor_code_clean_up_and_im?= =?utf-8?q?provements_in_the_re_module=2E?= Message-ID: <20141111191528.21117.82488@psf.io> https://hg.python.org/cpython/rev/30a6c74ad87f changeset: 93476:30a6c74ad87f parent: 93474:d25c58a420d6 user: Serhiy Storchaka date: Tue Nov 11 21:13:28 2014 +0200 summary: Minor code clean up and improvements in the re module. files: Lib/re.py | 2 +- Lib/sre_compile.py | 16 ++++++---------- Lib/sre_parse.py | 8 ++++---- Lib/test/test_re.py | 4 ++-- 4 files changed, 13 insertions(+), 17 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -363,7 +363,7 @@ append = result.append match = self.scanner.scanner(string).match i = 0 - while 1: + while True: m = match() if not m: break diff --git a/Lib/sre_compile.py b/Lib/sre_compile.py --- a/Lib/sre_compile.py +++ b/Lib/sre_compile.py @@ -16,11 +16,6 @@ assert _sre.MAGIC == MAGIC, "SRE module mismatch" -if _sre.CODESIZE == 2: - MAXCODE = 65535 -else: - MAXCODE = 0xFFFFFFFF - _LITERAL_CODES = {LITERAL, NOT_LITERAL} _REPEATING_CODES = {REPEAT, MIN_REPEAT, MAX_REPEAT} _SUCCESS_CODES = {SUCCESS, FAILURE} @@ -191,7 +186,7 @@ emit(JUMP) tailappend(_len(code)); emit(0) code[skip] = _len(code) - skip - emit(0) # end of branch + emit(FAILURE) # end of branch for tail in tail: code[tail] = _len(code) - tail elif op is CATEGORY: @@ -374,6 +369,7 @@ return out _CODEBITS = _sre.CODESIZE * 8 +MAXCODE = (1 << _CODEBITS) - 1 _BITS_TRANS = b'0' + b'1' * 255 def _mk_bitmap(bits, _CODEBITS=_CODEBITS, _int=int): s = bits.translate(_BITS_TRANS)[::-1] @@ -477,9 +473,9 @@ elif op is IN: charset = av ## if prefix: -## print "*** PREFIX", prefix, prefix_skip +## print("*** PREFIX", prefix, prefix_skip) ## if charset: -## print "*** CHARSET", charset +## print("*** CHARSET", charset) # add an info block emit = code.append emit(INFO) @@ -489,9 +485,9 @@ if prefix: mask = SRE_INFO_PREFIX if len(prefix) == prefix_skip == len(pattern.data): - mask = mask + SRE_INFO_LITERAL + mask = mask | SRE_INFO_LITERAL elif charset: - mask = mask + SRE_INFO_CHARSET + mask = mask | SRE_INFO_CHARSET emit(mask) # pattern length if lo < MAXCODE: diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -103,18 +103,18 @@ seqtypes = (tuple, list) for op, av in self.data: print(level*" " + 
str(op), end='') - if op == IN: + if op is IN: # member sublanguage print() for op, a in av: print((level+1)*" " + str(op), a) - elif op == BRANCH: + elif op is BRANCH: print() for i, a in enumerate(av[1]): if i: print(level*" " + "OR") a.dump(level+1) - elif op == GROUPREF_EXISTS: + elif op is GROUPREF_EXISTS: condgroup, item_yes, item_no = av print('', condgroup) item_yes.dump(level+1) @@ -607,7 +607,7 @@ item = subpattern[-1:] else: item = None - if not item or (_len(item) == 1 and item[0][0] == AT): + if not item or (_len(item) == 1 and item[0][0] is AT): raise source.error("nothing to repeat", source.tell() - here + len(this)) if item[0][0] in _REPEATCODES: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -1101,8 +1101,8 @@ def test_inline_flags(self): # Bug #1700 - upper_char = chr(0x1ea0) # Latin Capital Letter A with Dot Bellow - lower_char = chr(0x1ea1) # Latin Small Letter A with Dot Bellow + upper_char = '\u1ea0' # Latin Capital Letter A with Dot Below + lower_char = '\u1ea1' # Latin Small Letter A with Dot Below p = re.compile(upper_char, re.I | re.U) q = p.match(lower_char) -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Wed Nov 12 10:32:12 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Wed, 12 Nov 2014 10:32:12 +0100 Subject: [Python-checkins] Daily reference leaks (30a6c74ad87f): sum=0 Message-ID: results for 30a6c74ad87f on branch "default" -------------------------------------------- test_collections leaked [4, 0, -6] references, sum=-2 test_collections leaked [2, 0, -3] memory blocks, sum=-1 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog6b1Mhr', '-x'] From python-checkins at python.org Wed Nov 12 14:34:16 2014 From: python-checkins at python.org (nick.coghlan) Date: Wed, 12 Nov 2014 13:34:16 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Close_=2319494=3A_add_urrl?= =?utf-8?q?ib=2Erequest=2EHTTPBasicPriorAuthHandler?= Message-ID: <20141112133402.47808.62976@psf.io> https://hg.python.org/cpython/rev/fb3061ba6fd2 changeset: 93477:fb3061ba6fd2 user: Nick Coghlan date: Wed Nov 12 23:33:50 2014 +1000 summary: Close #19494: add urrlib.request.HTTPBasicPriorAuthHandler This auth handler adds the Authorization header to the first HTTP request rather than waiting for a HTTP 401 Unauthorized response from the server as the default HTTPBasicAuthHandler does. This allows working with websites like https://api.github.com which do not follow the strict interpretation of RFC, but more the dicta in the end of section 2 of RFC 2617: > A client MAY preemptively send the corresponding Authorization > header with requests for resources in that space without receipt > of another challenge from the server. Similarly, when a client > sends a request to a proxy, it may reuse a userid and password in > the Proxy-Authorization header field without receiving another > challenge from the proxy server. See section 4 for security > considerations associated with Basic authentication. Patch by Matej Cepl. 
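A minimal usage sketch of the new handler (illustrative only, not part of the patch; the host and credentials below are made up):

    import urllib.request

    password_mgr = urllib.request.HTTPPasswordMgrWithDefaultRealm()
    password_mgr.add_password(None, "https://api.example.com", "user", "secret")

    # Unlike HTTPBasicAuthHandler, the prior-auth variant attaches the
    # Authorization header to the very first request instead of waiting
    # for a 401 challenge from the server.
    opener = urllib.request.build_opener(
        urllib.request.HTTPBasicPriorAuthHandler(password_mgr))

    with opener.open("https://api.example.com/resource") as response:
        print(response.status)
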
files: Doc/library/urllib.request.rst | 11 +++++++++++ Doc/whatsnew/3.5.rst | 9 +++++++++ Lib/test/test_urllib2.py | 15 +++++++++++++++ Lib/urllib/request.py | 15 +++++++++++++++ Misc/NEWS | 3 +++ 5 files changed, 53 insertions(+), 0 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -304,6 +304,17 @@ presented with a wrong Authentication scheme. +.. class:: HTTPBasicPriorAuthHandler(password_mgr=None) + + A variant of :class:`HTTPBasicAuthHandler` which automatically sends + authorization credentials with the first request, rather than waiting to + first receive a HTTP 401 "Unauthorised" error response. This allows + authentication to sites that don't provide a 401 response when receiving + a request without an Authorization header. Aside from this difference, + this behaves exactly as :class:`HTTPBasicAuthHandler`. + + .. versionadded:: 3.5 + .. class:: ProxyBasicAuthHandler(password_mgr=None) Handle authentication with the proxy. *password_mgr*, if given, should be diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -297,6 +297,15 @@ * The :func:`time.monotonic` function is now always available. (Contributed by Victor Stinner in :issue:`22043`.) +time +---- + +* A new :class:`urllib.request.HTTPBasicPriorAuthHandler` allows HTTP Basic + Authentication credentials to be sent unconditionally with the first HTTP + request, rather than waiting for a HTTP 401 Unauthorized response from the + server. + (Contributed by Matej Cepl in :issue:`19494`.) + wsgiref ------- diff --git a/Lib/test/test_urllib2.py b/Lib/test/test_urllib2.py --- a/Lib/test/test_urllib2.py +++ b/Lib/test/test_urllib2.py @@ -1422,6 +1422,21 @@ handler.do_open(conn, req) self.assertTrue(conn.fakesock.closed, "Connection not closed") + def test_auth_prior_handler(self): + pwd_manager = MockPasswordManager() + pwd_manager.add_password(None, 'https://example.com', + 'somebody', 'verysecret') + auth_prior_handler = urllib.request.HTTPBasicPriorAuthHandler( + pwd_manager) + http_hand = MockHTTPSHandler() + + opener = OpenerDirector() + opener.add_handler(http_hand) + opener.add_handler(auth_prior_handler) + + req = Request("https://example.com") + opener.open(req) + self.assertNotIn('Authorization', http_hand.httpconn.req_headers) class MiscTests(unittest.TestCase): diff --git a/Lib/urllib/request.py b/Lib/urllib/request.py --- a/Lib/urllib/request.py +++ b/Lib/urllib/request.py @@ -916,6 +916,21 @@ return response +class HTTPBasicPriorAuthHandler(HTTPBasicAuthHandler): + handler_order = 400 + + def http_request(self, req): + if not req.has_header('Authorization'): + user, passwd = self.passwd.find_user_password(None, req.host) + credentials = '{0}:{1}'.format(user, passwd).encode() + auth_str = base64.standard_b64encode(credentials).decode() + req.add_unredirected_header('Authorization', + 'Basic {}'.format(auth_str.strip())) + return req + + https_request = http_request + + # Return n random bytes. _randombytes = os.urandom diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #19494: Added urllib.request.HTTPBasicPriorAuthHandler. Patch by + Matej Cepl. + - Issue #22578: Added attributes to the re.error class. 
- Issue #12728: Different Unicode characters having the same uppercase but -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 12 16:24:31 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 12 Nov 2014 15:24:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_add_space?= Message-ID: <20141112152406.67922.8051@psf.io> https://hg.python.org/cpython/rev/19b2c54e5f09 changeset: 93480:19b2c54e5f09 user: Benjamin Peterson date: Wed Nov 12 10:23:44 2014 -0500 summary: add space files: Lib/test/test_io.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_io.py b/Lib/test/test_io.py --- a/Lib/test/test_io.py +++ b/Lib/test/test_io.py @@ -2890,6 +2890,7 @@ arr.frombytes(buf[:idx]) return memoryview(arr) + class CTextIOWrapperTest(TextIOWrapperTest): io = io shutdown_error = "RuntimeError: could not find io module state" -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 12 16:24:31 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 12 Nov 2014 15:24:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_fix_possible_d?= =?utf-8?q?ouble_free_in_TextIOWrapper=2E=5F=5Finit=5F=5F_=28closes_=23228?= =?utf-8?b?NDkp?= Message-ID: <20141112152405.47788.48154@psf.io> https://hg.python.org/cpython/rev/ec1948191461 changeset: 93478:ec1948191461 branch: 3.4 parent: 93473:33908f14c0eb user: Benjamin Peterson date: Wed Nov 12 10:19:46 2014 -0500 summary: fix possible double free in TextIOWrapper.__init__ (closes #22849) files: Lib/test/test_io.py | 15 +++++++++++++++ Misc/NEWS | 2 ++ Modules/_io/textio.c | 2 +- 3 files changed, 18 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_io.py b/Lib/test/test_io.py --- a/Lib/test/test_io.py +++ b/Lib/test/test_io.py @@ -2784,6 +2784,21 @@ self.assertFalse(err) self.assertEqual("ok", out.decode().strip()) + def test_issue22849(self): + class F(object): + def readable(self): return True + def writable(self): return True + def seekable(self): return True + + for i in range(10): + try: + self.TextIOWrapper(F(), encoding='utf-8') + except Exception: + pass + + F.tell = lambda x: 0 + t = self.TextIOWrapper(F(), encoding='utf-8') + class CTextIOWrapperTest(TextIOWrapperTest): io = io diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22849: Fix possible double free in the io.TextIOWrapper constructor. + - Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. 
diff --git a/Modules/_io/textio.c b/Modules/_io/textio.c --- a/Modules/_io/textio.c +++ b/Modules/_io/textio.c @@ -1061,7 +1061,7 @@ } /* Finished sorting out the codec details */ - Py_DECREF(codec_info); + Py_CLEAR(codec_info); self->buffer = buffer; Py_INCREF(buffer); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 12 16:24:31 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 12 Nov 2014 15:24:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI4NDkp?= Message-ID: <20141112152405.118103.78819@psf.io> https://hg.python.org/cpython/rev/a664b150b6c2 changeset: 93479:a664b150b6c2 parent: 93477:fb3061ba6fd2 parent: 93478:ec1948191461 user: Benjamin Peterson date: Wed Nov 12 10:23:35 2014 -0500 summary: merge 3.4 (#22849) files: Lib/test/test_io.py | 16 ++++++++++++++++ Misc/NEWS | 2 ++ Modules/_io/textio.c | 2 +- 3 files changed, 19 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_io.py b/Lib/test/test_io.py --- a/Lib/test/test_io.py +++ b/Lib/test/test_io.py @@ -2856,6 +2856,22 @@ self.assertEqual(t.read(200), bytes_val.decode('utf-8')) + def test_issue22849(self): + class F(object): + def readable(self): return True + def writable(self): return True + def seekable(self): return True + + for i in range(10): + try: + self.TextIOWrapper(F(), encoding='utf-8') + except Exception: + pass + + F.tell = lambda x: 0 + t = self.TextIOWrapper(F(), encoding='utf-8') + + class MemviewBytesIO(io.BytesIO): '''A BytesIO object whose read method returns memoryviews rather than bytes''' diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -188,6 +188,8 @@ - Issue #22578: Added attributes to the re.error class. +- Issue #22849: Fix possible double free in the io.TextIOWrapper constructor. + - Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. 
diff --git a/Modules/_io/textio.c b/Modules/_io/textio.c --- a/Modules/_io/textio.c +++ b/Modules/_io/textio.c @@ -1061,7 +1061,7 @@ } /* Finished sorting out the codec details */ - Py_DECREF(codec_info); + Py_CLEAR(codec_info); self->buffer = buffer; Py_INCREF(buffer); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 13 04:03:06 2014 From: python-checkins at python.org (steve.dower) Date: Thu, 13 Nov 2014 03:03:06 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyODUw?= =?utf-8?q?=3A_Backport_ensurepip_Windows_installer_changes_to_2=2E7?= Message-ID: <20141113030255.118111.30981@psf.io> https://hg.python.org/cpython/rev/c248a6bdc1d7 changeset: 93481:c248a6bdc1d7 branch: 2.7 parent: 93475:e4c32152b25b user: Steve Dower date: Wed Nov 12 19:02:20 2014 -0800 summary: Issue #22850: Backport ensurepip Windows installer changes to 2.7 files: Tools/msi/msi.py | 47 +++++++++++++++++++++++++---------- 1 files changed, 33 insertions(+), 14 deletions(-) diff --git a/Tools/msi/msi.py b/Tools/msi/msi.py --- a/Tools/msi/msi.py +++ b/Tools/msi/msi.py @@ -410,6 +410,8 @@ compileargs = r'-Wi "[TARGETDIR]Lib\compileall.py" -f -x "bad_coding|badsyntax|site-packages|py3_" "[TARGETDIR]Lib"' lib2to3args = r'-c "import lib2to3.pygram, lib2to3.patcomp;lib2to3.patcomp.PatternCompiler()"' + updatepipargs = r'-m ensurepip -U --default-pip' + removepipargs = r'-B -m ensurepip._uninstall' # See "CustomAction Table" add_data(db, "CustomAction", [ # msidbCustomActionTypeFirstSequence + msidbCustomActionTypeTextData + msidbCustomActionTypeProperty @@ -421,9 +423,13 @@ ("SetDLLDirToSystem32", 307, "DLLDIR", SystemFolderName), # msidbCustomActionTypeExe + msidbCustomActionTypeSourceFile # See "Custom Action Type 18" - ("CompilePyc", 18, "python.exe", compileargs), - ("CompilePyo", 18, "python.exe", "-O "+compileargs), - ("CompileGrammar", 18, "python.exe", lib2to3args), + # msidbCustomActionTypeInScript (1024); run during actual installation + # msidbCustomActionTypeNoImpersonate (2048); run action in system account, not user account + ("CompilePyc", 18+1024+2048, "python.exe", compileargs), + ("CompilePyo", 18+1024+2048, "python.exe", "-O "+compileargs), + ("CompileGrammar", 18+1024+2048, "python.exe", lib2to3args), + ("UpdatePip", 18+1024+2048, "python.exe", updatepipargs), + ("RemovePip", 18+1024+2048, "python.exe", removepipargs), ]) # UI Sequences, see "InstallUISequence Table", "Using a Sequence Table" @@ -447,7 +453,7 @@ # Prepend TARGETDIR to the system path, and remove it on uninstall. 
add_data(db, "Environment", - [("PathAddition", "=-*Path", "[TARGETDIR];[~]", "REGISTRY.path")]) + [("PathAddition", "=-*Path", "[TARGETDIR];[TARGETDIR]Scripts;[~]", "REGISTRY.path")]) # Execute Sequences add_data(db, "InstallExecuteSequence", @@ -455,16 +461,19 @@ ("SetDLLDirToSystem32", 'DLLDIR="" and ' + sys32cond, 751), ("SetDLLDirToTarget", 'DLLDIR="" and not ' + sys32cond, 752), ("UpdateEditIDLE", None, 1050), - ("CompilePyc", "COMPILEALL", 6800), - ("CompilePyo", "COMPILEALL", 6801), - ("CompileGrammar", "COMPILEALL", 6802), + # run command if install state of pip changes to INSTALLSTATE_LOCAL + # run after InstallFiles + ("UpdatePip", "&pip_feature=3", 4001), + # remove pip when state changes to INSTALLSTATE_ABSENT + # run before RemoveFiles + ("RemovePip", "&pip_feature=2", 3499), + ("CompilePyc", "COMPILEALL", 4002), + ("CompilePyo", "COMPILEALL", 4003), + ("CompileGrammar", "COMPILEALL", 4004), ]) add_data(db, "AdminExecuteSequence", [("InitialTargetDir", 'TARGETDIR=""', 750), ("SetDLLDirToTarget", 'DLLDIR=""', 751), - ("CompilePyc", "COMPILEALL", 6800), - ("CompilePyo", "COMPILEALL", 6801), - ("CompileGrammar", "COMPILEALL", 6802), ]) ##################################################################### @@ -830,7 +839,8 @@ # (i.e. additional Python libraries) need to follow the parent feature. # Features that have no advertisement trigger (e.g. the test suite) # must not support advertisement - global default_feature, tcltk, htmlfiles, tools, testsuite, ext_feature, private_crt, prepend_path + global default_feature, tcltk, htmlfiles, tools, testsuite + global ext_feature, private_crt, prepend_path, pip_feature default_feature = Feature(db, "DefaultFeature", "Python", "Python Interpreter and Libraries", 1, directory = "TARGETDIR") @@ -852,8 +862,12 @@ tools = Feature(db, "Tools", "Utility Scripts", "Python utility scripts (Tools/", 9, parent = default_feature, attributes=2) + pip_feature = Feature(db, "pip_feature", "pip", + "Install or upgrade pip, a tool for installing and managing " + "Python packages.", 11, + parent = default_feature, attributes=2|8) testsuite = Feature(db, "Testsuite", "Test suite", - "Python test suite (Lib/test/)", 11, + "Python test suite (Lib/test/)", 13, parent = default_feature, attributes=2|8) # prepend_path is an additional feature which is to be off by default. # Since the default level for the above features is 1, this needs to be @@ -861,7 +875,7 @@ prepend_path = Feature(db, "PrependPath", "Add python.exe to Path", "Prepend [TARGETDIR] to the system Path variable. " "This allows you to type 'python' into a command " - "prompt without needing the full path.", 13, + "prompt without needing the full path.", 15, parent = default_feature, attributes=2|8, level=2) @@ -1188,6 +1202,8 @@ "Documentation"), ("REGISTRY.path", msilib.gen_uuid(), "TARGETDIR", registry_component, None, None), + ("REGISTRY.ensurepip", msilib.gen_uuid(), "TARGETDIR", registry_component, "EnsurePipRun", + None), ("REGISTRY.def", msilib.gen_uuid(), "TARGETDIR", registry_component, None, None)] + tcldata) # See "FeatureComponents Table". 
@@ -1205,6 +1221,7 @@ [(default_feature.id, "REGISTRY"), (htmlfiles.id, "REGISTRY.doc"), (prepend_path.id, "REGISTRY.path"), + (pip_feature.id, "REGISTRY.ensurepip"), (ext_feature.id, "REGISTRY.def")] + tcldata ) @@ -1287,7 +1304,9 @@ "", r"[TARGETDIR]Python.exe", "REGISTRY.def"), ("DisplayIcon", -1, r"Software\Microsoft\Windows\CurrentVersion\Uninstall\%s" % product_code, - "DisplayIcon", "[TARGETDIR]python.exe", "REGISTRY") + "DisplayIcon", "[TARGETDIR]python.exe", "REGISTRY"), + # Fake registry entry to allow installer to track whether ensurepip has been run + ("EnsurePipRun", -1, prefix+r"\EnsurePipRun", "", "#1", "REGISTRY.ensurepip"), ]) # Shortcuts, see "Shortcut Table" add_data(db, "Directory", -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 13 08:20:06 2014 From: python-checkins at python.org (larry.hastings) Date: Thu, 13 Nov 2014 07:20:06 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Fixed_reference_to_Argument_C?= =?utf-8?q?linic_PEP_in_3=2E5_schedule=2E?= Message-ID: <20141113071952.67900.67624@psf.io> https://hg.python.org/peps/rev/23c7fb8febda changeset: 5593:23c7fb8febda user: Larry Hastings date: Wed Nov 12 23:19:48 2014 -0800 summary: Fixed reference to Argument Clinic PEP in 3.5 schedule. files: pep-0478.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0478.txt b/pep-0478.txt --- a/pep-0478.txt +++ b/pep-0478.txt @@ -68,11 +68,11 @@ * PEP 431, improved support for time zone databases * PEP 432, simplifying Python's startup sequence +* PEP 436, a build tool generating boilerplate for extension modules * PEP 441, improved Python zip application support * PEP 447, support for __locallookup__ metaclass method * PEP 448, additional unpacking generalizations * PEP 455, key transforming dictionary -* PEP 457, a build tool generating boilerplate for extension modules * PEP 475, retrying system calls that fail with EINTR -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Thu Nov 13 10:34:37 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Thu, 13 Nov 2014 10:34:37 +0100 Subject: [Python-checkins] Daily reference leaks (19b2c54e5f09): sum=3 Message-ID: results for 19b2c54e5f09 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogiFlHZd', '-x'] From solipsis at pitrou.net Fri Nov 14 10:33:13 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Fri, 14 Nov 2014 10:33:13 +0100 Subject: [Python-checkins] Daily reference leaks (19b2c54e5f09): sum=3 Message-ID: results for 19b2c54e5f09 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogDED6tb', '-x'] From python-checkins at python.org Fri Nov 14 11:05:44 2014 From: python-checkins at python.org (nick.coghlan) Date: Fri, 14 Nov 2014 10:05:44 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogQ2xvc2UgIzIyMzAw?= =?utf-8?q?_by_tweaking_2=2E7=2E9_What=27s_New_announcements?= Message-ID: <20141114100525.57230.57@psf.io> https://hg.python.org/cpython/rev/0dacd614839c changeset: 93482:0dacd614839c branch: 2.7 user: Nick Coghlan date: Fri Nov 14 20:05:04 2014 +1000 summary: Close #22300 by tweaking 2.7.9 What's New announcements files: Doc/whatsnew/2.7.rst | 8 
++++++++ 1 files changed, 8 insertions(+), 0 deletions(-) diff --git a/Doc/whatsnew/2.7.rst b/Doc/whatsnew/2.7.rst --- a/Doc/whatsnew/2.7.rst +++ b/Doc/whatsnew/2.7.rst @@ -2570,10 +2570,18 @@ certificate store, the :class:`~ssl.SSLContext` class, and other features. (Contributed by Alex Gaynor and David Reid; :issue:`21308`.) + Refer to the "Version added: 2.7.9" notes in the module documentation for + specific details. + * :func:`os.urandom` was changed to cache a file descriptor to ``/dev/urandom`` instead of reopening ``/dev/urandom`` on every call. (Contributed by Alex Gaynor; :issue:`21305`.) +* :data:`hashlib.algorithms_guaranteed` and + :data:`hashlib.algorithms_available` were backported from Python 3 to make + it easier for Python 2 applications to select the strongest available hash + algorithm. (Contributed by Alex Gaynor in :issue:`21307`) + PEP 477: Backport ensurepip (PEP 453) to Python 2.7 --------------------------------------------------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 14 11:13:16 2014 From: python-checkins at python.org (georg.brandl) Date: Fri, 14 Nov 2014 10:13:16 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogQ2xvc2VzICMyMjg2?= =?utf-8?q?8=3A_make_example_less_ambiguous=2E?= Message-ID: <20141114101307.36978.11606@psf.io> https://hg.python.org/cpython/rev/5dd835edde1e changeset: 93483:5dd835edde1e branch: 2.7 user: Georg Brandl date: Fri Nov 14 11:12:53 2014 +0100 summary: Closes #22868: make example less ambiguous. files: Doc/tutorial/datastructures.rst | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Doc/tutorial/datastructures.rst b/Doc/tutorial/datastructures.rst --- a/Doc/tutorial/datastructures.rst +++ b/Doc/tutorial/datastructures.rst @@ -181,12 +181,12 @@ the sequence for which ``function(item)`` is true. If *sequence* is a :class:`string` or :class:`tuple`, the result will be of the same type; otherwise, it is always a :class:`list`. For example, to compute a sequence of -numbers not divisible by 2 or 3:: +numbers divisible by 2 or 3:: - >>> def f(x): return x % 2 != 0 and x % 3 != 0 + >>> def f(x): return x % 3 == 0 or x % 5 == 0 ... >>> filter(f, range(2, 25)) - [5, 7, 11, 13, 17, 19, 23] + [3, 5, 6, 9, 10, 12, 15, 18, 20, 21, 24] ``map(function, sequence)`` calls ``function(item)`` for each of the sequence's items and returns a list of the return values. For example, to compute some -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 14 11:21:40 2014 From: python-checkins at python.org (georg.brandl) Date: Fri, 14 Nov 2014 10:21:40 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Fix_descriptio?= =?utf-8?q?n=2E?= Message-ID: <20141114102013.57214.64608@psf.io> https://hg.python.org/cpython/rev/e106d9368bff changeset: 93484:e106d9368bff branch: 2.7 user: Georg Brandl date: Fri Nov 14 11:20:07 2014 +0100 summary: Fix description. files: Doc/tutorial/datastructures.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/tutorial/datastructures.rst b/Doc/tutorial/datastructures.rst --- a/Doc/tutorial/datastructures.rst +++ b/Doc/tutorial/datastructures.rst @@ -181,7 +181,7 @@ the sequence for which ``function(item)`` is true. If *sequence* is a :class:`string` or :class:`tuple`, the result will be of the same type; otherwise, it is always a :class:`list`. 
For example, to compute a sequence of -numbers divisible by 2 or 3:: +numbers divisible by 3 or 5:: >>> def f(x): return x % 3 == 0 or x % 5 == 0 ... -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 14 18:18:41 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 14 Nov 2014 17:18:41 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_use_https_url_to_hg=2Epython?= =?utf-8?q?=2Eorg?= Message-ID: <20141114171749.29230.51897@psf.io> https://hg.python.org/peps/rev/90d77400cae4 changeset: 5594:90d77400cae4 user: Benjamin Peterson date: Fri Nov 14 12:17:47 2014 -0500 summary: use https url to hg.python.org files: pep0/constants.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep0/constants.py b/pep0/constants.py --- a/pep0/constants.py +++ b/pep0/constants.py @@ -24,7 +24,7 @@ references = u""" [1] PEP 1: PEP Purpose and Guidelines [2] View PEP history online - http://hg.python.org/peps/ + https://hg.python.org/peps/ """ footer = u""" -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Fri Nov 14 20:46:09 2014 From: python-checkins at python.org (guido.van.rossum) Date: Fri, 14 Nov 2014 19:46:09 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogLSBJc3N1ZSAjMjI4?= =?utf-8?q?41=3A_Reject_coroutines_in_asyncio_add=5Fsignal=5Fhandler=28=29?= =?utf-8?q?=2E?= Message-ID: <20141114194600.57222.28572@psf.io> https://hg.python.org/cpython/rev/d244e1770f1b changeset: 93485:d244e1770f1b branch: 3.4 parent: 93478:ec1948191461 user: Guido van Rossum date: Fri Nov 14 11:45:47 2014 -0800 summary: - Issue #22841: Reject coroutines in asyncio add_signal_handler(). Patch by Ludovic.Gasc. files: Lib/asyncio/unix_events.py | 3 ++ Lib/test/test_asyncio/test_unix_events.py | 12 +++++++++++ Misc/NEWS | 3 ++ 3 files changed, 18 insertions(+), 0 deletions(-) diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -13,6 +13,7 @@ from . import base_events from . import base_subprocess from . import constants +from . import coroutines from . import events from . import selector_events from . import selectors @@ -66,6 +67,8 @@ Raise ValueError if the signal number is invalid or uncatchable. Raise RuntimeError if there is a problem setting up the handler. """ + if coroutines.iscoroutinefunction(callback): + raise TypeError("coroutines cannot be used with call_soon()") self._check_signal(sig) try: # set_wakeup_fd() raises ValueError if this is not the diff --git a/Lib/test/test_asyncio/test_unix_events.py b/Lib/test/test_asyncio/test_unix_events.py --- a/Lib/test/test_asyncio/test_unix_events.py +++ b/Lib/test/test_asyncio/test_unix_events.py @@ -64,6 +64,18 @@ signal.SIGINT, lambda: True) @mock.patch('asyncio.unix_events.signal') + def test_add_signal_handler_coroutine_error(self, m_signal): + + @asyncio.coroutine + def simple_coroutine(): + yield from [] + + self.assertRaises( + TypeError, + self.loop.add_signal_handler, + signal.SIGINT, simple_coroutine) + + @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler(self, m_signal): m_signal.NSIG = signal.NSIG diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22841: Reject coroutines in asyncio add_signal_handler(). + Patch by Ludovic.Gasc. + - Issue #22849: Fix possible double free in the io.TextIOWrapper constructor. 
- Issue #12728: Different Unicode characters having the same uppercase but -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 14 20:49:05 2014 From: python-checkins at python.org (guido.van.rossum) Date: Fri, 14 Nov 2014 19:49:05 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_-_Issue_=2322841=3A_Reject_coroutines_in_asyncio_add=5Fs?= =?utf-8?q?ignal=5Fhandler=28=29=2E?= Message-ID: <20141114194853.36980.40853@psf.io> https://hg.python.org/cpython/rev/44e77709daa4 changeset: 93486:44e77709daa4 parent: 93480:19b2c54e5f09 parent: 93485:d244e1770f1b user: Guido van Rossum date: Fri Nov 14 11:48:37 2014 -0800 summary: - Issue #22841: Reject coroutines in asyncio add_signal_handler(). Patch by Ludovic.Gasc. files: Lib/asyncio/unix_events.py | 3 ++ Lib/test/test_asyncio/test_unix_events.py | 12 +++++++++++ Misc/NEWS | 3 ++ 3 files changed, 18 insertions(+), 0 deletions(-) diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -13,6 +13,7 @@ from . import base_events from . import base_subprocess from . import constants +from . import coroutines from . import events from . import selector_events from . import selectors @@ -66,6 +67,8 @@ Raise ValueError if the signal number is invalid or uncatchable. Raise RuntimeError if there is a problem setting up the handler. """ + if coroutines.iscoroutinefunction(callback): + raise TypeError("coroutines cannot be used with call_soon()") self._check_signal(sig) try: # set_wakeup_fd() raises ValueError if this is not the diff --git a/Lib/test/test_asyncio/test_unix_events.py b/Lib/test/test_asyncio/test_unix_events.py --- a/Lib/test/test_asyncio/test_unix_events.py +++ b/Lib/test/test_asyncio/test_unix_events.py @@ -64,6 +64,18 @@ signal.SIGINT, lambda: True) @mock.patch('asyncio.unix_events.signal') + def test_add_signal_handler_coroutine_error(self, m_signal): + + @asyncio.coroutine + def simple_coroutine(): + yield from [] + + self.assertRaises( + TypeError, + self.loop.add_signal_handler, + signal.SIGINT, simple_coroutine) + + @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler(self, m_signal): m_signal.NSIG = signal.NSIG diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -183,6 +183,9 @@ Library ------- +- Issue #22841: Reject coroutines in asyncio add_signal_handler(). + Patch by Ludovic.Gasc. + - Issue #19494: Added urllib.request.HTTPBasicPriorAuthHandler. Patch by Matej Cepl. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 01:35:11 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sat, 15 Nov 2014 00:35:11 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322847=3A_Improve_?= =?utf-8?q?method_cache_efficiency=2E?= Message-ID: <20141115003501.36968.88616@psf.io> https://hg.python.org/cpython/rev/97dc64adb6fe changeset: 93487:97dc64adb6fe user: Antoine Pitrou date: Sat Nov 15 00:56:27 2014 +0100 summary: Issue #22847: Improve method cache efficiency. files: Misc/NEWS | 2 + Objects/typeobject.c | 40 ++++++++++++++++++++++++++++--- 2 files changed, 38 insertions(+), 4 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,6 +10,8 @@ Core and Builtins ----------------- +- Issue #22847: Improve method cache efficiency. + - Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff bytes on a 32-bit platform. 
diff --git a/Objects/typeobject.c b/Objects/typeobject.c --- a/Objects/typeobject.c +++ b/Objects/typeobject.c @@ -14,10 +14,11 @@ MCACHE_MAX_ATTR_SIZE, since it might be a problem if very large strings are used as attribute names. */ #define MCACHE_MAX_ATTR_SIZE 100 -#define MCACHE_SIZE_EXP 9 +#define MCACHE_SIZE_EXP 12 #define MCACHE_HASH(version, name_hash) \ - (((unsigned int)(version) * (unsigned int)(name_hash)) \ - >> (8*sizeof(unsigned int) - MCACHE_SIZE_EXP)) + (((unsigned int)(version) ^ (unsigned int)(name_hash)) \ + & ((1 << MCACHE_SIZE_EXP) - 1)) + #define MCACHE_HASH_METHOD(type, name) \ MCACHE_HASH((type)->tp_version_tag, \ ((PyASCIIObject *)(name))->hash) @@ -35,6 +36,14 @@ static struct method_cache_entry method_cache[1 << MCACHE_SIZE_EXP]; static unsigned int next_version_tag = 0; +#define MCACHE_STATS 0 + +#if MCACHE_STATS +static size_t method_cache_hits = 0; +static size_t method_cache_misses = 0; +static size_t method_cache_collisions = 0; +#endif + /* alphabetical order */ _Py_IDENTIFIER(__abstractmethods__); _Py_IDENTIFIER(__class__); @@ -165,6 +174,18 @@ Py_ssize_t i; unsigned int cur_version_tag = next_version_tag - 1; +#if MCACHE_STATS + size_t total = method_cache_hits + method_cache_collisions + method_cache_misses; + fprintf(stderr, "-- Method cache hits = %zd (%d%%)\n", + method_cache_hits, (int) (100.0 * method_cache_hits / total)); + fprintf(stderr, "-- Method cache true misses = %zd (%d%%)\n", + method_cache_misses, (int) (100.0 * method_cache_misses / total)); + fprintf(stderr, "-- Method cache collisions = %zd (%d%%)\n", + method_cache_collisions, (int) (100.0 * method_cache_collisions / total)); + fprintf(stderr, "-- Method cache size = %zd KB\n", + sizeof(method_cache) / 1024); +#endif + for (i = 0; i < (1 << MCACHE_SIZE_EXP); i++) { method_cache[i].version = 0; Py_CLEAR(method_cache[i].name); @@ -2708,8 +2729,12 @@ /* fast path */ h = MCACHE_HASH_METHOD(type, name); if (method_cache[h].version == type->tp_version_tag && - method_cache[h].name == name) + method_cache[h].name == name) { +#if MCACHE_STATS + method_cache_hits++; +#endif return method_cache[h].value; + } } /* Look in tp_dict of types in MRO */ @@ -2743,6 +2768,13 @@ method_cache[h].version = type->tp_version_tag; method_cache[h].value = res; /* borrowed */ Py_INCREF(name); + assert(((PyASCIIObject *)(name))->hash != -1); +#if MCACHE_STATS + if (method_cache[h].name != Py_None && method_cache[h].name != name) + method_cache_collisions++; + else + method_cache_misses++; +#endif Py_DECREF(method_cache[h].name); method_cache[h].name = name; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 04:00:03 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 15 Nov 2014 03:00:03 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODc3?= =?utf-8?q?=3A_PEP_477_-_keep_2=2E7_and_3=2Ex_installers_in_sync=2E?= Message-ID: <20141115030001.29220.2059@psf.io> https://hg.python.org/cpython/rev/e8182c6c9ef1 changeset: 93489:e8182c6c9ef1 branch: 3.4 parent: 93485:d244e1770f1b user: Ned Deily date: Fri Nov 14 18:55:05 2014 -0800 summary: Issue #22877: PEP 477 - keep 2.7 and 3.x installers in sync. 
files: Mac/BuildScript/build-installer.py | 42 +++---- Mac/BuildScript/scripts/postflight.ensurepip | 50 +++++---- 2 files changed, 46 insertions(+), 46 deletions(-) diff --git a/Mac/BuildScript/build-installer.py b/Mac/BuildScript/build-installer.py --- a/Mac/BuildScript/build-installer.py +++ b/Mac/BuildScript/build-installer.py @@ -198,7 +198,7 @@ LT_10_5 = bool(getDeptargetTuple() < (10, 5)) # Disable for now - if False: # if (getDeptargetTuple() > (10, 5)) and (getVersionTuple() >= (3, 5)): + if False: # if getDeptargetTuple() > (10, 5): result.extend([ dict( name="Tcl 8.5.15", @@ -239,7 +239,7 @@ ), ]) - if getVersionTuple() >= (3, 3): + if PYTHON_3: result.extend([ dict( name="XZ 5.0.5", @@ -369,8 +369,6 @@ # Instructions for building packages inside the .mpkg. def pkg_recipes(): unselected_for_python3 = ('selected', 'unselected')[PYTHON_3] - # unselected if 3.0 through 3.3, selected otherwise (2.x or >= 3.4) - unselected_for_lt_python34 = ('selected', 'unselected')[(3, 0) <= getVersionTuple() < (3, 4)] result = [ dict( name="PythonFramework", @@ -439,27 +437,23 @@ topdir="/Library/Frameworks/Python.framework", source="/empty-dir", required=False, - selected=unselected_for_lt_python34, + selected='selected', + ), + dict( + name="PythonInstallPip", + long_name="Install or upgrade pip", + readme="""\ + This package installs (or upgrades from an earlier version) + pip, a tool for installing and managing Python packages. + """, + postflight="scripts/postflight.ensurepip", + topdir="/Library/Frameworks/Python.framework", + source="/empty-dir", + required=False, + selected='selected', ), ] - if getVersionTuple() >= (3, 4): - result.append( - dict( - name="PythonInstallPip", - long_name="Install or upgrade pip", - readme="""\ - This package installs (or upgrades from an earlier version) - pip, a tool for installing and managing Python packages. 
- """, - postflight="scripts/postflight.ensurepip", - topdir="/Library/Frameworks/Python.framework", - source="/empty-dir", - required=False, - selected='selected', - ) - ) - if getDeptargetTuple() < (10, 4) and not PYTHON_3: result.append( dict( @@ -977,7 +971,7 @@ shellQuote(os.path.join(SRCDIR, 'configure')), shellQuote(SDKPATH), UNIVERSALARCHS, (' ', '--with-computed-gotos ')[PYTHON_3], - (' ', '--without-ensurepip ')[getVersionTuple() >= (3, 4)], + (' ', '--without-ensurepip ')[PYTHON_3], shellQuote(WORKDIR)[1:-1], shellQuote(WORKDIR)[1:-1])) @@ -1159,7 +1153,9 @@ fp.close() def patchScript(inPath, outPath): + major, minor = getVersionMajorMinor() data = fileContents(inPath) + data = data.replace('@PYMAJOR@', str(major)) data = data.replace('@PYVER@', getVersion()) fp = open(outPath, 'w') fp.write(data) diff --git a/Mac/BuildScript/scripts/postflight.ensurepip b/Mac/BuildScript/scripts/postflight.ensurepip --- a/Mac/BuildScript/scripts/postflight.ensurepip +++ b/Mac/BuildScript/scripts/postflight.ensurepip @@ -4,7 +4,7 @@ # PYVER="@PYVER@" -PYMAJOR="3" +PYMAJOR="@PYMAJOR@" FWK="/Library/Frameworks/Python.framework/Versions/${PYVER}" RELFWKBIN="../../..${FWK}/bin" @@ -34,32 +34,36 @@ if [ -d /usr/local/bin ] ; then ( + install_links_if_our_fw() { + if [ "$(readlink -n ./$1)" = "${RELFWKBIN}/$1" ] ; then + shift + for fn ; + do + if [ -e "${RELFWKBIN}/${fn}" ] ; then + rm -f ./${fn} + ln -s "${RELFWKBIN}/${fn}" "./${fn}" + chgrp -h admin "./${fn}" + chmod -h g+w "./${fn}" + fi + done + fi + } + cd /usr/local/bin + # Create pipx.y and easy_install-x.y links if /usr/local/bin/pythonx.y # is linked to this framework version - if [ "$(readlink -n ./python${PYVER})" = "${RELFWKBIN}/python${PYVER}" ] ; then - for fn in "pip${PYVER}" "easy_install-${PYVER}" ; - do - if [ -e "${RELFWKBIN}/${fn}" ] ; then - rm -f ./${fn} - ln -s "${RELFWKBIN}/${fn}" "./${fn}" - chgrp -h admin "./${fn}" - chmod -h g+w "./${fn}" - fi - done - fi + install_links_if_our_fw "python${PYVER}" \ + "pip${PYVER}" "easy_install-${PYVER}" + # Create pipx link if /usr/local/bin/pythonx is linked to this version - if [ "$(readlink -n ./python${PYMAJOR})" = "${RELFWKBIN}/python${PYMAJOR}" ] ; then - for fn in "pip${PYMAJOR}" ; - do - if [ -e "${RELFWKBIN}/${fn}" ] ; then - rm -f ./${fn} - ln -s "${RELFWKBIN}/${fn}" "./${fn}" - chgrp -h admin "./${fn}" - chmod -h g+w "./${fn}" - fi - done - fi + install_links_if_our_fw "python${PYMAJOR}" \ + "pip${PYMAJOR}" + + # Create pip and easy_install link if /usr/local/bin/python + # is linked to this version + install_links_if_our_fw "python" \ + "pip" "easy_install" ) fi exit 0 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 04:00:03 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 15 Nov 2014 03:00:03 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322877=3A_PEP_477_-_keep_2=2E7_and_3=2Ex_install?= =?utf-8?q?ers_in_sync=2E?= Message-ID: <20141115030001.36984.57390@psf.io> https://hg.python.org/cpython/rev/6270a2181ed3 changeset: 93490:6270a2181ed3 parent: 93487:97dc64adb6fe parent: 93489:e8182c6c9ef1 user: Ned Deily date: Fri Nov 14 18:56:28 2014 -0800 summary: Issue #22877: PEP 477 - keep 2.7 and 3.x installers in sync. 
files: Mac/BuildScript/build-installer.py | 42 +++---- Mac/BuildScript/scripts/postflight.ensurepip | 50 +++++---- 2 files changed, 46 insertions(+), 46 deletions(-) diff --git a/Mac/BuildScript/build-installer.py b/Mac/BuildScript/build-installer.py --- a/Mac/BuildScript/build-installer.py +++ b/Mac/BuildScript/build-installer.py @@ -198,7 +198,7 @@ LT_10_5 = bool(getDeptargetTuple() < (10, 5)) # Disable for now - if False: # if (getDeptargetTuple() > (10, 5)) and (getVersionTuple() >= (3, 5)): + if False: # if getDeptargetTuple() > (10, 5): result.extend([ dict( name="Tcl 8.5.15", @@ -239,7 +239,7 @@ ), ]) - if getVersionTuple() >= (3, 3): + if PYTHON_3: result.extend([ dict( name="XZ 5.0.5", @@ -369,8 +369,6 @@ # Instructions for building packages inside the .mpkg. def pkg_recipes(): unselected_for_python3 = ('selected', 'unselected')[PYTHON_3] - # unselected if 3.0 through 3.3, selected otherwise (2.x or >= 3.4) - unselected_for_lt_python34 = ('selected', 'unselected')[(3, 0) <= getVersionTuple() < (3, 4)] result = [ dict( name="PythonFramework", @@ -439,27 +437,23 @@ topdir="/Library/Frameworks/Python.framework", source="/empty-dir", required=False, - selected=unselected_for_lt_python34, + selected='selected', + ), + dict( + name="PythonInstallPip", + long_name="Install or upgrade pip", + readme="""\ + This package installs (or upgrades from an earlier version) + pip, a tool for installing and managing Python packages. + """, + postflight="scripts/postflight.ensurepip", + topdir="/Library/Frameworks/Python.framework", + source="/empty-dir", + required=False, + selected='selected', ), ] - if getVersionTuple() >= (3, 4): - result.append( - dict( - name="PythonInstallPip", - long_name="Install or upgrade pip", - readme="""\ - This package installs (or upgrades from an earlier version) - pip, a tool for installing and managing Python packages. 
- """, - postflight="scripts/postflight.ensurepip", - topdir="/Library/Frameworks/Python.framework", - source="/empty-dir", - required=False, - selected='selected', - ) - ) - if getDeptargetTuple() < (10, 4) and not PYTHON_3: result.append( dict( @@ -977,7 +971,7 @@ shellQuote(os.path.join(SRCDIR, 'configure')), shellQuote(SDKPATH), UNIVERSALARCHS, (' ', '--with-computed-gotos ')[PYTHON_3], - (' ', '--without-ensurepip ')[getVersionTuple() >= (3, 4)], + (' ', '--without-ensurepip ')[PYTHON_3], shellQuote(WORKDIR)[1:-1], shellQuote(WORKDIR)[1:-1])) @@ -1159,7 +1153,9 @@ fp.close() def patchScript(inPath, outPath): + major, minor = getVersionMajorMinor() data = fileContents(inPath) + data = data.replace('@PYMAJOR@', str(major)) data = data.replace('@PYVER@', getVersion()) fp = open(outPath, 'w') fp.write(data) diff --git a/Mac/BuildScript/scripts/postflight.ensurepip b/Mac/BuildScript/scripts/postflight.ensurepip --- a/Mac/BuildScript/scripts/postflight.ensurepip +++ b/Mac/BuildScript/scripts/postflight.ensurepip @@ -4,7 +4,7 @@ # PYVER="@PYVER@" -PYMAJOR="3" +PYMAJOR="@PYMAJOR@" FWK="/Library/Frameworks/Python.framework/Versions/${PYVER}" RELFWKBIN="../../..${FWK}/bin" @@ -34,32 +34,36 @@ if [ -d /usr/local/bin ] ; then ( + install_links_if_our_fw() { + if [ "$(readlink -n ./$1)" = "${RELFWKBIN}/$1" ] ; then + shift + for fn ; + do + if [ -e "${RELFWKBIN}/${fn}" ] ; then + rm -f ./${fn} + ln -s "${RELFWKBIN}/${fn}" "./${fn}" + chgrp -h admin "./${fn}" + chmod -h g+w "./${fn}" + fi + done + fi + } + cd /usr/local/bin + # Create pipx.y and easy_install-x.y links if /usr/local/bin/pythonx.y # is linked to this framework version - if [ "$(readlink -n ./python${PYVER})" = "${RELFWKBIN}/python${PYVER}" ] ; then - for fn in "pip${PYVER}" "easy_install-${PYVER}" ; - do - if [ -e "${RELFWKBIN}/${fn}" ] ; then - rm -f ./${fn} - ln -s "${RELFWKBIN}/${fn}" "./${fn}" - chgrp -h admin "./${fn}" - chmod -h g+w "./${fn}" - fi - done - fi + install_links_if_our_fw "python${PYVER}" \ + "pip${PYVER}" "easy_install-${PYVER}" + # Create pipx link if /usr/local/bin/pythonx is linked to this version - if [ "$(readlink -n ./python${PYMAJOR})" = "${RELFWKBIN}/python${PYMAJOR}" ] ; then - for fn in "pip${PYMAJOR}" ; - do - if [ -e "${RELFWKBIN}/${fn}" ] ; then - rm -f ./${fn} - ln -s "${RELFWKBIN}/${fn}" "./${fn}" - chgrp -h admin "./${fn}" - chmod -h g+w "./${fn}" - fi - done - fi + install_links_if_our_fw "python${PYMAJOR}" \ + "pip${PYMAJOR}" + + # Create pip and easy_install link if /usr/local/bin/python + # is linked to this version + install_links_if_our_fw "python" \ + "pip" "easy_install" ) fi exit 0 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 04:00:03 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 15 Nov 2014 03:00:03 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyODc3?= =?utf-8?q?=3A_PEP_477_-_OS_X_installer_for_2=2E7=2E9_now_installs_pip=2E?= Message-ID: <20141115030001.29226.12344@psf.io> https://hg.python.org/cpython/rev/6b8e107622b3 changeset: 93488:6b8e107622b3 branch: 2.7 parent: 93484:e106d9368bff user: Ned Deily date: Fri Nov 14 18:53:59 2014 -0800 summary: Issue #22877: PEP 477 - OS X installer for 2.7.9 now installs pip. 
files: Mac/BuildScript/build-installer.py | 42 ++--- Mac/BuildScript/scripts/postflight.ensurepip | 69 ++++++++++ Misc/NEWS | 2 + 3 files changed, 90 insertions(+), 23 deletions(-) diff --git a/Mac/BuildScript/build-installer.py b/Mac/BuildScript/build-installer.py --- a/Mac/BuildScript/build-installer.py +++ b/Mac/BuildScript/build-installer.py @@ -198,7 +198,7 @@ LT_10_5 = bool(getDeptargetTuple() < (10, 5)) # Disable for now - if False: # if (getDeptargetTuple() > (10, 5)) and (getVersionTuple() >= (3, 5)): + if False: # if getDeptargetTuple() > (10, 5): result.extend([ dict( name="Tcl 8.5.15", @@ -239,7 +239,7 @@ ), ]) - if getVersionTuple() >= (3, 3): + if PYTHON_3: result.extend([ dict( name="XZ 5.0.5", @@ -369,8 +369,6 @@ # Instructions for building packages inside the .mpkg. def pkg_recipes(): unselected_for_python3 = ('selected', 'unselected')[PYTHON_3] - # unselected if 3.0 through 3.3, selected otherwise (2.x or >= 3.4) - unselected_for_lt_python34 = ('selected', 'unselected')[(3, 0) <= getVersionTuple() < (3, 4)] result = [ dict( name="PythonFramework", @@ -439,27 +437,23 @@ topdir="/Library/Frameworks/Python.framework", source="/empty-dir", required=False, - selected=unselected_for_lt_python34, + selected='selected', + ), + dict( + name="PythonInstallPip", + long_name="Install or upgrade pip", + readme="""\ + This package installs (or upgrades from an earlier version) + pip, a tool for installing and managing Python packages. + """, + postflight="scripts/postflight.ensurepip", + topdir="/Library/Frameworks/Python.framework", + source="/empty-dir", + required=False, + selected='selected', ), ] - if getVersionTuple() >= (3, 4): - result.append( - dict( - name="PythonInstallPip", - long_name="Install or upgrade pip", - readme="""\ - This package installs (or upgrades from an earlier version) - pip, a tool for installing and managing Python packages. - """, - postflight="scripts/postflight.ensurepip", - topdir="/Library/Frameworks/Python.framework", - source="/empty-dir", - required=False, - selected='selected', - ) - ) - if getDeptargetTuple() < (10, 4) and not PYTHON_3: result.append( dict( @@ -977,7 +971,7 @@ shellQuote(os.path.join(SRCDIR, 'configure')), shellQuote(SDKPATH), UNIVERSALARCHS, (' ', '--with-computed-gotos ')[PYTHON_3], - (' ', '--without-ensurepip ')[getVersionTuple() >= (3, 4)], + (' ', '--without-ensurepip ')[PYTHON_3], shellQuote(WORKDIR)[1:-1], shellQuote(WORKDIR)[1:-1])) @@ -1159,7 +1153,9 @@ fp.close() def patchScript(inPath, outPath): + major, minor = getVersionMajorMinor() data = fileContents(inPath) + data = data.replace('@PYMAJOR@', str(major)) data = data.replace('@PYVER@', getVersion()) fp = open(outPath, 'w') fp.write(data) diff --git a/Mac/BuildScript/scripts/postflight.ensurepip b/Mac/BuildScript/scripts/postflight.ensurepip new file mode 100755 --- /dev/null +++ b/Mac/BuildScript/scripts/postflight.ensurepip @@ -0,0 +1,69 @@ +#!/bin/sh +# +# Install/upgrade pip. 
+# + +PYVER="@PYVER@" +PYMAJOR="@PYMAJOR@" +FWK="/Library/Frameworks/Python.framework/Versions/${PYVER}" +RELFWKBIN="../../..${FWK}/bin" + +umask 022 + +"${FWK}/bin/python${PYVER}" -m ensurepip --upgrade + +"${FWK}/bin/python${PYVER}" -Wi \ + "${FWK}/lib/python${PYVER}/compileall.py" \ + -f -x badsyntax \ + "${FWK}/lib/python${PYVER}/site-packages" + +"${FWK}/bin/python${PYVER}" -Wi -O \ + "${FWK}/lib/python${PYVER}/compileall.py" \ + -f -x badsyntax \ + "${FWK}/lib/python${PYVER}/site-packages" + +chgrp -R admin "${FWK}/lib/python${PYVER}/site-packages" "${FWK}/bin" +chmod -R g+w "${FWK}/lib/python${PYVER}/site-packages" "${FWK}/bin" + +# We do not know if the user selected the Python command-line tools +# package that installs symlinks to /usr/local/bin. So we assume +# that the command-line tools package has already completed or was +# not selected and we will only install /usr/local/bin symlinks for +# pip et al if there are /usr/local/bin/python* symlinks to our +# framework bin directory. + +if [ -d /usr/local/bin ] ; then + ( + install_links_if_our_fw() { + if [ "$(readlink -n ./$1)" = "${RELFWKBIN}/$1" ] ; then + shift + for fn ; + do + if [ -e "${RELFWKBIN}/${fn}" ] ; then + rm -f ./${fn} + ln -s "${RELFWKBIN}/${fn}" "./${fn}" + chgrp -h admin "./${fn}" + chmod -h g+w "./${fn}" + fi + done + fi + } + + cd /usr/local/bin + + # Create pipx.y and easy_install-x.y links if /usr/local/bin/pythonx.y + # is linked to this framework version + install_links_if_our_fw "python${PYVER}" \ + "pip${PYVER}" "easy_install-${PYVER}" + + # Create pipx link if /usr/local/bin/pythonx is linked to this version + install_links_if_our_fw "python${PYMAJOR}" \ + "pip${PYMAJOR}" + + # Create pip and easy_install link if /usr/local/bin/python + # is linked to this version + install_links_if_our_fw "python" \ + "pip" "easy_install" + ) +fi +exit 0 diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -324,6 +324,8 @@ - Issue #17219: Add library build dir for Python extension cross-builds. +- Issue #22877: PEP 477 - OS X installer now installs pip. + Windows ------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 04:00:03 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 15 Nov 2014 03:00:03 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Update_OS_X_in?= =?utf-8?q?staller_documentation_files_for_2=2E7=2E9=2E?= Message-ID: <20141115030001.15639.72150@psf.io> https://hg.python.org/cpython/rev/33d68c79d601 changeset: 93491:33d68c79d601 branch: 2.7 parent: 93488:6b8e107622b3 user: Ned Deily date: Fri Nov 14 18:57:13 2014 -0800 summary: Update OS X installer documentation files for 2.7.9. files: Mac/BuildScript/resources/ReadMe.txt | 116 ++++--------- Mac/BuildScript/resources/Welcome.rtf | 20 +- Mac/BuildScript/resources/readme.rtf | 92 +++++++++++ 3 files changed, 147 insertions(+), 81 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -1,88 +1,52 @@ -This package will install Python $FULL_VERSION for Mac OS X -$MACOSX_DEPLOYMENT_TARGET for the following architecture(s): -$ARCHITECTURES. +This package will install Python $FULL_VERSION for Mac OS X $MACOSX_DEPLOYMENT_TARGET for the following architecture(s): $ARCHITECTURES. 
- **** IMPORTANT **** +============================= +Update your version of Tcl/Tk to use IDLE or other Tk applications +============================= +To use IDLE or other programs that use the Tkinter graphical user interface toolkit, you need to install a newer third-party version of the Tcl/Tk frameworks. Visit https://www.python.org/download/mac/tcltk/ for current information about supported and recommended versions of Tcl/Tk for this version of Python and of Mac OS X. + +============================= Installing on OS X 10.8 (Mountain Lion) or later systems -======================================================== +[CHANGED for Python 2.7.9] +============================= -If you are attempting to install on an OS X 10.8+ system, you may -see a message that Python can't be installed because it is from an -unidentified developer. This is because this Python installer -package is not yet compatible with the Gatekeeper security feature -introduced in OS X 10.8. To allow Python to be installed, you -can override the Gatekeeper policy for this install. In the Finder, -instead of double-clicking, control-click or right click the "Python" -installer package icon. Then select "Open using ... Installer" from -the contextual menu that appears. +As of Python 2.7.9, installer packages from python.org are now compatible with the Gatekeeper security feature introduced in OS X 10.8. Downloaded packages can now be directly installed by double-clicking with the default system security settings. Python.org installer packages for OS X are signed with the Developer ID of the builder, as identified on the download page for this release (https://www.python.org/downloads/). To inspect the digital signature of the package, click on the lock icon in the upper right corner of the Install Python installer window. Refer to Apple?s support pages for more information on Gatekeeper (http://support.apple.com/kb/ht5290). - **** IMPORTANT **** +============================= +Simplified web-based installs +[NEW for Python 2.7.9] +============================= -Update your version of Tcl/Tk to use IDLE or other Tk applications -================================================================== +With the change to the newer flat format installer package, the download file now has a .pkg extension as it is no longer necessary to embed the installer within a disk image (.dmg) container. If you download the Python installer through a web browser, the OS X installer application may open automatically to allow you to perform the install. If your browser settings do not allow automatic open, double click on the downloaded installer file. -To use IDLE or other programs that use the Tkinter graphical user -interface toolkit, you may need to install a newer third-party version -of the Tcl/Tk frameworks. Visit http://www.python.org/download/mac/tcltk/ -for current information about supported and recommended versions of -Tcl/Tk for this version of Python and of Mac OS X. +============================= +New Installation Options and Defaults +[NEW for Python 2.7.9] +============================= - **** IMPORTANT **** +The Python installer now includes an option to automatically install or upgrade pip, a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the Customize option at the Installation Type step and uncheck the Install or ugprade pip option. 
-Binary installer support for 10.4 and 10.3.9 to be discontinued -=============================================================== +============================= +Binary installer support for OS X 10.4 and 10.3.9 discontinued +[CHANGED for Python 2.7.9] +============================= -Python 2.7.7 is the last release for which binary installers will be -released on python.org that support OS X 10.3.9 (Panther) and 10.4.x -(Tiger) systems. These systems were last updated by Apple in 2005 -and 2007. As of 2.7.8, the 32-bit-only installer will support PPC -and Intel Macs running OS X 10.5 (Leopard) and later. 10.5 was the -last OS X release for PPC machines (G4 and G5). (The 64-/32-bit -installer configuration will remain unchanged.) This aligns Python -2.7.x installer configurations with those currently provided with -Python 3.x. Some of the reasons for making this change are: -there were significant additions and compatibility improvements to -the OS X POSIX system APIs in OS X 10.5 that Python users can now -take advantage of; it is increasingly difficult to build and test -on obsolete 10.3 and 10.4 systems and with the 10.3 ABI; and it is -assumed that most remaining legacy PPC systems have upgraded to 10.5. -To ease the transition, for Python 2.7.7 only we are providing three -binary installers: (1) the legacy deprecated 32-bit-only 10.3+ -PPC/Intel format, (2) the newer 32-bit-only 10.5+ PPC/Intel format, -and (3) the current 64-bit/32-bit 10.6+ Intel-only format. While -future releases will not provide the deprecated installer, it will -still be possible to build Python from source on 10.3.9 and 10.4 -systems if needed. +As previously announced, binary installers for Python 2.7.9 from python.org +no longer support Mac OS X 10.3.9 (Panther) and 10.4.x (Tiger) systems. +These systems were last updated by Apple in 2005 and 2007. As of 2.7.9, the +32-bit-only installer supports PPC and Intel Macs running OS X 10.5 (Leopard). +10.5 was the last OS X release for PPC machines (G4 and G5). The 64-/32-bit +installer configuration remains unchanged and should normally be used on OS X +10.6 (Snow Leopard) and later systems. This aligns Python 2.7.x installer +configurations with those currently provided with Python 3.x. If needed, +it is still possible to build Python from source for 10.3.9 and 10.4. -Using this version of Python on OS X -==================================== +============================= +Python 3 and Python 2 Co-existence +============================= -Python consists of the Python programming language interpreter, plus -a set of programs to allow easy access to it for Mac users including -an integrated development environment, IDLE, plus a set of pre-built -extension modules that open up specific Macintosh technologies to -Python programs. - -The installer puts applications, an "Update Shell Profile" command, -and a link to the optionally installed Python Documentation into the -"Python $VERSION" subfolder of the system Applications folder, -and puts the underlying machinery into the folder -$PYTHONFRAMEWORKINSTALLDIR. It can -optionally place links to the command-line tools in /usr/local/bin as -well. Double-click on the "Update Shell Profile" command to add the -"bin" directory inside the framework to your shell's search path. - -You must install onto your current boot disk, even though the -installer may not enforce this, otherwise things will not work. 
- -You can verify the integrity of the disk image file containing the -installer package and this ReadMe file by comparing its md5 checksum -and size with the values published on the release page linked at -http://www.python.org/download/ - -Installation requires approximately $INSTALL_SIZE MB of disk space, -ignore the message that it will take zero bytes. - -More information on Python in general can be found at -http://www.python.org. +Python.org Python 2.7 and 3.x versions can both be installed on your system and +will not conflict. Python 2 command names contain a 2 or no digit: python2 (or +python2.7 or python), idle2 (or idle2.7 or idle), pip2 (or pip2.7 or pip), etc. +Command names for Python 3 contain a 3 in them: python3, idle3, pip3, etc. diff --git a/Mac/BuildScript/resources/Welcome.rtf b/Mac/BuildScript/resources/Welcome.rtf --- a/Mac/BuildScript/resources/Welcome.rtf +++ b/Mac/BuildScript/resources/Welcome.rtf @@ -1,5 +1,5 @@ -{\rtf1\ansi\ansicpg1252\cocoartf1265\cocoasubrtf200 -\cocoascreenfonts1{\fonttbl\f0\fswiss\fcharset0 Helvetica;} +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +\cocoascreenfonts1{\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} {\colortbl;\red255\green255\blue255;} \paperw11905\paperh16837\margl1440\margr1440\vieww9640\viewh10620\viewkind0 \pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640 @@ -14,9 +14,19 @@ \b Python for Mac OS X \b0 consists of the Python programming language interpreter, plus a set of programs to allow easy access to it for Mac OS X users including an integrated development environment \b IDLE -\b0 and a set of pre-built extension modules that open up specific Macintosh technologies to Python programs.\ +\b0 .\ \ -See the ReadMe file and the Python documentation for important information, including the dropping of support for OS X 10.3.9 and 10.4 in future Python 2.7.x binary installers.\ + +\b NEW for Python 2.7.9: +\b0 This package installs a version of +\f1 pip +\f0 , the recommended tool for installing and managing Python packages. Type\ +\ + +\f1 pip2.7 --help +\f0 \ +\ +for an overview. See the ReadMe file and the Python documentation for more information.\ \ \b IMPORTANT: @@ -26,4 +36,4 @@ \b tkinter \b0 graphical user interface toolkit require specific versions of the \b Tcl/Tk -\b0 platform independent windowing toolkit. Visit {\field{\*\fldinst{HYPERLINK "http://www.python.org/download/mac/tcltk/"}}{\fldrslt http://www.python.org/download/mac/tcltk/}} for current information on supported and recommended versions of Tcl/Tk for this version of Python and Mac OS X.} \ No newline at end of file +\b0 platform independent windowing toolkit. 
Visit {\field{\*\fldinst{HYPERLINK "https://www.python.org/download/mac/tcltk/"}}{\fldrslt https://www.python.org/download/mac/tcltk/}} for current information on supported and recommended versions of Tcl/Tk for this version of Python and Mac OS X.} \ No newline at end of file diff --git a/Mac/BuildScript/resources/readme.rtf b/Mac/BuildScript/resources/readme.rtf new file mode 100644 --- /dev/null +++ b/Mac/BuildScript/resources/readme.rtf @@ -0,0 +1,92 @@ +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +{\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} +{\colortbl;\red255\green255\blue255;} +\margl1440\margr1440\vieww15240\viewh15540\viewkind0 +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural + +\f0\fs24 \cf0 This package will install Python $FULL_VERSION for Mac OS X $MACOSX_DEPLOYMENT_TARGET for the following architecture(s): $ARCHITECTURES.\ +\ + +\b \ul Update your version of Tcl/Tk to use IDLE or other Tk applications +\b0 \ulnone \ +\ +To use IDLE or other programs that use the Tkinter graphical user interface toolkit, you need to install a newer third-party version of the +\i Tcl/Tk +\i0 frameworks. Visit {\field{\*\fldinst{HYPERLINK "https://www.python.org/download/mac/tcltk/"}}{\fldrslt https://www.python.org/download/mac/tcltk/}} for current information about supported and recommended versions of +\i Tcl/Tk +\i0 for this version of Python and of Mac OS X.\ + +\b \ul \ +Installing on OS X 10.8 (Mountain Lion) or later systems\ +\ulnone [CHANGED for Python 2.7.9] +\b0 \ +\ +As of Python 2.7.9, installer packages from python.org are now compatible with the Gatekeeper security feature introduced in OS X 10.8. Downloaded packages can now be directly installed by double-clicking with the default system security settings. Python.org installer packages for OS X are signed with the Developer ID of the builder, as identified on the download page for this release ({\field{\*\fldinst{HYPERLINK "https://www.python.org/downloads/"}}{\fldrslt https://www.python.org/downloads/}}). To inspect the digital signature of the package, click on the lock icon in the upper right corner of the +\i Install Python +\i0 installer window. Refer to Apple\'92s support pages for more information on Gatekeeper ({\field{\*\fldinst{HYPERLINK "http://support.apple.com/kb/ht5290"}}{\fldrslt http://support.apple.com/kb/ht5290}}).\ +\ + +\b \ul Simplified web-based installs\ +\ulnone [NEW for Python 2.7.9] +\b0 \ +\ +With the change to the newer flat format installer package, the download file now has a +\f1 .pkg +\f0 extension as it is no longer necessary to embed the installer within a disk image ( +\f1 .dmg +\f0 ) container. If you download the Python installer through a web browser, the OS X installer application may open automatically to allow you to perform the install. If your browser settings do not allow automatic open, double click on the downloaded installer file.\ +\ +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural + +\b \cf0 \ul \ulc0 New Installation Options and Defaults\ +\ulnone [NEW for Python 2.7.9] +\b0 \ +\ +The Python installer now includes an option to automatically install or upgrade +\f1 pip +\f0 , a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. 
If you do not want the installer to do this, select the +\i Customize +\i0 option at the +\i Installation Type +\i0 step and uncheck the +\i Install or ugprade pip +\i0 option.\ +\ + +\b \ul Binary installer support for OS X 10.4 and 10.3.9 discontinued\ +\ulnone [CHANGED for Python 2.7.9] +\b0 \ +\ +As previously announced, binary installers for Python 2.7.9 from python.org no longer support Mac OS X 10.3.9 (Panther) and 10.4.x (Tiger) systems. These systems were last updated by Apple in 2005 and 2007. As of 2.7.9, the 32-bit-only installer supports PPC and Intel Macs running OS X 10.5 (Leopard). 10.5 was the last OS X release for PPC machines (G4 and G5). The 64-/32-bit installer configuration remains unchanged and should normally be used on OS X 10.6 (Snow Leopard) and later systems. This aligns Python 2.7.x installer configurations with those currently provided with Python 3.x. If needed, it is still possible to build Python from source for 10.3.9 and 10.4.\ +\ + +\b \ul Python 3 and Python 2 Co-existence\ + +\b0 \ulnone \ +Python.org Python 2.7 and 3.x versions can both be installed on your system and will not conflict. Python 2.7 command names contain a 2 or no digit: +\f1 python2 +\f0 (or +\f1 python2.7 +\f0 or +\f1 python +\f0 ), +\f1 idle2 +\f0 (or +\f1 idle2.7 +\f0 or +\f1 idle +\f0 ), +\f1 pip2 +\f0 (or +\f1 pip2.7 +\f0 or +\f1 pip +\f0 ), etc. Command names for Python 3 contain a 3 in them, +\f1 python3 +\f0 , +\f1 idle3 +\f0 , +\f1 pip3 +\f0 , etc.\ +\ +} \ No newline at end of file -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 04:00:08 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 15 Nov 2014 03:00:08 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Update_OS_X_installer_docu?= =?utf-8?q?mentation_files_for_3=2E5=2E0?= Message-ID: <20141115030002.51555.89292@psf.io> https://hg.python.org/cpython/rev/e79c6ea48b83 changeset: 93492:e79c6ea48b83 parent: 93490:6270a2181ed3 user: Ned Deily date: Fri Nov 14 18:41:56 2014 -0800 summary: Update OS X installer documentation files for 3.5.0 files: Mac/BuildScript/resources/ReadMe.txt | 97 +------------- Mac/BuildScript/resources/Welcome.rtf | 22 +-- Mac/BuildScript/resources/readme.rtf | 51 +++++++ 3 files changed, 65 insertions(+), 105 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -1,92 +1,13 @@ -This package will install Python $FULL_VERSION for Mac OS X -$MACOSX_DEPLOYMENT_TARGET for the following architecture(s): -$ARCHITECTURES. +This package will install Python $FULL_VERSION for Mac OS X $MACOSX_DEPLOYMENT_TARGET for the following architecture(s): $ARCHITECTURES. - **** IMPORTANT **** +============================= +Update your version of Tcl/Tk to use IDLE or other Tk applications +============================= -Installing on OS X 10.8 (Mountain Lion) or later systems -======================================================== +To use IDLE or other programs that use the Tkinter graphical user interface toolkit, you need to install a newer third-party version of the Tcl/Tk frameworks. Visit https://www.python.org/download/mac/tcltk/ for current information about supported and recommended versions of Tcl/Tk for this version of Python and of Mac OS X. -If you are attempting to install on an OS X 10.8+ system, you may -see a message that Python can't be installed because it is from an -unidentified developer. 
This is because this Python installer -package is not yet compatible with the Gatekeeper security feature -introduced in OS X 10.8. To allow Python to be installed, you -can override the Gatekeeper policy for this install. In the Finder, -instead of double-clicking, control-click or right click the "Python" -installer package icon. Then select "Open using ... Installer" from -the contextual menu that appears. +============================= +Python 3 and Python 2 Co-existence +============================= - **** IMPORTANT **** - -Update your version of Tcl/Tk to use IDLE or other Tk applications -================================================================== - -To use IDLE or other programs that use the Tkinter graphical user -interface toolkit, you may need to install a newer third-party version -of the Tcl/Tk frameworks. Visit http://www.python.org/download/mac/tcltk/ -for current information about supported and recommended versions of -Tcl/Tk for this version of Python and of Mac OS X. - - **NEW* As of Python 3.4.0b1: - -New Installation Options and Defaults -===================================== - -The Python installer now includes an option to automatically install -or upgrade pip, a tool for installing and managing Python packages. -This option is enabled by default and no Internet access is required. -If you do not want the installer to do this, select the "Customize" -option at the "Installation Type" step and uncheck the "Install or -ugprade pip" option. - -To make it easier to use scripts installed by third-party Python -packages, with pip or by other means, the "Shell profile updater" -option is now enabled by default, as has been the case with Python -2.7.x installers. You can also turn this option off by selecting -"Customize" and unchecking the "Shell profile updater" option. You -can also update your shell profile later by launching the "Update -Shell Profile" command found in the /Applications/Python $VERSION -folder. You may need to start a new terminal window for the -changes to take effect. - -Python.org Python $VERSION and 2.7.x versions can both be installed and -will not conflict. Command names for Python 3 contain a 3 in them, -python3 (or python$VERSION), idle3 (or idle$VERSION), pip3 (or pip$VERSION), etc. -Python 2.7 command names contain a 2 or no digit: python2 (or -python2.7 or python), idle2 (or idle2.7 or idle), etc. If you want to -use pip with Python 2.7.x, you will need to download and install a -separate copy of it from the Python Package Index -(https://pypi.python.org/pypi). - -Using this version of Python on OS X -==================================== - -Python consists of the Python programming language interpreter, plus -a set of programs to allow easy access to it for Mac users including -an integrated development environment, IDLE, plus a set of pre-built -extension modules that open up specific Macintosh technologies to -Python programs. - -The installer puts applications, an "Update Shell Profile" command, -and a link to the optionally installed Python Documentation into the -"Python $VERSION" subfolder of the system Applications folder, -and puts the underlying machinery into the folder -$PYTHONFRAMEWORKINSTALLDIR. It can -optionally place links to the command-line tools in /usr/local/bin as -well. Double-click on the "Update Shell Profile" command to add the -"bin" directory inside the framework to your shell's search path. 
- -You must install onto your current boot disk, even though the -installer may not enforce this, otherwise things will not work. - -You can verify the integrity of the disk image file containing the -installer package and this ReadMe file by comparing its md5 checksum -and size with the values published on the release page linked at -http://www.python.org/download/ - -Installation requires approximately $INSTALL_SIZE MB of disk space, -ignore the message that it will take zero bytes. - -More information on Python in general can be found at -http://www.python.org. +Python.org Python $VERSION and 2.7.x versions can both be installed on your system and will not conflict. Command names for Python 3 contain a 3 in them, python3 (or python$VERSION), idle3 (or idle$VERSION), pip3 (or pip$VERSION), etc. Python 2.7 command names contain a 2 or no digit: python2 (or python2.7 or python), idle2 (or idle2.7 or idle), etc. If you want to use pip with Python 2.7.x, download and install a separate copy of it from the Python Package Index (https://pypi.python.org/pypi/pip/). diff --git a/Mac/BuildScript/resources/Welcome.rtf b/Mac/BuildScript/resources/Welcome.rtf --- a/Mac/BuildScript/resources/Welcome.rtf +++ b/Mac/BuildScript/resources/Welcome.rtf @@ -1,7 +1,7 @@ -{\rtf1\ansi\ansicpg1252\cocoartf1187\cocoasubrtf400 -\cocoascreenfonts1{\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +\cocoascreenfonts1{\fonttbl\f0\fswiss\fcharset0 Helvetica;} {\colortbl;\red255\green255\blue255;} -\paperw11905\paperh16837\margl1440\margr1440\vieww9640\viewh10620\viewkind0 +\paperw11905\paperh16837\margl1440\margr1440\vieww12200\viewh10880\viewkind0 \pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640 \f0\fs24 \cf0 This package will install @@ -14,19 +14,7 @@ \b Python for Mac OS X \b0 consists of the Python programming language interpreter, plus a set of programs to allow easy access to it for Mac OS X users including an integrated development environment \b IDLE -\b0 and a set of pre-built extension modules that open up specific Macintosh technologies to Python programs.\ -\ - -\b NEW for Python 3.4: -\b0 This package now updates your shell profile by default to make $FULL_VERSION the default Python 3 version. This version can co-exist with other installed versions of Python 3 and Python 2. This package also installs a version of -\f1 pip -\f0 , the recommended tool for installing and managing Python packages. Type\ -\ - -\f1 pip3.4 --help -\f0 \ -\ -for an overview. See the ReadMe file and the Python documentation for more information.\ +\b0 .\ \ \b IMPORTANT: @@ -36,4 +24,4 @@ \b tkinter \b0 graphical user interface toolkit require specific versions of the \b Tcl/Tk -\b0 platform independent windowing toolkit. Visit {\field{\*\fldinst{HYPERLINK "http://www.python.org/download/mac/tcltk/"}}{\fldrslt http://www.python.org/download/mac/tcltk/}} for current information on supported and recommended versions of Tcl/Tk for this version of Python and Mac OS X.} \ No newline at end of file +\b0 platform independent windowing toolkit. 
Visit {\field{\*\fldinst{HYPERLINK "https://www.python.org/download/mac/tcltk/"}}{\fldrslt https://www.python.org/download/mac/tcltk/}} for current information on supported and recommended versions of Tcl/Tk for this version of Python and Mac OS X.} \ No newline at end of file diff --git a/Mac/BuildScript/resources/readme.rtf b/Mac/BuildScript/resources/readme.rtf new file mode 100644 --- /dev/null +++ b/Mac/BuildScript/resources/readme.rtf @@ -0,0 +1,51 @@ +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +{\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} +{\colortbl;\red255\green255\blue255;} +\margl1440\margr1440\vieww13020\viewh15160\viewkind0 +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural + +\f0\fs24 \cf0 This package will install Python $FULL_VERSION for Mac OS X $MACOSX_DEPLOYMENT_TARGET for the following architecture(s): $ARCHITECTURES.\ +\ + +\b \ul Update your version of Tcl/Tk to use IDLE or other Tk applications +\b0 \ulnone \ +\ +To use IDLE or other programs that use the Tkinter graphical user interface toolkit, you need to install a newer third-party version of the +\i Tcl/Tk +\i0 frameworks. Visit {\field{\*\fldinst{HYPERLINK "https://www.python.org/download/mac/tcltk/"}}{\fldrslt https://www.python.org/download/mac/tcltk/}} for current information about supported and recommended versions of +\i Tcl/Tk +\i0 for this version of Python and of Mac OS X.\ + +\b \ul \ +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural +\cf0 \ulc0 Python 3 and Python 2 Co-existence\ + +\b0 \ulnone \ +Python.org Python $VERSION and 2.7.x versions can both be installed on your system and will not conflict. Command names for Python 3 contain a 3 in them, +\f1 python3 +\f0 (or +\f1 python$VERSION +\f0 ), +\f1 idle3 +\f0 (or i +\f1 dle$VERSION +\f0 ), +\f1 pip3 +\f0 (or +\f1 pip$VERSION +\f0 ), etc. Python 2.7 command names contain a 2 or no digit: +\f1 python2 +\f0 (or +\f1 python2.7 +\f0 or +\f1 python +\f0 ), +\f1 idle2 +\f0 (or +\f1 idle2.7 +\f0 or +\f1 idle +\f0 ), etc. If you want to use +\f1 pip +\f0 with Python 2.7.x, download and install a separate copy of it from the Python Package Index ({\field{\*\fldinst{HYPERLINK "https://pypi.python.org/pypi/pip/"}}{\fldrslt https://pypi.python.org/pypi/pip/}}).\ +} \ No newline at end of file -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 10:19:13 2014 From: python-checkins at python.org (georg.brandl) Date: Sat, 15 Nov 2014 09:19:13 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_PEP_479=3A_Change_StopIte?= =?utf-8?q?ration_handling_inside_generators=2C_by_Chris_Angelico=2E?= Message-ID: <20141115091909.51557.18557@psf.io> https://hg.python.org/peps/rev/c8d6596edaed changeset: 5595:c8d6596edaed user: Georg Brandl date: Sat Nov 15 10:13:42 2014 +0100 summary: Add PEP 479: Change StopIteration handling inside generators, by Chris Angelico. 
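The surprise that motivates the PEP is easy to reproduce with a few lines; the helper below is invented purely for illustration and is not part of the PEP:

    def check(x):
        # Intended as "stop here", but raising StopIteration inside a
        # generator frame is indistinguishable from normal exhaustion.
        if x is None:
            raise StopIteration
        return x

    data = [1, 2, None, 3]

    list(check(x) for x in data)   # generator expression: the StopIteration
                                   # is swallowed and the result is [1, 2]
    [check(x) for x in data]       # list comprehension: the same exception
                                   # propagates as a visible traceback

Under the proposal, a StopIteration escaping the generator expression's frame would be replaced with another exception, so both spellings would fail loudly instead of diverging.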
files: pep-0479.txt | 123 +++++++++++++++++++++++++++++++++++++++ 1 files changed, 123 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt new file mode 100644 --- /dev/null +++ b/pep-0479.txt @@ -0,0 +1,123 @@ +PEP: 479 +Title: Change StopIteration handling inside generators +Version: $Revision$ +Last-Modified: $Date$ +Author: Chris Angelico +Status: Draft +Type: Standards Track +Content-Type: text/x-rst +Created: 15-Nov-2014 +Python-Version: 3.5 +Post-History: + + +Abstract +======== + +This PEP proposes a semantic change to ``StopIteration`` when raised +inside a generator, unifying the behaviour of list comprehensions and +generator expressions somewhat. + + +Rationale +========= + +The interaction of generators and ``StopIteration`` is currently +somewhat surprising, and can conceal obscure bugs. An unexpected +exception should not result in subtly altered behaviour, but should +cause a noisy and easily-debugged traceback. Currently, +``StopIteration`` can be absorbed by the generator construct. + + +Proposal +======== + +If a ``StopIteration`` is about to bubble out of a generator frame, it +is replaced with some other exception (maybe ``RuntimeError``, maybe a +new custom ``Exception`` subclass, but *not* deriving from +``StopIteration``) which causes the ``next()`` call (which invoked the +generator) to fail, passing that exception out. From then on it's +just like any old exception. [3]_ + + +Consequences to existing code +============================= + +This change will affect existing code that depends on +``StopIteration`` bubbling up. The pure Python reference +implementation of ``groupby`` [1]_ currently has comments "Exit on +``StopIteration``" where it is expected that the exception will +propagate and then be handled. This will be unusual, but not unknown, +and such constructs will fail. + +(Nick Coghlan comments: """If you wanted to factor out a helper +function that terminated the generator you'd have to do "return +yield from helper()" rather than just "helper()".""") + +As this can break code, it is proposed to utilize the ``__future__`` +mechanism to introduce this, finally making it standard in Python 3.6 +or 3.7. + + +Alternate proposals +=================== + +Supplying a specific exception to raise on return +------------------------------------------------- + +Nick Coghlan suggested a means of providing a specific +``StopIteration`` instance to the generator; if any other instance of +``StopIteration`` is raised, it is an error, but if that particular +one is raised, the generator has properly completed. + + +Making return-triggered StopIterations obvious +---------------------------------------------- + +For certain situations, a simpler and fully backward-compatible +solution may be sufficient: when a generator returns, instead of +raising ``StopIteration``, it raises a specific subclass of +``StopIteration`` which can then be detected. If it is not that +subclass, it is an escaping exception rather than a return statement. + + +Criticism +========= + +Unofficial and apocryphal statistics suggest that this is seldom, if +ever, a problem. [4]_ Code does exist which relies on the current +behaviour, and there is the concern that this would be unnecessary +code churn to achieve little or no gain. + + +References +========== + +.. [1] Initial mailing list comment + (https://mail.python.org/pipermail/python-ideas/2014-November/029906.html) + +.. 
[2] Pure Python implementation of groupby + (https://docs.python.org/3/library/itertools.html#itertools.groupby) + +.. [3] Proposal by GvR + (https://mail.python.org/pipermail/python-ideas/2014-November/029953.html) + +.. [4] Response by Steven D'Aprano + (https://mail.python.org/pipermail/python-ideas/2014-November/029994.html) + + +Copyright +========= + +This document has been placed in the public domain. + + + +.. + Local Variables: + mode: indented-text + indent-tabs-mode: nil + sentence-end-double-space: t + fill-column: 70 + coding: utf-8 + End: -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Sat Nov 15 10:31:30 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sat, 15 Nov 2014 10:31:30 +0100 Subject: [Python-checkins] Daily reference leaks (97dc64adb6fe): sum=3 Message-ID: results for 97dc64adb6fe on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogAxuKtE', '-x'] From python-checkins at python.org Sat Nov 15 10:38:09 2014 From: python-checkins at python.org (georg.brandl) Date: Sat, 15 Nov 2014 09:38:09 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_Post-History_to_PEP_479?= =?utf-8?q?=2E?= Message-ID: <20141115093808.29208.23851@psf.io> https://hg.python.org/peps/rev/f956c67f79ab changeset: 5596:f956c67f79ab user: Georg Brandl date: Sat Nov 15 10:38:00 2014 +0100 summary: Add Post-History to PEP 479. files: pep-0479.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -8,7 +8,7 @@ Content-Type: text/x-rst Created: 15-Nov-2014 Python-Version: 3.5 -Post-History: +Post-History: 15-Nov-2014 Abstract -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sat Nov 15 13:05:31 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sat, 15 Nov 2014 12:05:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322823=3A_Use_set_?= =?utf-8?q?literals_instead_of_creating_a_set_from_a_tuple=2E?= Message-ID: <20141115120528.29230.17272@psf.io> https://hg.python.org/cpython/rev/f4e75efdc7f1 changeset: 93496:f4e75efdc7f1 user: Serhiy Storchaka date: Sat Nov 15 13:30:42 2014 +0200 summary: Issue #22823: Use set literals instead of creating a set from a tuple. 
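The two spellings produce identical sets; the literal form simply avoids building a throwaway tuple at runtime. A quick illustrative check:

    # Same result either way; the literal skips the intermediate tuple.
    assert set(("bytes",)) == {"bytes"}

    # Unions of such sets, as used in clinic.py, are likewise unchanged:
    assert {"bytearray"} | {"bytes"} | {"str"} == {"bytearray", "bytes", "str"}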
files: Tools/clinic/clinic.py | 18 +++++++++--------- 1 files changed, 9 insertions(+), 9 deletions(-) diff --git a/Tools/clinic/clinic.py b/Tools/clinic/clinic.py --- a/Tools/clinic/clinic.py +++ b/Tools/clinic/clinic.py @@ -2535,9 +2535,9 @@ length=False, nullable=False, zeroes=False): types = set(types.strip().split()) - bytes_type = set(("bytes",)) - str_type = set(("str",)) - all_3_type = set(("bytearray",)) | bytes_type | str_type + bytes_type = {"bytes"} + str_type = {"str"} + all_3_type = {"bytearray"} | bytes_type | str_type is_bytes = types == bytes_type is_str = types == str_type is_all_3 = types == all_3_type @@ -2633,12 +2633,12 @@ fail("The only legal default value for Py_buffer is None.") self.c_default = self.c_ignored_default types = set(types.strip().split()) - bytes_type = set(('bytes',)) - bytearray_type = set(('bytearray',)) - buffer_type = set(('buffer',)) - rwbuffer_type = set(('rwbuffer',)) - robuffer_type = set(('robuffer',)) - str_type = set(('str',)) + bytes_type = {'bytes'} + bytearray_type = {'bytearray'} + buffer_type = {'buffer'} + rwbuffer_type = {'rwbuffer'} + robuffer_type = {'robuffer'} + str_type = {'str'} bytes_bytearray_buffer_type = bytes_type | bytearray_type | buffer_type format_unit = None -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 13:05:31 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sat, 15 Nov 2014 12:05:31 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322193=3A_Fixed_integer_overflow_error_in_sys=2E?= =?utf-8?b?Z2V0c2l6ZW9mKCku?= Message-ID: <20141115120528.29210.16719@psf.io> https://hg.python.org/cpython/rev/b7651f9be4a1 changeset: 93495:b7651f9be4a1 parent: 93492:e79c6ea48b83 parent: 93494:df5c6b05238e user: Serhiy Storchaka date: Sat Nov 15 13:22:27 2014 +0200 summary: Issue #22193: Fixed integer overflow error in sys.getsizeof(). Fixed an error in _PySys_GetSizeOf declaration. 
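The behaviour pinned down by the new tests can be summarised with a short sketch (the subclass name mirrors the one used in the test suite):

    import sys

    class OverflowSizeof(int):
        def __sizeof__(self):
            # Report whatever integer this object holds as its "size".
            return int(self)

    sys.getsizeof(OverflowSizeof(sys.maxsize))      # accepted; gc header size added
    sys.getsizeof(OverflowSizeof(sys.maxsize + 1))  # now raises OverflowError
    sys.getsizeof(OverflowSizeof(-1))               # now raises ValueError

The 2.7 and 3.4 backports in the following messages add the same checks.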
files: Include/sysmodule.h | 2 +- Lib/test/test_sys.py | 31 +++++++++++++++++++++++++++++++ Python/sysmodule.c | 15 ++++++++++----- 3 files changed, 42 insertions(+), 6 deletions(-) diff --git a/Include/sysmodule.h b/Include/sysmodule.h --- a/Include/sysmodule.h +++ b/Include/sysmodule.h @@ -34,7 +34,7 @@ PyAPI_FUNC(PyObject *) PySys_GetXOptions(void); #ifndef Py_LIMITED_API -PyAPI_DATA(size_t) _PySys_GetSizeOf(PyObject *); +PyAPI_FUNC(size_t) _PySys_GetSizeOf(PyObject *); #endif #ifdef __cplusplus diff --git a/Lib/test/test_sys.py b/Lib/test/test_sys.py --- a/Lib/test/test_sys.py +++ b/Lib/test/test_sys.py @@ -770,6 +770,37 @@ # but lists are self.assertEqual(sys.getsizeof([]), vsize('Pn') + gc_header_size) + def test_errors(self): + class BadSizeof: + def __sizeof__(self): + raise ValueError + self.assertRaises(ValueError, sys.getsizeof, BadSizeof()) + + class InvalidSizeof: + def __sizeof__(self): + return None + self.assertRaises(TypeError, sys.getsizeof, InvalidSizeof()) + sentinel = ["sentinel"] + self.assertIs(sys.getsizeof(InvalidSizeof(), sentinel), sentinel) + + class FloatSizeof: + def __sizeof__(self): + return 4.5 + self.assertRaises(TypeError, sys.getsizeof, FloatSizeof()) + self.assertIs(sys.getsizeof(FloatSizeof(), sentinel), sentinel) + + class OverflowSizeof(int): + def __sizeof__(self): + return int(self) + self.assertEqual(sys.getsizeof(OverflowSizeof(sys.maxsize)), + sys.maxsize + self.gc_headsize) + with self.assertRaises(OverflowError): + sys.getsizeof(OverflowSizeof(sys.maxsize + 1)) + with self.assertRaises(ValueError): + sys.getsizeof(OverflowSizeof(-1)) + with self.assertRaises((ValueError, OverflowError)): + sys.getsizeof(OverflowSizeof(-sys.maxsize - 1)) + def test_default(self): size = test.support.calcvobjsize self.assertEqual(sys.getsizeof(True), size('') + self.longdigit) diff --git a/Python/sysmodule.c b/Python/sysmodule.c --- a/Python/sysmodule.c +++ b/Python/sysmodule.c @@ -868,7 +868,7 @@ { PyObject *res = NULL; PyObject *method; - size_t size; + Py_ssize_t size; /* Make sure the type is initialized. float gets initialized late */ if (PyType_Ready(Py_TYPE(o)) < 0) @@ -889,15 +889,20 @@ if (res == NULL) return (size_t)-1; - size = PyLong_AsSize_t(res); + size = PyLong_AsSsize_t(res); Py_DECREF(res); - if (size == (size_t)-1 && PyErr_Occurred()) + if (size == -1 && PyErr_Occurred()) return (size_t)-1; + if (size < 0) { + PyErr_SetString(PyExc_ValueError, "__sizeof__() should return >= 0"); + return (size_t)-1; + } + /* add gc_head size */ if (PyObject_IS_GC(o)) - size += sizeof(PyGC_Head); - return size; + return ((size_t)size) + sizeof(PyGC_Head); + return (size_t)size; } static PyObject * -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 13:05:31 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sat, 15 Nov 2014 12:05:31 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyMTkz?= =?utf-8?q?=3A_Fixed_integer_overflow_error_in_sys=2Egetsizeof=28=29=2E?= Message-ID: <20141115120527.57228.93720@psf.io> https://hg.python.org/cpython/rev/3537994fa43b changeset: 93493:3537994fa43b branch: 2.7 parent: 93491:33d68c79d601 user: Serhiy Storchaka date: Sat Nov 15 13:21:01 2014 +0200 summary: Issue #22193: Fixed integer overflow error in sys.getsizeof(). Fixed an error in _PySys_GetSizeOf declaration. 
files: Include/sysmodule.h | 2 +- Lib/test/test_sys.py | 25 +++++++++++++++++++++++++ Python/sysmodule.c | 13 +++++++++---- 3 files changed, 35 insertions(+), 5 deletions(-) diff --git a/Include/sysmodule.h b/Include/sysmodule.h --- a/Include/sysmodule.h +++ b/Include/sysmodule.h @@ -23,7 +23,7 @@ PyAPI_FUNC(void) PySys_AddWarnOption(char *); PyAPI_FUNC(int) PySys_HasWarnOptions(void); -PyAPI_DATA(size_t) _PySys_GetSizeOf(PyObject *); +PyAPI_FUNC(size_t) _PySys_GetSizeOf(PyObject *); #ifdef __cplusplus } diff --git a/Lib/test/test_sys.py b/Lib/test/test_sys.py --- a/Lib/test/test_sys.py +++ b/Lib/test/test_sys.py @@ -494,6 +494,31 @@ # but lists are self.assertEqual(sys.getsizeof([]), size('P PP') + gc_header_size) + def test_errors(self): + class BadSizeof(object): + def __sizeof__(self): + raise ValueError + self.assertRaises(ValueError, sys.getsizeof, BadSizeof()) + + class InvalidSizeof(object): + def __sizeof__(self): + return None + self.assertRaises(TypeError, sys.getsizeof, InvalidSizeof()) + sentinel = ["sentinel"] + self.assertIs(sys.getsizeof(InvalidSizeof(), sentinel), sentinel) + + class OverflowSizeof(int): + def __sizeof__(self): + return int(self) + self.assertEqual(sys.getsizeof(OverflowSizeof(sys.maxsize)), + sys.maxsize + self.gc_headsize) + with self.assertRaises(OverflowError): + sys.getsizeof(OverflowSizeof(sys.maxsize + 1)) + with self.assertRaises(ValueError): + sys.getsizeof(OverflowSizeof(-1)) + with self.assertRaises((ValueError, OverflowError)): + sys.getsizeof(OverflowSizeof(-sys.maxsize - 1)) + def test_default(self): size = test.test_support.calcobjsize self.assertEqual(sys.getsizeof(True, -1), size('l')) diff --git a/Python/sysmodule.c b/Python/sysmodule.c --- a/Python/sysmodule.c +++ b/Python/sysmodule.c @@ -689,7 +689,7 @@ { static PyObject *str__sizeof__ = NULL; PyObject *res = NULL; - size_t size; + Py_ssize_t size; /* Make sure the type is initialized. float gets initialized late */ if (PyType_Ready(Py_TYPE(o)) < 0) @@ -718,14 +718,19 @@ size = (size_t)PyInt_AsSsize_t(res); Py_DECREF(res); - if (size == (size_t)-1 && PyErr_Occurred()) + if (size == -1 && PyErr_Occurred()) return (size_t)-1; } + if (size < 0) { + PyErr_SetString(PyExc_ValueError, "__sizeof__() should return >= 0"); + return (size_t)-1; + } + /* add gc_head size */ if (PyObject_IS_GC(o)) - size += sizeof(PyGC_Head); - return size; + return ((size_t)size) + sizeof(PyGC_Head); + return (size_t)size; } static PyObject * -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 13:05:31 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sat, 15 Nov 2014 12:05:31 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyMTkz?= =?utf-8?q?=3A_Fixed_integer_overflow_error_in_sys=2Egetsizeof=28=29=2E?= Message-ID: <20141115120528.51555.90020@psf.io> https://hg.python.org/cpython/rev/df5c6b05238e changeset: 93494:df5c6b05238e branch: 3.4 parent: 93489:e8182c6c9ef1 user: Serhiy Storchaka date: Sat Nov 15 13:21:37 2014 +0200 summary: Issue #22193: Fixed integer overflow error in sys.getsizeof(). Fixed an error in _PySys_GetSizeOf declaration. 
files: Include/sysmodule.h | 2 +- Lib/test/test_sys.py | 31 +++++++++++++++++++++++++++++++ Python/sysmodule.c | 15 ++++++++++----- 3 files changed, 42 insertions(+), 6 deletions(-) diff --git a/Include/sysmodule.h b/Include/sysmodule.h --- a/Include/sysmodule.h +++ b/Include/sysmodule.h @@ -34,7 +34,7 @@ PyAPI_FUNC(PyObject *) PySys_GetXOptions(void); #ifndef Py_LIMITED_API -PyAPI_DATA(size_t) _PySys_GetSizeOf(PyObject *); +PyAPI_FUNC(size_t) _PySys_GetSizeOf(PyObject *); #endif #ifdef __cplusplus diff --git a/Lib/test/test_sys.py b/Lib/test/test_sys.py --- a/Lib/test/test_sys.py +++ b/Lib/test/test_sys.py @@ -723,6 +723,37 @@ # but lists are self.assertEqual(sys.getsizeof([]), vsize('Pn') + gc_header_size) + def test_errors(self): + class BadSizeof: + def __sizeof__(self): + raise ValueError + self.assertRaises(ValueError, sys.getsizeof, BadSizeof()) + + class InvalidSizeof: + def __sizeof__(self): + return None + self.assertRaises(TypeError, sys.getsizeof, InvalidSizeof()) + sentinel = ["sentinel"] + self.assertIs(sys.getsizeof(InvalidSizeof(), sentinel), sentinel) + + class FloatSizeof: + def __sizeof__(self): + return 4.5 + self.assertRaises(TypeError, sys.getsizeof, FloatSizeof()) + self.assertIs(sys.getsizeof(FloatSizeof(), sentinel), sentinel) + + class OverflowSizeof(int): + def __sizeof__(self): + return int(self) + self.assertEqual(sys.getsizeof(OverflowSizeof(sys.maxsize)), + sys.maxsize + self.gc_headsize) + with self.assertRaises(OverflowError): + sys.getsizeof(OverflowSizeof(sys.maxsize + 1)) + with self.assertRaises(ValueError): + sys.getsizeof(OverflowSizeof(-1)) + with self.assertRaises((ValueError, OverflowError)): + sys.getsizeof(OverflowSizeof(-sys.maxsize - 1)) + def test_default(self): size = test.support.calcvobjsize self.assertEqual(sys.getsizeof(True), size('') + self.longdigit) diff --git a/Python/sysmodule.c b/Python/sysmodule.c --- a/Python/sysmodule.c +++ b/Python/sysmodule.c @@ -868,7 +868,7 @@ { PyObject *res = NULL; PyObject *method; - size_t size; + Py_ssize_t size; /* Make sure the type is initialized. 
float gets initialized late */ if (PyType_Ready(Py_TYPE(o)) < 0) @@ -889,15 +889,20 @@ if (res == NULL) return (size_t)-1; - size = PyLong_AsSize_t(res); + size = PyLong_AsSsize_t(res); Py_DECREF(res); - if (size == (size_t)-1 && PyErr_Occurred()) + if (size == -1 && PyErr_Occurred()) return (size_t)-1; + if (size < 0) { + PyErr_SetString(PyExc_ValueError, "__sizeof__() should return >= 0"); + return (size_t)-1; + } + /* add gc_head size */ if (PyObject_IS_GC(o)) - size += sizeof(PyGC_Head); - return size; + return ((size_t)size) + sizeof(PyGC_Head); + return (size_t)size; } static PyObject * -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 15 19:59:07 2014 From: python-checkins at python.org (raymond.hettinger) Date: Sat, 15 Nov 2014 18:59:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322824=3A__Simplif?= =?utf-8?q?y_reprlib_output_format_for_empty_arrays?= Message-ID: <20141115185907.51553.8157@psf.io> https://hg.python.org/cpython/rev/cf5b910ac4c8 changeset: 93497:cf5b910ac4c8 user: Raymond Hettinger date: Sat Nov 15 10:58:58 2014 -0800 summary: Issue #22824: Simplify reprlib output format for empty arrays files: Lib/reprlib.py | 2 ++ Lib/test/test_reprlib.py | 2 +- Misc/NEWS | 3 +++ 3 files changed, 6 insertions(+), 1 deletions(-) diff --git a/Lib/reprlib.py b/Lib/reprlib.py --- a/Lib/reprlib.py +++ b/Lib/reprlib.py @@ -83,6 +83,8 @@ return self._repr_iterable(x, level, '[', ']', self.maxlist) def repr_array(self, x, level): + if not x: + return "array('%s')" % x.typecode header = "array('%s', [" % x.typecode return self._repr_iterable(x, level, header, '])', self.maxarray) diff --git a/Lib/test/test_reprlib.py b/Lib/test/test_reprlib.py --- a/Lib/test/test_reprlib.py +++ b/Lib/test/test_reprlib.py @@ -94,7 +94,7 @@ eq(r(d), "{'alice': 1, 'arthur': 1, 'bob': 2, 'charles': 3, ...}") # array.array after 5. - eq(r(array('i')), "array('i', [])") + eq(r(array('i')), "array('i')") eq(r(array('i', [1])), "array('i', [1])") eq(r(array('i', [1, 2])), "array('i', [1, 2])") eq(r(array('i', [1, 2, 3])), "array('i', [1, 2, 3])") diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -209,6 +209,9 @@ - Issue #22824: Updated reprlib output format for sets to use set literals. Patch contributed by Berker Peksag. +- Issue #22824: Updated reprlib output format for arrays to display empty + arrays without an unnecessary empty list. Suggested by Serhiy Storchaka. + - Issue #22406: Fixed the uu_codec codec incorrectly ported to 3.x. Based on patch by Martin Panter. 
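The visible effect of the change is small and matches the updated test expectations:

    from array import array
    import reprlib

    reprlib.repr(array('i'))          # now "array('i')"   -- was "array('i', [])"
    reprlib.repr(array('i', [1, 2]))  # unchanged: "array('i', [1, 2])"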
-- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sun Nov 16 10:32:11 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sun, 16 Nov 2014 10:32:11 +0100 Subject: [Python-checkins] Daily reference leaks (cf5b910ac4c8): sum=3 Message-ID: results for cf5b910ac4c8 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogTOSWib', '-x'] From python-checkins at python.org Mon Nov 17 10:26:15 2014 From: python-checkins at python.org (georg.brandl) Date: Mon, 17 Nov 2014 09:26:15 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Update_PEP_479_from_author=2E?= Message-ID: <20141117092613.36970.60096@psf.io> https://hg.python.org/peps/rev/75a785922e8c changeset: 5597:75a785922e8c user: Georg Brandl date: Mon Nov 17 10:26:09 2014 +0100 summary: Update PEP 479 from author. files: pep-0479.txt | 62 +++++++++++++++++++++++++++++++++++---- 1 files changed, 55 insertions(+), 7 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -29,15 +29,27 @@ ``StopIteration`` can be absorbed by the generator construct. +Background information +====================== + +When a generator frame is (re)started as a result of a ``__next__()`` +(or ``send()`` or ``throw()``) call, one of three outcomes can occur: + +* A yield point is reached, and the yielded value is returned. +* The frame is returned from; ``StopIteration`` is raised. +* An exception is thrown, which bubbles out. + + Proposal ======== If a ``StopIteration`` is about to bubble out of a generator frame, it -is replaced with some other exception (maybe ``RuntimeError``, maybe a -new custom ``Exception`` subclass, but *not* deriving from -``StopIteration``) which causes the ``next()`` call (which invoked the -generator) to fail, passing that exception out. From then on it's -just like any old exception. [3]_ +is replaced with ``RuntimeError``, which causes the ``next()`` call +(which invoked the generator) to fail, passing that exception out. +From then on it's just like any old exception. [3]_ + +This affects the third outcome listed above, without altering any +other effects. Consequences to existing code @@ -56,19 +68,38 @@ As this can break code, it is proposed to utilize the ``__future__`` mechanism to introduce this, finally making it standard in Python 3.6 -or 3.7. +or 3.7. Any generator function constructed in the presence of this +directive will have a flag set on its code object, and generators with +the flag set will behave according to this proposal. Once the feature +becomes standard, the flag may be dropped; code should not inspect +generators for it. (GvR: """And the flag should somehow be +transferred to the stack frame when the function is executed, so the +right action can be taken when an exception is about to bubble out of +that frame.""") Alternate proposals =================== +Raising something other than RuntimeError +----------------------------------------- + +Rather than the generic ``RuntimeError``, it might make sense to raise +a new exception type ``UnexpectedStopIteration``. This has the +downside of implicitly encouraging that it be caught; the correct +action is to catch the original ``StopIteration``, not the chained +exception. 
+ + Supplying a specific exception to raise on return ------------------------------------------------- Nick Coghlan suggested a means of providing a specific ``StopIteration`` instance to the generator; if any other instance of ``StopIteration`` is raised, it is an error, but if that particular -one is raised, the generator has properly completed. +one is raised, the generator has properly completed. This subproposal +has been withdrawn in favour of better options, but is retained for +reference. Making return-triggered StopIterations obvious @@ -80,6 +111,23 @@ ``StopIteration`` which can then be detected. If it is not that subclass, it is an escaping exception rather than a return statement. +Of the three outcomes listed above: + +* A yielded value, obviously, would still be returned. +* If the frame is returned from, ``GeneratorReturn`` is raised. +* If an instance of ``GeneratorReturn`` would be raised, instead an + instance of ``StopIteration`` would be raised. + +In the third case, the ``StopIteration`` would have the ``value`` of +the original ``GeneratorReturn``, and would reference the original +exception in its ``__cause__``. If uncaught, this would clearly show +the chaining of exceptions. + +This does *not* affect the discrepancy between generator expressions +and list comprehensions, but allows generator-aware code (such as the +contextlib and asyncio modules) to reliably differentiate between the +second and third outcomes listed above. + Criticism ========= -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Mon Nov 17 10:33:28 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Mon, 17 Nov 2014 10:33:28 +0100 Subject: [Python-checkins] Daily reference leaks (cf5b910ac4c8): sum=3 Message-ID: results for cf5b910ac4c8 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogg835Z8', '-x'] From python-checkins at python.org Mon Nov 17 20:32:23 2014 From: python-checkins at python.org (guido.van.rossum) Date: Mon, 17 Nov 2014 19:32:23 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Make_PEP_479_=28Change_StopIt?= =?utf-8?q?eration=29_be_more_specific=2C_improve_some_wording=2C_etc=2E?= Message-ID: <20141117193159.51559.86606@psf.io> https://hg.python.org/peps/rev/8de949863677 changeset: 5598:8de949863677 user: Guido van Rossum date: Mon Nov 17 11:31:54 2014 -0800 summary: Make PEP 479 (Change StopIteration) be more specific, improve some wording, etc. files: pep-0479.txt | 73 +++++++++++++++++++++++++++++---------- 1 files changed, 53 insertions(+), 20 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -15,8 +15,12 @@ ======== This PEP proposes a semantic change to ``StopIteration`` when raised -inside a generator, unifying the behaviour of list comprehensions and -generator expressions somewhat. +inside a generator. This would unify the behaviour of list +comprehensions and generator expressions, reducing surprises such as +the one that started this discussion [1]_. This is also the main +backwards incompatibility of the proposal -- any generator that +depends on an implicitly-raised ``StopIteration`` to terminate it will +have to be rewritten to either catch that exception or use a for-loop. Rationale @@ -37,7 +41,10 @@ * A yield point is reached, and the yielded value is returned. 
* The frame is returned from; ``StopIteration`` is raised. -* An exception is thrown, which bubbles out. +* An exception is raised, which bubbles out. + +In the latter two cases the frame is abandoned (and the generator +object's ``gi_frame`` attribute is set to None). Proposal @@ -49,33 +56,47 @@ From then on it's just like any old exception. [3]_ This affects the third outcome listed above, without altering any -other effects. +other effects. Furthermore, it only affects this outcome when the +exception raised is StopIteration (or a subclass thereof). +Note that the proposed replacement happens at the point where the +exception is about to bubble out of the frame, i.e. after any +``except`` or ``finally`` blocks that could affect it have been +exited. The ``StopIteration`` raised by returning from the frame is +not affected (the point being that ``StopIteration`` means that the +generator terminated "normally", i.e. it did not raise an exception). -Consequences to existing code -============================= + +Consequences for existing code +============================== This change will affect existing code that depends on ``StopIteration`` bubbling up. The pure Python reference -implementation of ``groupby`` [1]_ currently has comments "Exit on +implementation of ``groupby`` [2]_ currently has comments "Exit on ``StopIteration``" where it is expected that the exception will propagate and then be handled. This will be unusual, but not unknown, -and such constructs will fail. +and such constructs will fail. Other examples abound, e.g. [5]_, [6]_. (Nick Coghlan comments: """If you wanted to factor out a helper function that terminated the generator you'd have to do "return yield from helper()" rather than just "helper()".""") +There are also examples of generator expressions floating around that +rely on a StopIteration raised by the expression, the target or the +predicate (rather than by the __next__() call implied in the ``for`` +loop proper). + As this can break code, it is proposed to utilize the ``__future__`` -mechanism to introduce this, finally making it standard in Python 3.6 -or 3.7. Any generator function constructed in the presence of this -directive will have a flag set on its code object, and generators with -the flag set will behave according to this proposal. Once the feature -becomes standard, the flag may be dropped; code should not inspect -generators for it. (GvR: """And the flag should somehow be -transferred to the stack frame when the function is executed, so the -right action can be taken when an exception is about to bubble out of -that frame.""") +mechanism to introduce this in Python 3.5, finally making it standard +in Python 3.6 or 3.7. The proposed syntax is:: + + from __future__ import replace_stopiteration_in_generators + +Any generator function constructed under the influence of this +directive will have the REPLACE_STOPITERATION flag set on its code +object, and generators with the flag set will behave according to this +proposal. Once the feature becomes standard, the flag may be dropped; +code should not inspect generators for it. Alternate proposals @@ -123,19 +144,25 @@ exception in its ``__cause__``. If uncaught, this would clearly show the chaining of exceptions. 
-This does *not* affect the discrepancy between generator expressions +This alternative does *not* affect the discrepancy between generator expressions and list comprehensions, but allows generator-aware code (such as the contextlib and asyncio modules) to reliably differentiate between the second and third outcomes listed above. +However, once code exists that depends on this distinction between +``GeneratorReturn`` and ``StopIteration``, a generator that invokes +another generator and relies on the latter's ``StopIteration`` to +bubble out would still be potentially wrong, depending on the use made +of the distinction between the two exception types. + Criticism ========= Unofficial and apocryphal statistics suggest that this is seldom, if ever, a problem. [4]_ Code does exist which relies on the current -behaviour, and there is the concern that this would be unnecessary -code churn to achieve little or no gain. +behaviour (e.g. [2]_, [5]_, [6]_), and there is the concern that this +would be unnecessary code churn to achieve little or no gain. References @@ -153,6 +180,12 @@ .. [4] Response by Steven D'Aprano (https://mail.python.org/pipermail/python-ideas/2014-November/029994.html) +.. [5] Split a sequence or generator using a predicate + (http://code.activestate.com/recipes/578416-split-a-sequence-or-generator-using-a-predicate/) + +.. [6] wrap unbounded generator to restrict its output + (http://code.activestate.com/recipes/66427-wrap-unbounded-generator-to-restrict-its-output/) + Copyright ========= -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Mon Nov 17 21:16:35 2014 From: python-checkins at python.org (guido.van.rossum) Date: Mon, 17 Nov 2014 20:16:35 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_more_words_to_GeneratorRe?= =?utf-8?q?turn_alternative=2E?= Message-ID: <20141117201550.57220.78035@psf.io> https://hg.python.org/peps/rev/d71f1c9cd084 changeset: 5599:d71f1c9cd084 user: Guido van Rossum date: Mon Nov 17 12:15:42 2014 -0800 summary: Add more words to GeneratorReturn alternative. files: pep-0479.txt | 27 +++++++++++++++++++++------ 1 files changed, 21 insertions(+), 6 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -129,8 +129,18 @@ For certain situations, a simpler and fully backward-compatible solution may be sufficient: when a generator returns, instead of raising ``StopIteration``, it raises a specific subclass of -``StopIteration`` which can then be detected. If it is not that -subclass, it is an escaping exception rather than a return statement. +``StopIteration`` (``GeneratorReturn``) which can then be detected. +If it is not that subclass, it is an escaping exception rather than a +return statement. + +The inspiration for this alternative proposal was Nick's observation +[7]_ that if an ``asyncio`` coroutine [8]_ accidentally raises +``StopIteration``, it currently terminates silently, which may present +a hard-to-debug mystery to the developer. The main proposal turns +such accidents in clearly distinguishable ``RuntimeError`` exceptions, +but if that is rejected, this alternate proposal would enable +``asyncio`` to distinguish between a ``return`` statement and an +accidentally-raised ``StopIteration`` exception. Of the three outcomes listed above: @@ -144,10 +154,10 @@ exception in its ``__cause__``. If uncaught, this would clearly show the chaining of exceptions. 
-This alternative does *not* affect the discrepancy between generator expressions -and list comprehensions, but allows generator-aware code (such as the -contextlib and asyncio modules) to reliably differentiate between the -second and third outcomes listed above. +This alternative does *not* affect the discrepancy between generator +expressions and list comprehensions, but allows generator-aware code +(such as the ``contextlib`` and ``asyncio`` modules) to reliably +differentiate between the second and third outcomes listed above. However, once code exists that depends on this distinction between ``GeneratorReturn`` and ``StopIteration``, a generator that invokes @@ -186,6 +196,11 @@ .. [6] wrap unbounded generator to restrict its output (http://code.activestate.com/recipes/66427-wrap-unbounded-generator-to-restrict-its-output/) +.. [7] Post from Nick Coghlan mentioning asyncio + (https://mail.python.org/pipermail/python-ideas/2014-November/029961.html) + +.. [8] Coroutines in asyncio + (https://docs.python.org/3/library/asyncio-task.html#coroutines) Copyright ========= -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Mon Nov 17 22:50:53 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 17 Nov 2014 21:50:53 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2320662=3A_Argspec_now_is_escaped_in_html_output_?= =?utf-8?q?of_pydoc=2E?= Message-ID: <20141117215051.51549.3811@psf.io> https://hg.python.org/cpython/rev/1855b5c3da61 changeset: 93499:1855b5c3da61 parent: 93497:cf5b910ac4c8 parent: 93498:cf2e424e0413 user: Serhiy Storchaka date: Mon Nov 17 23:48:35 2014 +0200 summary: Issue #20662: Argspec now is escaped in html output of pydoc. files: Lib/pydoc.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -954,7 +954,7 @@ if not argspec: argspec = '(...)' - decl = title + argspec + (note and self.grey( + decl = title + self.escape(argspec) + (note and self.grey( '%s' % note)) if skipdocs: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 17 22:50:53 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Mon, 17 Nov 2014 21:50:53 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIwNjYy?= =?utf-8?q?=3A_Argspec_now_is_escaped_in_html_output_of_pydoc=2E?= Message-ID: <20141117215051.57218.99105@psf.io> https://hg.python.org/cpython/rev/cf2e424e0413 changeset: 93498:cf2e424e0413 branch: 3.4 parent: 93494:df5c6b05238e user: Serhiy Storchaka date: Mon Nov 17 23:48:02 2014 +0200 summary: Issue #20662: Argspec now is escaped in html output of pydoc. 
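The escaping matters whenever a rendered argspec contains HTML-special characters, for example a default value whose repr includes angle brackets. A standalone sketch of the idea, using html.escape in place of pydoc's internal helper (the example signature is invented):

    from html import escape

    argspec = "(dump=<built-in function dumps>, *, indent=None)"
    print(escape(argspec))
    # (dump=&lt;built-in function dumps&gt;, *, indent=None)

Without the escaping, such text would be interpreted as markup in pydoc's HTML output.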
files: Lib/pydoc.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -956,7 +956,7 @@ if not argspec: argspec = '(...)' - decl = title + argspec + (note and self.grey( + decl = title + self.escape(argspec) + (note and self.grey( '%s' % note)) if skipdocs: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 01:12:33 2014 From: python-checkins at python.org (guido.van.rossum) Date: Tue, 18 Nov 2014 00:12:33 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_link_to_survey_by_Steven_?= =?utf-8?q?D=2C_and_summarize_the_two_responses_so_far=2E?= Message-ID: <20141118001230.62766.45608@psf.io> https://hg.python.org/peps/rev/7f846f74013f changeset: 5600:7f846f74013f user: Guido van Rossum date: Mon Nov 17 16:12:26 2014 -0800 summary: Add link to survey by Steven D, and summarize the two responses so far. files: pep-0479.txt | 8 ++++++++ 1 files changed, 8 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -174,6 +174,11 @@ behaviour (e.g. [2]_, [5]_, [6]_), and there is the concern that this would be unnecessary code churn to achieve little or no gain. +Steven D'Aprano started an informal survey on comp.lang.python [9]_; +at the time of writing only two responses have been received: one was +in favor of changing list comprehensions to match generator +expressions (!), the other was in favor of this PEP's main proposal. + References ========== @@ -202,6 +207,9 @@ .. [8] Coroutines in asyncio (https://docs.python.org/3/library/asyncio-task.html#coroutines) +.. [9] Thread on comp.lang.python started by Steven D'Aprano + (https://mail.python.org/pipermail/python-list/2014-November/680757.html) + Copyright ========= -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Tue Nov 18 10:33:46 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Tue, 18 Nov 2014 10:33:46 +0100 Subject: [Python-checkins] Daily reference leaks (1855b5c3da61): sum=9 Message-ID: results for 1855b5c3da61 on branch "default" -------------------------------------------- test_collections leaked [0, 0, 4] references, sum=4 test_collections leaked [0, 0, 2] memory blocks, sum=2 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogiR2Ijf', '-x'] From python-checkins at python.org Tue Nov 18 16:48:58 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 15:48:58 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE4NjM3?= =?utf-8?q?=3A_Fixed_an_error_in_=5FPyNode=5FSizeOf_declaration=2E?= Message-ID: <20141118153731.62762.13581@psf.io> https://hg.python.org/cpython/rev/ab3e8aab7119 changeset: 93501:ab3e8aab7119 branch: 3.4 parent: 93498:cf2e424e0413 user: Serhiy Storchaka date: Tue Nov 18 17:30:15 2014 +0200 summary: Issue #18637: Fixed an error in _PyNode_SizeOf declaration. Patch by Roumen Petrov. 
files: Include/node.h | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Include/node.h b/Include/node.h --- a/Include/node.h +++ b/Include/node.h @@ -21,7 +21,7 @@ char *str, int lineno, int col_offset); PyAPI_FUNC(void) PyNode_Free(node *n); #ifndef Py_LIMITED_API -Py_ssize_t _PyNode_SizeOf(node *n); +PyAPI_FUNC(Py_ssize_t) _PyNode_SizeOf(node *n); #endif /* Node access functions */ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 16:48:58 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 15:48:58 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE4NjM3?= =?utf-8?q?=3A_Fixed_an_error_in_=5FPyNode=5FSizeOf_declaration=2E?= Message-ID: <20141118153731.36065.81873@psf.io> https://hg.python.org/cpython/rev/eb25629d2a46 changeset: 93500:eb25629d2a46 branch: 2.7 parent: 93493:3537994fa43b user: Serhiy Storchaka date: Tue Nov 18 17:29:47 2014 +0200 summary: Issue #18637: Fixed an error in _PyNode_SizeOf declaration. Patch by Roumen Petrov. files: Include/node.h | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Include/node.h b/Include/node.h --- a/Include/node.h +++ b/Include/node.h @@ -20,7 +20,7 @@ PyAPI_FUNC(int) PyNode_AddChild(node *n, int type, char *str, int lineno, int col_offset); PyAPI_FUNC(void) PyNode_Free(node *n); -Py_ssize_t _PyNode_SizeOf(node *n); +PyAPI_FUNC(Py_ssize_t) _PyNode_SizeOf(node *n); /* Node access functions */ #define NCH(n) ((n)->n_nchildren) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 16:48:58 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 15:48:58 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2318637=3A_Fixed_an_error_in_=5FPyNode=5FSizeOf_d?= =?utf-8?q?eclaration=2E?= Message-ID: <20141118153731.109150.60900@psf.io> https://hg.python.org/cpython/rev/0f663e0ce1d3 changeset: 93502:0f663e0ce1d3 parent: 93499:1855b5c3da61 parent: 93501:ab3e8aab7119 user: Serhiy Storchaka date: Tue Nov 18 17:30:50 2014 +0200 summary: Issue #18637: Fixed an error in _PyNode_SizeOf declaration. Patch by Roumen Petrov. 
files: Include/node.h | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Include/node.h b/Include/node.h --- a/Include/node.h +++ b/Include/node.h @@ -21,7 +21,7 @@ char *str, int lineno, int col_offset); PyAPI_FUNC(void) PyNode_Free(node *n); #ifndef Py_LIMITED_API -Py_ssize_t _PyNode_SizeOf(node *n); +PyAPI_FUNC(Py_ssize_t) _PyNode_SizeOf(node *n); #endif /* Node access functions */ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 21:41:01 2014 From: python-checkins at python.org (victor.stinner) Date: Tue, 18 Nov 2014 20:41:01 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2320948=3A_Inline_m?= =?utf-8?q?akefmt=28=29_in_unicode=5Ffromformat=5Farg=28=29?= Message-ID: <20141118204100.13371.66628@psf.io> https://hg.python.org/cpython/rev/d6d2549340cb changeset: 93503:d6d2549340cb user: Victor Stinner date: Tue Nov 18 21:40:51 2014 +0100 summary: Issue #20948: Inline makefmt() in unicode_fromformat_arg() files: Objects/unicodeobject.c | 53 ++++------------------------ 1 files changed, 9 insertions(+), 44 deletions(-) diff --git a/Objects/unicodeobject.c b/Objects/unicodeobject.c --- a/Objects/unicodeobject.c +++ b/Objects/unicodeobject.c @@ -2313,35 +2313,6 @@ #endif /* HAVE_WCHAR_H */ -static void -makefmt(char *fmt, int longflag, int longlongflag, int size_tflag, - char c) -{ - *fmt++ = '%'; - if (longflag) - *fmt++ = 'l'; - else if (longlongflag) { - /* longlongflag should only ever be nonzero on machines with - HAVE_LONG_LONG defined */ -#ifdef HAVE_LONG_LONG - char *f = PY_FORMAT_LONG_LONG; - while (*f) - *fmt++ = *f++; -#else - /* we shouldn't ever get here */ - assert(0); - *fmt++ = 'l'; -#endif - } - else if (size_tflag) { - char *f = PY_FORMAT_SIZE_T; - while (*f) - *fmt++ = *f++; - } - *fmt++ = c; - *fmt = '\0'; -} - /* maximum number of characters required for output of %lld or %p. We need at most ceil(log10(256)*SIZEOF_LONG_LONG) digits, plus 1 for the sign. 53/22 is an upper bound for log10(256). 
*/ @@ -2517,48 +2488,42 @@ case 'x': { /* used by sprintf */ - char fmt[10]; /* should be enough for "%0lld\0" */ char buffer[MAX_LONG_LONG_CHARS]; Py_ssize_t arglen; if (*f == 'u') { - makefmt(fmt, longflag, longlongflag, size_tflag, *f); - if (longflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%lu", va_arg(*vargs, unsigned long)); #ifdef HAVE_LONG_LONG else if (longlongflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%" PY_FORMAT_LONG_LONG "u", va_arg(*vargs, unsigned PY_LONG_LONG)); #endif else if (size_tflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%" PY_FORMAT_SIZE_T "u", va_arg(*vargs, size_t)); else - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%u", va_arg(*vargs, unsigned int)); } else if (*f == 'x') { - makefmt(fmt, 0, 0, 0, 'x'); - len = sprintf(buffer, fmt, va_arg(*vargs, int)); + len = sprintf(buffer, "%x", va_arg(*vargs, int)); } else { - makefmt(fmt, longflag, longlongflag, size_tflag, *f); - if (longflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%li", va_arg(*vargs, long)); #ifdef HAVE_LONG_LONG else if (longlongflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%" PY_FORMAT_LONG_LONG "i", va_arg(*vargs, PY_LONG_LONG)); #endif else if (size_tflag) - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%" PY_FORMAT_SIZE_T "i", va_arg(*vargs, Py_ssize_t)); else - len = sprintf(buffer, fmt, + len = sprintf(buffer, "%i", va_arg(*vargs, int)); } assert(len >= 0); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 22:36:55 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 21:36:55 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322453=3A_Removed_?= =?utf-8?q?non-documented_macro_PyObject=5FREPR=28=29=2E?= Message-ID: <20141118213642.113284.70690@psf.io> https://hg.python.org/cpython/rev/e339d75a21d5 changeset: 93504:e339d75a21d5 user: Serhiy Storchaka date: Tue Nov 18 23:34:33 2014 +0200 summary: Issue #22453: Removed non-documented macro PyObject_REPR(). files: Doc/whatsnew/3.5.rst | 4 ++++ Include/object.h | 3 --- Misc/NEWS | 2 ++ Python/compile.c | 20 ++++++++++---------- 4 files changed, 16 insertions(+), 13 deletions(-) diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -441,3 +441,7 @@ * The :c:type:`PyMemAllocator` structure was renamed to :c:type:`PyMemAllocatorEx` and a new ``calloc`` field was added. + +* Removed non-documented macro :c:macro:`PyObject_REPR` which leaked references. + Use format character ``%R`` in :c:func:`PyUnicode_FromFormat`-like functions + to format the :func:`repr` of the object. diff --git a/Include/object.h b/Include/object.h --- a/Include/object.h +++ b/Include/object.h @@ -575,9 +575,6 @@ PyAPI_FUNC(int) Py_ReprEnter(PyObject *); PyAPI_FUNC(void) Py_ReprLeave(PyObject *); -/* Helper for passing objects to printf and the like */ -#define PyObject_REPR(obj) _PyUnicode_AsString(PyObject_Repr(obj)) - /* Flag bits for printing: */ #define Py_PRINT_RAW 1 /* No string quotes etc. */ diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -1256,6 +1256,8 @@ C API ----- +- Issue #22453: Removed non-documented macro PyObject_REPR(). + - Issue #18395: Rename ``_Py_char2wchar()`` to :c:func:`Py_DecodeLocale`, rename ``_Py_wchar2char()`` to :c:func:`Py_EncodeLocale`, and document these functions. 
diff --git a/Python/compile.c b/Python/compile.c --- a/Python/compile.c +++ b/Python/compile.c @@ -1414,12 +1414,12 @@ PyOS_snprintf(buf, sizeof(buf), "unknown scope for %.100s in %.100s(%s)\n" "symbols: %s\nlocals: %s\nglobals: %s", - PyBytes_AS_STRING(name), - PyBytes_AS_STRING(c->u->u_name), - PyObject_REPR(c->u->u_ste->ste_id), - PyObject_REPR(c->u->u_ste->ste_symbols), - PyObject_REPR(c->u->u_varnames), - PyObject_REPR(c->u->u_names) + PyUnicode_AsUTF8(name), + PyUnicode_AsUTF8(c->u->u_name), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_ste->ste_id)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_ste->ste_symbols)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_varnames)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_names)) ); Py_FatalError(buf); } @@ -1476,11 +1476,11 @@ fprintf(stderr, "lookup %s in %s %d %d\n" "freevars of %s: %s\n", - PyObject_REPR(name), - PyBytes_AS_STRING(c->u->u_name), + PyUnicode_AsUTF8(PyObject_Repr(name)), + PyUnicode_AsUTF8(c->u->u_name), reftype, arg, - _PyUnicode_AsString(co->co_name), - PyObject_REPR(co->co_freevars)); + PyUnicode_AsUTF8(co->co_name), + PyUnicode_AsUTF8(PyObject_Repr(co->co_freevars))); Py_FatalError("compiler_make_closure()"); } ADDOP_I(c, LOAD_CLOSURE, arg); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 23:17:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 22:17:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Null_merge?= Message-ID: <20141118221720.113306.9958@psf.io> https://hg.python.org/cpython/rev/902dbf99fc28 changeset: 93507:902dbf99fc28 parent: 93504:e339d75a21d5 parent: 93505:342a619cdafb user: Serhiy Storchaka date: Wed Nov 19 00:13:24 2014 +0200 summary: Null merge files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 23:17:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 22:17:27 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNDUz?= =?utf-8?q?=3A_Warn_against_the_use_of_leaking_macro_PyObject=5FREPR=28=29?= =?utf-8?q?=2E?= Message-ID: <20141118221720.36061.17668@psf.io> https://hg.python.org/cpython/rev/342a619cdafb changeset: 93505:342a619cdafb branch: 3.4 parent: 93501:ab3e8aab7119 user: Serhiy Storchaka date: Wed Nov 19 00:08:38 2014 +0200 summary: Issue #22453: Warn against the use of leaking macro PyObject_REPR(). files: Include/object.h | 8 ++++++-- Python/compile.c | 20 ++++++++++---------- 2 files changed, 16 insertions(+), 12 deletions(-) diff --git a/Include/object.h b/Include/object.h --- a/Include/object.h +++ b/Include/object.h @@ -572,8 +572,12 @@ PyAPI_FUNC(int) Py_ReprEnter(PyObject *); PyAPI_FUNC(void) Py_ReprLeave(PyObject *); -/* Helper for passing objects to printf and the like */ -#define PyObject_REPR(obj) _PyUnicode_AsString(PyObject_Repr(obj)) +#ifndef Py_LIMITED_API +/* Helper for passing objects to printf and the like. + Leaks refcounts. Don't use it! +*/ +#define PyObject_REPR(obj) PyUnicode_AsUTF8(PyObject_Repr(obj)) +#endif /* Flag bits for printing: */ #define Py_PRINT_RAW 1 /* No string quotes etc. 
*/ diff --git a/Python/compile.c b/Python/compile.c --- a/Python/compile.c +++ b/Python/compile.c @@ -1412,12 +1412,12 @@ PyOS_snprintf(buf, sizeof(buf), "unknown scope for %.100s in %.100s(%s)\n" "symbols: %s\nlocals: %s\nglobals: %s", - PyBytes_AS_STRING(name), - PyBytes_AS_STRING(c->u->u_name), - PyObject_REPR(c->u->u_ste->ste_id), - PyObject_REPR(c->u->u_ste->ste_symbols), - PyObject_REPR(c->u->u_varnames), - PyObject_REPR(c->u->u_names) + PyUnicode_AsUTF8(name), + PyUnicode_AsUTF8(c->u->u_name), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_ste->ste_id)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_ste->ste_symbols)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_varnames)), + PyUnicode_AsUTF8(PyObject_Repr(c->u->u_names)) ); Py_FatalError(buf); } @@ -1474,11 +1474,11 @@ fprintf(stderr, "lookup %s in %s %d %d\n" "freevars of %s: %s\n", - PyObject_REPR(name), - PyBytes_AS_STRING(c->u->u_name), + PyUnicode_AsUTF8(PyObject_Repr(name)), + PyUnicode_AsUTF8(c->u->u_name), reftype, arg, - _PyUnicode_AsString(co->co_name), - PyObject_REPR(co->co_freevars)); + PyUnicode_AsUTF8(co->co_name), + PyUnicode_AsUTF8(PyObject_Repr(co->co_freevars))); Py_FatalError("compiler_make_closure()"); } ADDOP_I(c, LOAD_CLOSURE, arg); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 18 23:17:27 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 18 Nov 2014 22:17:27 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNDUz?= =?utf-8?q?=3A_Fexed_reference_leaks_when_format_error_messages_in_ceval?= =?utf-8?b?LmMu?= Message-ID: <20141118221720.62756.49480@psf.io> https://hg.python.org/cpython/rev/6e26b5291c41 changeset: 93506:6e26b5291c41 branch: 2.7 parent: 93500:eb25629d2a46 user: Serhiy Storchaka date: Wed Nov 19 00:11:05 2014 +0200 summary: Issue #22453: Fexed reference leaks when format error messages in ceval.c. Warn against the use of leaking macro PyObject_REPR(). files: Include/object.h | 4 +++- Python/ceval.c | 20 ++++++++++++++++---- Python/compile.c | 12 ++++++------ 3 files changed, 25 insertions(+), 11 deletions(-) diff --git a/Include/object.h b/Include/object.h --- a/Include/object.h +++ b/Include/object.h @@ -527,7 +527,9 @@ PyAPI_DATA(int) _Py_HashSecret_Initialized; #endif -/* Helper for passing objects to printf and the like */ +/* Helper for passing objects to printf and the like. + Leaks refcounts. Don't use it! 
+*/ #define PyObject_REPR(obj) PyString_AS_STRING(PyObject_Repr(obj)) /* Flag bits for printing: */ diff --git a/Python/ceval.c b/Python/ceval.c --- a/Python/ceval.c +++ b/Python/ceval.c @@ -1957,9 +1957,13 @@ if (err == 0) continue; break; } + t = PyObject_Repr(w); + if (t == NULL) + break; PyErr_Format(PyExc_SystemError, "no locals found when storing %s", - PyObject_REPR(w)); + PyString_AS_STRING(t)); + Py_DECREF(t); break; case DELETE_NAME: @@ -1971,9 +1975,13 @@ w); break; } + t = PyObject_Repr(w); + if (t == NULL) + break; PyErr_Format(PyExc_SystemError, "no locals when deleting %s", - PyObject_REPR(w)); + PyString_AS_STRING(w)); + Py_DECREF(t); break; PREDICTED_WITH_ARG(UNPACK_SEQUENCE); @@ -2046,10 +2054,14 @@ case LOAD_NAME: w = GETITEM(names, oparg); if ((v = f->f_locals) == NULL) { + why = WHY_EXCEPTION; + t = PyObject_Repr(w); + if (t == NULL) + break; PyErr_Format(PyExc_SystemError, "no locals when loading %s", - PyObject_REPR(w)); - why = WHY_EXCEPTION; + PyString_AS_STRING(w)); + Py_DECREF(t); break; } if (PyDict_CheckExact(v)) { diff --git a/Python/compile.c b/Python/compile.c --- a/Python/compile.c +++ b/Python/compile.c @@ -1271,11 +1271,11 @@ "symbols: %s\nlocals: %s\nglobals: %s", PyString_AS_STRING(name), PyString_AS_STRING(c->u->u_name), - PyObject_REPR(c->u->u_ste->ste_id), + PyString_AS_STRING(PyObject_Repr(c->u->u_ste->ste_id)), c->c_filename, - PyObject_REPR(c->u->u_ste->ste_symbols), - PyObject_REPR(c->u->u_varnames), - PyObject_REPR(c->u->u_names) + PyString_AS_STRING(PyObject_Repr(c->u->u_ste->ste_symbols)), + PyString_AS_STRING(PyObject_Repr(c->u->u_varnames)), + PyString_AS_STRING(PyObject_Repr(c->u->u_names)) ); Py_FatalError(buf); } @@ -1327,11 +1327,11 @@ if (arg == -1) { printf("lookup %s in %s %d %d\n" "freevars of %s: %s\n", - PyObject_REPR(name), + PyString_AS_STRING(PyObject_Repr(name)), PyString_AS_STRING(c->u->u_name), reftype, arg, PyString_AS_STRING(co->co_name), - PyObject_REPR(co->co_freevars)); + PyString_AS_STRING(PyObject_Repr(co->co_freevars))); Py_FatalError("compiler_make_closure()"); } ADDOP_I(c, LOAD_CLOSURE, arg); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 00:33:44 2014 From: python-checkins at python.org (antoine.pitrou) Date: Tue, 18 Nov 2014 23:33:44 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogQ2xvc2UgIzIyMzcw?= =?utf-8?q?=3A_Windows_detection_in_pathlib_is_now_more_robust=2E?= Message-ID: <20141118233314.13357.78035@psf.io> https://hg.python.org/cpython/rev/cb1d7eac601d changeset: 93508:cb1d7eac601d branch: 3.4 parent: 93505:342a619cdafb user: Antoine Pitrou date: Wed Nov 19 00:32:08 2014 +0100 summary: Close #22370: Windows detection in pathlib is now more robust. 
files: Lib/pathlib.py | 9 ++++----- Misc/NEWS | 2 ++ 2 files changed, 6 insertions(+), 5 deletions(-) diff --git a/Lib/pathlib.py b/Lib/pathlib.py --- a/Lib/pathlib.py +++ b/Lib/pathlib.py @@ -15,16 +15,15 @@ supports_symlinks = True -try: +if os.name == 'nt': import nt -except ImportError: - nt = None -else: if sys.getwindowsversion()[:2] >= (6, 0): from nt import _getfinalpathname else: supports_symlinks = False _getfinalpathname = None +else: + nt = None __all__ = [ @@ -110,7 +109,7 @@ has_drv = True pathmod = ntpath - is_supported = (nt is not None) + is_supported = (os.name == 'nt') drive_letters = ( set(chr(x) for x in range(ord('a'), ord('z') + 1)) | diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22370: Windows detection in pathlib is now more robust. + - Issue #22841: Reject coroutines in asyncio add_signal_handler(). Patch by Ludovic.Gasc. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 00:33:44 2014 From: python-checkins at python.org (antoine.pitrou) Date: Tue, 18 Nov 2014 23:33:44 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Close_=2322370=3A_Windows_detection_in_pathlib_is_now_mo?= =?utf-8?q?re_robust=2E?= Message-ID: <20141118233315.36037.72921@psf.io> https://hg.python.org/cpython/rev/712f246da49b changeset: 93509:712f246da49b parent: 93507:902dbf99fc28 parent: 93508:cb1d7eac601d user: Antoine Pitrou date: Wed Nov 19 00:33:08 2014 +0100 summary: Close #22370: Windows detection in pathlib is now more robust. files: Lib/pathlib.py | 9 ++++----- Misc/NEWS | 2 ++ 2 files changed, 6 insertions(+), 5 deletions(-) diff --git a/Lib/pathlib.py b/Lib/pathlib.py --- a/Lib/pathlib.py +++ b/Lib/pathlib.py @@ -15,16 +15,15 @@ supports_symlinks = True -try: +if os.name == 'nt': import nt -except ImportError: - nt = None -else: if sys.getwindowsversion()[:2] >= (6, 0): from nt import _getfinalpathname else: supports_symlinks = False _getfinalpathname = None +else: + nt = None __all__ = [ @@ -110,7 +109,7 @@ has_drv = True pathmod = ntpath - is_supported = (nt is not None) + is_supported = (os.name == 'nt') drive_letters = ( set(chr(x) for x in range(ord('a'), ord('z') + 1)) | diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -185,6 +185,8 @@ Library ------- +- Issue #22370: Windows detection in pathlib is now more robust. + - Issue #22841: Reject coroutines in asyncio add_signal_handler(). Patch by Ludovic.Gasc. 
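A short editorial sketch of the robustness point behind the pathlib change above; the helper names are invented, and the "old" variant is only meant to show how an importability test differs from checking ``os.name``, which is fixed by the interpreter build:

    import os

    def _looks_like_windows_old():
        try:
            import nt          # also succeeds if a stray module named "nt" is importable
        except ImportError:
            return False
        return True

    def _looks_like_windows_new():
        return os.name == 'nt'     # true only for the native Windows build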
-- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Wed Nov 19 10:33:28 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Wed, 19 Nov 2014 10:33:28 +0100 Subject: [Python-checkins] Daily reference leaks (712f246da49b): sum=5 Message-ID: results for 712f246da49b on branch "default" -------------------------------------------- test_collections leaked [2, 0, 0] references, sum=2 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogTFWDlr', '-x'] From python-checkins at python.org Wed Nov 19 11:36:39 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Wed, 19 Nov 2014 10:36:39 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2320604=3A_Added_missed_invalid_mode_in_error_mes?= =?utf-8?q?sage_of_socket=2Emakefile=28=29=2E?= Message-ID: <20141119103628.36045.90635@psf.io> https://hg.python.org/cpython/rev/d5b36edeecdb changeset: 93511:d5b36edeecdb parent: 93509:712f246da49b parent: 93510:34c7be03259b user: Serhiy Storchaka date: Wed Nov 19 12:34:07 2014 +0200 summary: Issue #20604: Added missed invalid mode in error message of socket.makefile(). Based on patch by Franck Michea. files: Lib/socket.py | 5 ++--- 1 files changed, 2 insertions(+), 3 deletions(-) diff --git a/Lib/socket.py b/Lib/socket.py --- a/Lib/socket.py +++ b/Lib/socket.py @@ -209,9 +209,8 @@ except the only mode characters supported are 'r', 'w' and 'b'. The semantics are similar too. (XXX refactor to share code?) """ - for c in mode: - if c not in {"r", "w", "b"}: - raise ValueError("invalid mode %r (only r, w, b allowed)") + if not set(mode) <= {"r", "w", "b"}: + raise ValueError("invalid mode %r (only r, w, b allowed)" % (mode,)) writing = "w" in mode reading = "r" in mode or not writing assert reading or writing -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 11:36:39 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Wed, 19 Nov 2014 10:36:39 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIwNjA0?= =?utf-8?q?=3A_Added_missed_invalid_mode_in_error_message_of_socket=2Emake?= =?utf-8?b?ZmlsZSgpLg==?= Message-ID: <20141119103628.109146.47390@psf.io> https://hg.python.org/cpython/rev/34c7be03259b changeset: 93510:34c7be03259b branch: 3.4 parent: 93508:cb1d7eac601d user: Serhiy Storchaka date: Wed Nov 19 12:33:40 2014 +0200 summary: Issue #20604: Added missed invalid mode in error message of socket.makefile(). Based on patch by Franck Michea. files: Lib/socket.py | 5 ++--- 1 files changed, 2 insertions(+), 3 deletions(-) diff --git a/Lib/socket.py b/Lib/socket.py --- a/Lib/socket.py +++ b/Lib/socket.py @@ -201,9 +201,8 @@ except the only mode characters supported are 'r', 'w' and 'b'. The semantics are similar too. (XXX refactor to share code?) 
""" - for c in mode: - if c not in {"r", "w", "b"}: - raise ValueError("invalid mode %r (only r, w, b allowed)") + if not set(mode) <= {"r", "w", "b"}: + raise ValueError("invalid mode %r (only r, w, b allowed)" % (mode,)) writing = "w" in mode reading = "r" in mode or not writing assert reading or writing -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 12:24:41 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Wed, 19 Nov 2014 11:24:41 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIwNzM2?= =?utf-8?q?=3A_testSendmsgDontWait_in_test=5Fsocket_no_longer_skipped_on_L?= =?utf-8?q?inux=2E?= Message-ID: <20141119112401.113284.42225@psf.io> https://hg.python.org/cpython/rev/fb06c8ccfd41 changeset: 93512:fb06c8ccfd41 branch: 3.4 parent: 93510:34c7be03259b user: Serhiy Storchaka date: Wed Nov 19 13:21:13 2014 +0200 summary: Issue #20736: testSendmsgDontWait in test_socket no longer skipped on Linux. Patch by David Watson. files: Lib/test/test_socket.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -2216,7 +2216,7 @@ # Linux supports MSG_DONTWAIT when sending, but in general, it # only works when receiving. Could add other platforms if they # support it too. - @skipWithClientIf(sys.platform not in {"linux2"}, + @skipWithClientIf(sys.platform not in {"linux"}, "MSG_DONTWAIT not known to work on this platform when " "sending") def testSendmsgDontWait(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 12:24:41 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Wed, 19 Nov 2014 11:24:41 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2320736=3A_testSendmsgDontWait_in_test=5Fsocket_n?= =?utf-8?q?o_longer_skipped_on_Linux=2E?= Message-ID: <20141119112401.62748.68851@psf.io> https://hg.python.org/cpython/rev/23ab1197df0b changeset: 93513:23ab1197df0b parent: 93511:d5b36edeecdb parent: 93512:fb06c8ccfd41 user: Serhiy Storchaka date: Wed Nov 19 13:21:40 2014 +0200 summary: Issue #20736: testSendmsgDontWait in test_socket no longer skipped on Linux. Patch by David Watson. files: Lib/test/test_socket.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_socket.py b/Lib/test/test_socket.py --- a/Lib/test/test_socket.py +++ b/Lib/test/test_socket.py @@ -2221,7 +2221,7 @@ # Linux supports MSG_DONTWAIT when sending, but in general, it # only works when receiving. Could add other platforms if they # support it too. 
- @skipWithClientIf(sys.platform not in {"linux2"}, + @skipWithClientIf(sys.platform not in {"linux"}, "MSG_DONTWAIT not known to work on this platform when " "sending") def testSendmsgDontWait(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 19 12:35:29 2014 From: python-checkins at python.org (nick.coghlan) Date: Wed, 19 Nov 2014 11:35:29 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_458=3A_remove_Windows_lin?= =?utf-8?q?e_endings?= Message-ID: <20141119113452.109164.4115@psf.io> https://hg.python.org/peps/rev/e467ef442506 changeset: 5601:e467ef442506 user: Nick Coghlan date: Wed Nov 19 21:34:40 2014 +1000 summary: PEP 458: remove Windows line endings files: pep-0458.txt | 2166 +++++++++++++++++++------------------- 1 files changed, 1083 insertions(+), 1083 deletions(-) diff --git a/pep-0458.txt b/pep-0458.txt --- a/pep-0458.txt +++ b/pep-0458.txt @@ -1,1083 +1,1083 @@ -PEP: 458 -Title: Surviving a Compromise of PyPI -Version: $Revision$ -Last-Modified: $Date$ -Author: Trishank Karthik Kuppusamy , - Donald Stufft , - Justin Cappos -Discussions-To: Distutils SIG -Status: Draft -Type: Standards Track -Content-Type: text/x-rst -Created: 27-Sep-2013 - - -Abstract -======== - -This PEP describes how the Python Package Index (PyPI [1]_) may be integrated -with The Update Framework [2]_ (TUF). TUF was designed to be a plug-and-play -security add-on to a software updater or package manager. TUF provides -end-to-end security like SSL, but for software updates instead of HTTP -connections. The framework integrates best security practices such as -separating responsibilities, adopting the many-man rule for signing packages, -keeping signing keys offline, and revocation of expired or compromised signing -keys. - -The proposed integration will render modern package managers such as pip [3]_ -more secure against various types of security attacks on PyPI and protect users -against them. Even in the worst case where an attacker manages to compromise -PyPI itself, the damage is controlled in scope and limited in duration. - -Specifically, this PEP will describe how PyPI processes should be adapted to -incorporate TUF metadata. It will not prescribe how package managers such as -pip should be adapted to install or update with TUF metadata projects from -PyPI. - - -Rationale -========= - -In January 2013, the Python Software Foundation (PSF) announced [4]_ that the -python.org wikis for Python, Jython, and the PSF were subjected to a security -breach which caused all of the wiki data to be destroyed on January 5 2013. -Fortunately, the PyPI infrastructure was not affected by this security breach. -However, the incident is a reminder that PyPI should take defensive steps to -protect users as much as possible in the event of a compromise. Attacks on -software repositories happen all the time [5]_. We must accept the possibility -of security breaches and prepare PyPI accordingly because it is a valuable -target used by thousands, if not millions, of people. - -Before the wiki attack, PyPI used MD5 hashes to tell package managers such as -pip whether or not a package was corrupted in transit. However, the absence of -SSL made it hard for package managers to verify transport integrity to PyPI. -It was easy to launch a man-in-the-middle attack between pip and PyPI to change -package contents arbitrarily. This can be used to trick users into installing -malicious packages. 
After the wiki attack, several steps were proposed (some -of which were implemented) to deliver a much higher level of security than was -previously the case: requiring SSL to communicate with PyPI [6]_, restricting -project names [7]_, and migrating from MD5 to SHA-2 hashes [8]_. - -These steps, though necessary, are insufficient because attacks are still -possible through other avenues. For example, a public mirror is trusted to -honestly mirror PyPI, but some mirrors may misbehave due to malice or accident. -Package managers such as pip are supposed to use signatures from PyPI to verify -packages downloaded from a public mirror [9]_, but none are known to actually -do so [10]_. Therefore, it is also wise to add more security measures to -detect attacks from public mirrors or content delivery networks [11]_ (CDNs). - -Even though official mirrors are being deprecated on PyPI [12]_, there remain a -wide variety of other attack vectors on package managers [13]_. Among other -things, these attacks can crash client systems, cause obsolete packages to be -installed, or even allow an attacker to execute arbitrary code. In September -2013, we showed how the latest version of pip then was susceptible to these -attacks and how TUF could protect users against them [14]_. - -Finally, PyPI allows for packages to be signed with GPG keys [15]_, although no -package manager is known to verify those signatures, thus negating much of the -benefits of having those signatures at all. Validating integrity through -cryptography is important, but issues such as immediate and secure key -revocation or specifying a required threshold number of signatures still -remain. Furthermore, GPG by itself does not immediately address the attacks -mentioned above. - -In order to protect PyPI against infrastructure compromises, we propose -integrating PyPI with The Update Framework [2]_ (TUF). - - -Definitions -=========== - -The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", -"SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this document are to be -interpreted as described in RFC 2119__. - -__ http://www.ietf.org/rfc/rfc2119.txt - -In order to keep this PEP focused solely on the application of TUF on PyPI, the -reader is assumed to already be familiar with the design principles of -TUF [2]_. It is also strongly RECOMMENDED that the reader be familiar with the -TUF specification [16]_. - -* Projects: Projects are software components that are made available for - integration. Projects include Python libraries, frameworks, scripts, plugins, - applications, collections of data or other resources, and various - combinations thereof. Public Python projects are typically registered on the - Python Package Index [17]_. - -* Releases: Releases are uniquely identified snapshots of a project [17]_. - -* Distributions: Distributions are the packaged files which are used to publish - and distribute a release [17]_. - -* Simple index: The HTML page which contains internal links to the - distributions of a project [17]_. - -* Consistent snapshot: A set of TUF metadata and PyPI targets that capture the - complete state of all projects on PyPI as they were at some fixed point in - time. - -* The *consistent-snapshot* (*release*) role: In order to prevent confusion due - to the different meanings of the term "release" as employed by PEP 426 [17]_ - and the TUF specification [16]_, we rename the *release* role as the - *consistent-snapshot* role. 
- -* Continuous delivery: A set of processes with which PyPI produces consistent - snapshots that can safely coexist and deleted independently [18]_. - -* Developer: Either the owner or maintainer of a project who is allowed to - update the TUF metadata as well as distribution metadata and data for the - project. - -* Online key: A key that MUST be stored on the PyPI server infrastructure. - This is usually to allow automated signing with the key. However, this means - that an attacker who compromises PyPI infrastructure will be able to read - these keys. - -* Offline key: A key that MUST be stored off the PyPI infrastructure. This - prevents automated signing with the key. This means that an attacker who - compromises PyPI infrastructure will not be able to immediately read these - keys. - -* Developer key: A private key for which its corresponding public key is - registered with PyPI to say that it is responsible for directly signing for - or delegating the distributions belonging to a project. For the purposes of - this PEP, it is offline in the sense that the private key MUST not be stored - on PyPI. However, the project is free to require certain developer keys to - be online on its own infrastructure. - -* Threshold signature scheme: A role could increase its resilience to key - compromises by requiring that at least t out of n keys are REQUIRED to sign - its metadata. This means that a compromise of t-1 keys is insufficient to - compromise the role itself. We denote this property by saying that the role - requires (t, n) keys. - - -Overview -======== - -.. image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/figure1.png - -Figure 1: A simplified overview of the roles in PyPI with TUF - -Figure 1 shows a simplified overview of the roles that TUF metadata assume on -PyPI. The top-level *root* role signs for the keys of the top-level -*timestamp*, *consistent-snapshot*, *targets* and *root* roles. The -*timestamp* role signs for a new and consistent snapshot. The *consistent- -snapshot* role signs for the *root*, *targets* and all delegated targets -metadata. The *claimed* role signs for all projects that have registered their -own developer keys with PyPI. The *recently-claimed* role signs for all -projects that recently registered their own developer keys with PyPI. Finally, -the *unclaimed* role signs for all projects that have not registered developer -keys with PyPI. The *claimed*, *recently-claimed* and *unclaimed* roles are -numbered 1, 2, 3 respectively because a project will be searched for in each of -those roles in that descending order: first in *claimed*, then in -*recently-claimed* if necessary, and finally in *unclaimed* if necessary. - -Every year, PyPI administrators are going to sign for *root* role keys. After -that, automation will continuously sign for a timestamped, consistent snapshot -of all projects. Every few months, PyPI administrators will move projects with -vetted developer keys from the *recently-claimed* role to the *claimed* role. -As we will soon see, they will sign for *claimed* with projects with offline -keys. - -This PEP does not require project developers to use TUF to secure their -packages from attacks on PyPI. By default, all projects will be signed for by -the *unclaimed* role. If a project wishes stronger security guarantees, then -the project is strongly RECOMMENDED to register developer keys with PyPI so -that it may sign for its own distributions. 
By doing so, the project must -remain as a *recently-claimed* project until PyPI administrators have had an -opportunity to vet the developer keys of the project, after which the project -will be moved to the *claimed* role. - -This PEP has **not** been designed to be backward-compatible for package -managers that do not use the TUF security protocol to install or update a -project from the PyPI described here. Instead, it is RECOMMENDED that PyPI -maintain a backward-compatible API of itself that does NOT offer TUF so that -older package managers that do not use TUF will be able to install or update -projects from PyPI as usual but without any of the security offered by TUF. -For the rest of this PEP, we will assume that PyPI will simultaneously maintain -a backward-incompatible API of itself for package managers that MUST use TUF to -securely install or update projects. We think that this approach represents a -reasonable trade-off: older package managers that do not TUF will still be able -to install or update projects without any TUF security from PyPI, and newer -package managers that do use TUF will be able to securely install or update -projects. At some point in the future, PyPI administrators MAY choose to -permanently deprecate the backward-compatible version of itself that does not -offer TUF metadata. - -Unless a mirror, CDN or the PyPI repository has been compromised, the end-user -will not be able to discern whether or not a package manager is using TUF to -install or update a project from PyPI. - - -Responsibility Separation -========================= - -Recall that TUF requires four top-level roles: *root*, *timestamp*, -*consistent-snapshot* and *targets*. The *root* role specifies the keys of all -the top-level roles (including itself). The *timestamp* role specifies the -latest consistent snapshot. The *consistent-snapshot* role specifies the -latest versions of all TUF metadata files (other than *timestamp*). The -*targets* role specifies available target files (in our case, it will be all -files on PyPI under the /simple and /packages directories). In this PEP, each -of these roles will serve their responsibilities without exception. - -Our proposal offers two levels of security to developers. If developers opt in -to secure their projects with their own developer keys, then their projects -will be very secure. Otherwise, TUF will still protect them in many cases: - -1. Minimum security (no action by a developer): protects *unclaimed* and - *recently-claimed* projects without developer keys from CDNs [19]_ or public - mirrors, but not from some PyPI compromises. This is because continuous - delivery requires some keys to be online. This level of security protects - projects from being accidentally or deliberately tampered with by a mirror - or a CDN because the mirror or CDN will not have any of the PyPI or - developer keys required to sign for projects. However, it would not protect - projects from attackers who have compromised PyPI because they will be able - to manipulate the TUF metadata for *unclaimed* projects with the appropriate - online keys. - -2. Maximum security (developer signs their project): protects projects with - developer keys not only from CDNs or public mirrors, but also from some PyPI - compromises. This is because many important keys will be offline. This - level of security protects projects from being accidentally or deliberately - tampered with by a mirror or a CDN for reasons identical to the minimum - security level. 
It will also protect projects (or at least mitigate - damages) from the most likely attacks on PyPI. For example: given access to - online keys after a PyPI compromise, attackers will be able to freeze the - distributions for these projects, but they will not be able to serve - malicious distributions for these projects (not without compromising other - offline keys which would entail more risk, time and energy). Details for - the exact level of security offered is discussed in the section on key - management. - -In order to complete support for continuous delivery, we propose three -delegated targets roles: - -1. *claimed*: Signs for the delegation of PyPI projects to their respective - developer keys. - -2. *recently-claimed*: This role is almost identical to the *claimed* role and - could technically be performed by the *unclaimed* role, but there are two - important reasons why it exists independently: the first reason is to - improve the performance of looking up projects in the *unclaimed* role (by - moving metadata to the *recently-claimed* role instead), and the second - reason is to make it easier for PyPI administrators to move - *recently-claimed* projects to the *claimed* role. - -3. *unclaimed*: Signs for PyPI projects without developer keys. - -The *targets* role MUST delegate all PyPI projects to the three delegated -targets roles in the order of appearance listed above. This means that when -pip downloads with TUF a distribution from a project on PyPI, it will first -consult the *claimed* role about it. If the *claimed* role has delegated the -project, then pip will trust the project developers (in order of delegation) -about the TUF metadata for the project. Otherwise, pip will consult the -*recently-claimed* role about the project. If the *recently-claimed* role has -delegated the project, then pip will trust the project developers (in order of -delegation) about the TUF metadata for the project. Otherwise, pip will -consult the *unclaimed* role about the TUF metadata for the project. If the -*unclaimed* role has not delegated the project, then the project is considered -to be non-existent on PyPI. - -A PyPI project MAY begin without registering a developer key. Therefore, the -project will be signed for by the *unclaimed* role. After registering -developer keys, the project will be removed from the *unclaimed* role and -delegated to the *recently-claimed* role. After a probation period and a -vetting process to verify the developer keys of the project, the project will -be removed from the *recently-claimed* role and delegated to the *claimed* -role. - -The *claimed* role offers maximum security, whereas the *recently-claimed* and -*unclaimed* role offer minimum security. All three roles support continuous -delivery of PyPI projects. - -The *unclaimed* role offers minimum security because PyPI will sign for -projects without developer keys with an online key in order to permit -continuous delivery. - -The *recently-claimed* role offers minimum security because while the project -developers will sign for their own distributions with offline developer keys, -PyPI will sign with an online key the delegation of the project to those -offline developer keys. The signing of the delegation with an online key -allows PyPI administrators to continuously deliver projects without having to -continuously sign the delegation whenever one of those projects registers -developer keys. 
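An editorial sketch of the lookup order described a few paragraphs above (claimed, then recently-claimed, then unclaimed); the role names follow the PEP, everything else here is invented for illustration:

    SEARCH_ORDER = ("claimed", "recently-claimed", "unclaimed")

    def find_delegating_role(project, delegations):
        """Return the first role that delegates *project*, or None (sketch)."""
        for role in SEARCH_ORDER:
            if project in delegations.get(role, ()):
                return role
        return None    # the project is then treated as non-existent on PyPI

    # e.g. find_delegating_role("foo", {"recently-claimed": {"foo"}})
    #      returns "recently-claimed"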
- -Finally, the *claimed* role offers maximum security because PyPI will sign with -offline keys the delegation of a project to its offline developer keys. This -means that every now and then, PyPI administrators will vet developer keys and -sign the delegation of a project to those developer keys after being reasonably -sure about the ownership of the developer keys. The process for vetting -developer keys is out of the scope of this PEP. - - -Metadata Management -=================== - -In this section, we examine the TUF metadata that PyPI must manage by itself, -and other TUF metadata that must be safely delegated to projects. Examples of -the metadata described here may be seen at our testbed mirror of -`PyPI-with-TUF`__. - -__ http://mirror1.poly.edu/ - -The metadata files that change most frequently will be *timestamp*, -*consistent-snapshot* and delegated targets (*claimed*, *recently-claimed*, -*unclaimed*, project) metadata. The *timestamp* and *consistent-snapshot* -metadata MUST be updated whenever *root*, *targets* or delegated targets -metadata are updated. Observe, though, that *root* and *targets* metadata are -much less likely to be updated as often as delegated targets metadata. -Therefore, *timestamp* and *consistent-snapshot* metadata will most likely be -updated frequently (possibly every minute) due to delegated targets metadata -being updated frequently in order to drive continuous delivery of projects. - -Consequently, the processes with which PyPI updates projects will have to be -updated accordingly, the details of which are explained in the following -subsections. - - -Why Do We Need Consistent Snapshots? ------------------------------------- - -In an ideal world, metadata and data should be immediately updated and -presented whenever a project is updated. In practice, there will be problems -when there are many readers and writers who access the same metadata or data at -the same time. - -An important example at the time of writing is that, mirrors are very likely, -as far as we can tell, to update in an inconsistent manner from PyPI as it is -without TUF. Specifically, a mirror would update itself in such a way that -project A would be from time T, whereas project B would be from time T+5, -project C would be from time T+3, and so on where T is the time that the mirror -first begun updating itself. There is no known way for a mirror to update -itself such that it captures the state of all projects as they were at time T. - -Adding TUF to PyPI will not automatically solve the problem. Consider what we -call the `"inverse replay" or "fast-forward" problem`__. Suppose that PyPI has -timestamped a consistent snapshot at version 1. A mirror is later in the -middle of copying PyPI at this snapshot. While the mirror is copying PyPI at -this snapshot, PyPI timestamps a new snapshot at, say, version 2. Without -accounting for consistency, the mirror would then find itself with a copy of -PyPI in an inconsistent state which is indistinguishable from arbitrary -metadata or target attacks. The problem would also apply when the mirror is -substituted with a pip user. - -__ https://groups.google.com/forum/#!topic/theupdateframework/8mkR9iqivQA - -Therefore, the problem can be summarized as such: there are problems of -consistency on PyPI with or without TUF. TUF requires its metadata to be -consistent with the data, but how would the metadata be kept consistent with -projects that change all the time? 
- -As a result, we will solve for PyPI the problem of producing a consistent -snapshot that captures the state of all known projects at a given time. Each -consistent snapshot can safely coexist with any other consistent snapshot and -deleted independently without affecting any other consistent snapshot. - -The gist of the solution is that every metadata or data file written to disk -MUST include in its filename the `cryptographic hash`__ of the file. How would -this help clients which use the TUF protocol to securely and consistently -install or update a project from PyPI? - -__ https://en.wikipedia.org/wiki/Cryptographic_hash_function - -Recall that the first step in the TUF protocol requires the client to download -the latest *timestamp* metadata. However, the client would not know in advance -the hash of the *timestamp* metadata file from the latest consistent snapshot. -Therefore, PyPI MUST redirect all HTTP GET requests for *timestamp* metadata to -the *timestamp* metadata file from the latest consistent snapshot. Since the -*timestamp* metadata is the root of a tree of cryptographic hashes pointing to -every other metadata or target file that are meant to exist together for -consistency, the client is then able to retrieve any file from this consistent -snapshot by deterministically including, in the request for the file, the hash -of the file in the filename. Assuming infinite disk space and no `hash -collisions`__, a client may safely read from one consistent snapshot while PyPI -produces another consistent snapshot. - -__ https://en.wikipedia.org/wiki/Collision_(computer_science) - -In this simple but effective manner, we are able to capture a consistent -snapshot of all projects and the associated metadata at a given time. The next -subsection will explicate the implementation details of this idea. - - -Producing Consistent Snapshots ------------------------------- - -Given a project, PyPI is responsible for updating, depending on the project, -either the *claimed*, *recently-claimed* or *unclaimed* metadata as well as -associated delegated targets metadata. Every project MUST upload its set of -metadata and targets in a single transaction. We will call this set of files -the project transaction. We will discuss later how PyPI MAY validate the files -in a project transaction. For now, let us focus on how PyPI will respond to a -project transaction. We will call this response the project transaction -process. There will also be a consistent snapshot process that we will define -momentarily; for now, it suffices to know that project transaction processes -and the consistent snapshot process must coordinate with each other. - -Also, every metadata and target file MUST include in its filename the `hex -digest`__ of its `SHA-256`__ hash. For this PEP, it is RECOMMENDED that PyPI -adopt a simple convention of the form filename.digest.ext, where filename is -the original filename without a copy of the hash, digest is the hex digest of -the hash, and ext is the filename extension. - -__ http://docs.python.org/2/library/hashlib.html#hashlib.hash.hexdigest -__ https://en.wikipedia.org/wiki/SHA-2 - -When an *unclaimed* project uploads a new transaction, a project transaction -process MUST add all new targets and relevant delegated *unclaimed* metadata. -(We will see later in this section why the *unclaimed* role will delegate -targets to a number of delegated *unclaimed* roles.) 
Finally, the project -transaction process MUST inform the consistent snapshot process about new -delegated *unclaimed* metadata. - -When a *recently-claimed* project uploads a new a transaction, a project -transaction process MUST add all new targets and delegated targets metadata for -the project. If the project is new, then the project transaction process MUST -also add new *recently-claimed* metadata with public keys and threshold number -(which MUST be part of the transaction) for the project. Finally, the project -transaction process MUST inform the consistent snapshot process about new -*recently-claimed* metadata as well as the current set of delegated targets -metadata for the project. - -The process for a *claimed* project is slightly different. The difference is -that PyPI administrators will choose to move the project from the -*recently-claimed* role to the *claimed* role. A project transaction process -MUST then add new *recently-claimed* and *claimed* metadata to reflect this -migration. As is the case for a *recently-claimed* project, the project -transaction process MUST always add all new targets and delegated targets -metadata for the *claimed* project. Finally, the project transaction process -MUST inform the consistent snapshot process about new *recently-claimed* or -*claimed* metadata as well as the current set of delegated targets metadata for -the project. - -Project transaction processes SHOULD be automated, except when PyPI -administrators move a project from the *recently-claimed* role to the *claimed* -role. Project transaction processes MUST also be applied atomically: either -all metadata and targets, or none of them, are added. The project transaction -processes and consistent snapshot process SHOULD work concurrently. Finally, -project transaction processes SHOULD keep in memory the latest *claimed*, -*recently-claimed* and *unclaimed* metadata so that they will be correctly -updated in new consistent snapshots. - -All project transactions MAY be placed in a single queue and processed -serially. Alternatively, the queue MAY be processed concurrently in order of -appearance provided that the following rules are observed: - -1. No pair of project transaction processes must concurrently work on the same - project. - -2. No pair of project transaction processes must concurrently work on - *unclaimed* projects that belong to the same delegated *unclaimed* targets - role. - -3. No pair of project transaction processes must concurrently work on new - *recently-claimed* projects. - -4. No pair of project transaction processes must concurrently work on new - *claimed* projects. - -5. No project transaction process must work on a new *claimed* project while - another project transaction process is working on a new *recently-claimed* - project and vice versa. - -These rules MUST be observed so that metadata is not read from or written to -inconsistently. - -The consistent snapshot process is fairly simple and SHOULD be automated. The -consistent snapshot process MUST keep in memory the latest working set of -*root*, *targets* and delegated targets metadata. Every minute or so, the -consistent snapshot process will sign for this latest working set. (Recall -that project transaction processes continuously inform the consistent snapshot -process about the latest delegated targets metadata in a concurrency-safe -manner. 
The consistent snapshot process will actually sign for a copy of the -latest working set while the actual latest working set in memory will be -updated with information continuously communicated by project transaction -processes.) Next, the consistent snapshot process MUST generate and sign new -*timestamp* metadata that will vouch for the *consistent-snapshot* metadata -generated in the previous step. Finally, the consistent snapshot process MUST -add new *timestamp* and *consistent-snapshot* metadata representing the latest -consistent snapshot. - -A few implementation notes are now in order. So far, we have seen only that -new metadata and targets are added, but not that old metadata and targets are -removed. Practical constraints are such that eventually PyPI will run out of -disk space to produce a new consistent snapshot. In that case, PyPI MAY then -use something like a "mark-and-sweep" algorithm to delete sufficiently old -consistent snapshots: in order to preserve the latest consistent snapshot, PyPI -would walk objects beginning from the root (*timestamp*) of the latest -consistent snapshot, mark all visited objects, and delete all unmarked -objects. The last few consistent snapshots may be preserved in a similar -fashion. Deleting a consistent snapshot will cause clients to see nothing -thereafter but HTTP 404 responses to any request for a file in that consistent -snapshot. Clients SHOULD then retry their requests with the latest consistent -snapshot. - -We do **not** consider updates to any consistent snapshot because `hash -collisions`__ are out of the scope of this PEP. In case a hash collision is -observed, PyPI MAY wish to check that the file being added is identical to the -file already stored. (Should a hash collision be observed, it is far more -likely the case that the file is identical rather than being a genuine -`collision attack`__.) Otherwise, PyPI MAY either overwrite the existing file -or ignore any write operation to an existing file. - -__ https://en.wikipedia.org/wiki/Collision_(computer_science) -__ https://en.wikipedia.org/wiki/Collision_attack - -All clients, such as pip using the TUF protocol, MUST be modified to download -every metadata and target file (except for *timestamp* metadata) by including, -in the request for the file, the hash of the file in the filename. Following -the filename convention recommended earlier, a request for the file at -filename.ext will be transformed to the equivalent request for the file at -filename.digest.ext. - -Finally, PyPI SHOULD use a `transaction log`__ to record project transaction -processes and queues so that it will be easier to recover from errors after a -server failure. - -__ https://en.wikipedia.org/wiki/Transaction_log - - -Metadata Validation -------------------- - -A *claimed* or *recently-claimed* project will need to upload in its -transaction to PyPI not just targets (a simple index as well as distributions) -but also TUF metadata. The project MAY do so by uploading a ZIP file -containing two directories, /metadata/ (containing delegated targets metadata -files) and /targets/ (containing targets such as the project simple index and -distributions which are signed for by the delegated targets metadata). 
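The filename.digest.ext convention recalled earlier in this section is easy to sketch; an editorial example under the PEP's recommendation of SHA-256 hex digests (the function name is invented, and this is not taken from a TUF implementation):

    import hashlib
    import os.path

    def consistent_name(path, data):
        """Rewrite 'dir/name.ext' as 'dir/name.<sha256-hexdigest>.ext' (sketch)."""
        digest = hashlib.sha256(data).hexdigest()
        root, ext = os.path.splitext(path)
        return "%s.%s%s" % (root, digest, ext)

    # e.g. consistent_name("targets/simple/foo/index.html", page_bytes)
    #      -> "targets/simple/foo/index.<64 hex characters>.html"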
- -Whenever the project uploads metadata or targets to PyPI, PyPI SHOULD check the -project TUF metadata for at least the following properties: - -* A threshold number of the developers keys registered with PyPI by that - project MUST have signed for the delegated targets metadata file that - represents the "root" of targets for that project (e.g. metadata/targets/ - project.txt). - -* The signatures of delegated targets metadata files MUST be valid. - -* The delegated targets metadata files MUST NOT be expired. - -* The delegated targets metadata MUST be consistent with the targets. - -* A delegator MUST NOT delegate targets that were not delegated to itself by - another delegator. - -* A delegatee MUST NOT sign for targets that were not delegated to itself by a - delegator. - -* Every file MUST contain a unique copy of its hash in its filename following - the filename.digest.ext convention recommended earlier. - -If PyPI chooses to check the project TUF metadata, then PyPI MAY choose to -reject publishing any set of metadata or targets that do not meet these -requirements. - -PyPI MUST enforce access control by ensuring that each project can only write -to the TUF metadata for which it is responsible. It MUST do so by ensuring -that project transaction processes write to the correct metadata as well as -correct locations within those metadata. For example, a project transaction -process for an *unclaimed* project MUST write to the correct target paths in -the correct delegated *unclaimed* metadata for the targets of the project. - -On rare occasions, PyPI MAY wish to extend the TUF metadata format for projects -in a backward-incompatible manner. Note that PyPI will NOT be able to -automatically rewrite existing TUF metadata on behalf of projects in order to -upgrade the metadata to the new backward-incompatible format because this would -invalidate the signatures of the metadata as signed by developer keys. -Instead, package managers SHOULD be written to recognize and handle multiple -incompatible versions of TUF metadata so that *claimed* and *recently-claimed* -projects could be offered a reasonable time to migrate their metadata to newer -but backward-incompatible formats. - -The details of how each project manages its TUF metadata is beyond the scope of -this PEP. - - -Mirroring Protocol ------------------- - -The mirroring protocol as described in PEP 381 [9]_ SHOULD change to mirror -PyPI with TUF. - -A mirror SHOULD have to maintain for its clients only one consistent snapshot -which would represent the latest consistent snapshot from PyPI known to the -mirror. The mirror would then serve all HTTP requests for metadata or targets -by simply reading directly from this consistent snapshot directory. - -The mirroring protocol itself is fairly simple. The mirror would ask PyPI for -*timestamp* metadata from the latest consistent snapshot and proceed to copy -the entire consistent snapshot from the *timestamp* metadata onwards. If the -mirror encounters a failure to copy any metadata or target file while copying -the consistent snapshot, it SHOULD retrying resuming the copy of that -particular consistent snapshot. If PyPI has deleted that consistent snapshot, -then the mirror SHOULD delete the failed consistent snapshot and try -downloading the latest consistent snapshot instead. - -The mirror SHOULD point users to a previous consistent snapshot directory while -it is copying the latest consistent snapshot from PyPI. 
Only after the latest -consistent snapshot has been completely copied SHOULD the mirror switch clients -to the latest consistent snapshot. The mirror MAY then delete the previous -consistent snapshot once it finds that no client is reading from the previous -consistent snapshot. - -The mirror MAY use extant file transfer software such as rsync__ to mirror -PyPI. In that case, the mirror MUST first obtain the latest known timestamp -metadata from PyPI. The mirror MUST NOT immediately publish the latest known -timestamp metadata from PyPI. Instead, the mirror MUST first iteratively -transfer all new files from PyPI until there are no new files left to transfer. -Finally, the mirror MUST publish the latest known timestamp it fetched from -PyPI so that package managers such as pip may be directed to the latest -consistent snapshot known to the mirror. - -__ https://rsync.samba.org/ - - -Backup Process --------------- - -In order to be able to safely restore from static snapshots later in the event -of a compromise, PyPI SHOULD maintain a small number of its own mirrors to copy -PyPI consistent snapshots according to some schedule. The mirroring protocol -can be used immediately for this purpose. The mirrors must be secured and -isolated such that they are responsible only for mirroring PyPI. The mirrors -can be checked against one another to detect accidental or malicious failures. - - -Metadata Expiry Times ---------------------- - -The *root* and *targets* role metadata SHOULD expire in a year, because these -metadata files are expected to change very rarely. - -The *claimed* role metadata SHOULD expire in three to six months, because this -metadata is expected to be refreshed in that time frame. This time frame was -chosen to induce an easier administration process for PyPI. - -The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* role -metadata SHOULD expire in a day because a CDN or mirror SHOULD synchronize -itself with PyPI every day. Furthermore, this generous time frame also takes -into account client clocks that are highly skewed or adrift. - -The expiry times for the delegated targets metadata of a project is beyond the -scope of this PEP. - - -Metadata Scalability --------------------- - -Due to the growing number of projects and distributions, the TUF metadata will -also grow correspondingly. - -For example, consider the *unclaimed* role. In August 2013, we found that the -size of the *unclaimed* role metadata was about 42MB if the *unclaimed* role -itself signed for about 220K PyPI targets (which are simple indices and -distributions). We will not delve into details in this PEP, but TUF features a -so-called "`lazy bin walk`__" scheme which splits a large targets or delegated -targets metadata file into many small ones. This allows a TUF client updater -to intelligently download only a small number of TUF metadata files in order to -update any project signed for by the *unclaimed* role. For example, applying -this scheme to the previous repository resulted in pip downloading between -1.3KB and 111KB to install or upgrade a PyPI project via TUF. - -__ https://github.com/theupdateframework/tuf/issues/39 - -From our findings as of the time of writing, PyPI SHOULD split all targets in -the *unclaimed* role by delegating it to 1024 delegated targets role, each of -which would sign for PyPI targets whose hashes fall into that "bin" or -delegated targets role. 
We found that 1024 bins would result in the -*unclaimed* role metadata and each of its binned delegated targets role -metadata to be about the same size (40-50KB) for about 220K PyPI targets -(simple indices and distributions). - -It is possible to make the TUF metadata more compact by representing it in a -binary format as opposed to the JSON text format. Nevertheless, we believe -that a sufficiently large number of project and distributions will induce -scalability challenges at some point, and therefore the *unclaimed* role will -then still need delegations in order to address the problem. Furthermore, the -JSON format is an open and well-known standard for data interchange. - -Due to the large number of delegated target metadata files, compressed versions -of *consistent-snapshot* metadata SHOULD also be made available. - - -Key Management -============== - -In this section, we examine the kind of keys required to sign for TUF roles on -PyPI. TUF is agnostic with respect to choices of digital signature algorithms. -For the purpose of discussion, we will assume that most digital signatures will -be produced with the well-tested and tried RSA algorithm [20]_. Nevertheless, -we do NOT recommend any particular digital signature algorithm in this PEP -because there are a few important constraints: firstly, cryptography changes -over time; secondly, package managers such as pip may wish to perform signature -verification in Python, without resorting to a compiled C library, in order to -be able to run on as many systems as Python supports; finally, TUF recommends -diversity of keys for certain applications, and we will soon discuss these -exceptions. - - -Number Of Keys --------------- - -The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* -roles will need to support continuous delivery. Even though their respective -keys will then need to be online, we will require that the keys be independent -of each other. This allows for each of the keys to be placed on separate -servers if need be, and prevents side channel attacks that compromise one key -from automatically compromising the rest of the keys. Therefore, each of the -*timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* roles -MUST require (1, 1) keys. - -The *unclaimed* role MAY delegate targets in an automated manner to a number of -roles called "bins", as we discussed in the previous section. Each of the -"bin" roles SHOULD share the same key as the *unclaimed* role, due -simultaneously to space efficiency of metadata and because there is no security -advantage in requiring separate keys. - -The *root* role is critical for security and should very rarely be used. It is -primarily used for key revocation, and it is the root of trust for all of PyPI. -The *root* role signs for the keys that are authorized for each of the -top-level roles (including itself). The keys belonging to the *root* role are -intended to be very well-protected and used with the least frequency of all -keys. We propose that every PSF board member own a (strong) root key. A -majority of them can then constitute the quorum to revoke or endow trust in all -top-level keys. Alternatively, the system administrators of PyPI (instead of -PSF board members) could be responsible for signing for the *root* role. -Therefore, the *root* role SHOULD require (t, n) keys, where n is the number of -either all PyPI administrators or all PSF board members, and t > 1 (so that at -least two members must sign the *root* role). 
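For illustration, the (t, n) threshold property described above amounts to the following check; the function and data layout are invented for exposition and are not taken from the TUF specification::

    def threshold_met(valid_keyids, authorized_keyids, threshold):
        # Count only valid signatures made by keys authorized for the role.
        trusted = set(valid_keyids) & set(authorized_keyids)
        return len(trusted) >= threshold

    # A (2, 4) root role: any two of the four authorized keys suffice.
    assert threshold_met({"keyA", "keyC"}, {"keyA", "keyB", "keyC", "keyD"}, 2)
    assert not threshold_met({"keyA"}, {"keyA", "keyB", "keyC", "keyD"}, 2)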
- -The *targets* role will be used only to sign for the static delegation of all -targets to the *claimed*, *recently-claimed* and *unclaimed* roles. Since -these target delegations must be secured against attacks in the event of a -compromise, the keys for the *targets* role MUST be offline and independent -from other keys. For simplicity of key management without sacrificing -security, it is RECOMMENDED that the keys of the *targets* role are permanently -discarded as soon as they have been created and used to sign for the role. -Therefore, the *targets* role SHOULD require (1, 1) keys. Again, this is -because the keys are going to be permanently discarded, and more offline keys -will not help against key recovery attacks [21]_ unless diversity of keys is -maintained. - -Similarly, the *claimed* role will be used only to sign for the dynamic -delegation of projects to their respective developer keys. Since these target -delegations must be secured against attacks in the event of a compromise, the -keys for the *claimed* role MUST be offline and independent from other keys. -Therefore, the *claimed* role SHOULD require (t, n) keys, where n is the number -of all PyPI administrators (in order to keep it manageable), and t ? 1 (so that -at least one member MUST sign the *claimed* role). While a stronger threshold -would indeed render the role more robust against a compromise of the *claimed* -keys (which is highly unlikely assuming that the keys are independent and -securely kept offline), we think that this trade-off is acceptable for the -important purpose of keeping the maintenance overhead for PyPI administrators -as little as possible. At the time of writing, we are keeping this point open -for discussion by the distutils-sig community. - -The number of developer keys is project-specific and thus beyond the scope of -this PEP. - - -Online and Offline Keys ------------------------ - -In order to support continuous delivery, the *timestamp*, -*consistent-snapshot*, *recently-claimed* and *unclaimed* role keys MUST be -online. - -As explained in the previous section, the *root*, *targets* and *claimed* role -keys MUST be offline for maximum security. Developers keys will be offline in -the sense that the private keys MUST NOT be stored on PyPI, though some of them -may be online on the private infrastructure of the project. - - -Key Strength ------------- - -At the time of writing, we recommend that all RSA keys (both offline and -online) SHOULD have a minimum key size of 3072 bits for data-protection -lifetimes beyond 2030 [22]_. - - -Diversity Of Keys ------------------ - -Due to the threats of weak key generation and implementation weaknesses [2]_, -the types of keys as well as the libraries used to generate them should vary -within TUF on PyPI. Our current implementation of TUF supports multiple -digital signature algorithms such as RSA (with OpenSSL [23]_ or PyCrypto [24]_) -and ed25519 [25]_. Furthermore, TUF supports the binding of other -cryptographic libraries that it does not immediately support "out of the box", -and so one MAY generate keys using other cryptographic libraries and use them -for TUF on PyPI. - -As such, the root role keys SHOULD be generated by a variety of digital -signature algorithms as implemented by different cryptographic libraries. - - -Key Compromise Analysis ------------------------ - -.. 
image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/table1.png - -Table 1: Attacks possible by compromising certain combinations of role keys - - -Table 1 summarizes the kinds of attacks rendered possible by compromising a -threshold number of keys belonging to the TUF roles on PyPI. Except for the -*timestamp* and *consistent-snapshot* roles, the pairwise interaction of role -compromises may be found by taking the union of both rows. - -In September 2013, we showed how the latest version of pip then was susceptible -to these attacks and how TUF could protect users against them [14]_. - -An attacker who compromises developer keys for a project and who is able to -somehow upload malicious metadata and targets to PyPI will be able to serve -malicious updates to users of that project (and that project alone). Note that -compromising *targets* or any delegated targets role (except for project -targets metadata) does not immediately endow the attacker with the ability to -serve malicious updates. The attacker must also compromise the *timestamp* and -*consistent-snapshot* roles (which are both online and therefore more likely to -be compromised). This means that in order to launch any attack, one must be -not only be able to act as a man-in-the-middle but also compromise the -*timestamp* key (or the *root* keys and sign a new *timestamp* key). To launch -any attack other than a freeze attack, one must also compromise the -*consistent-snapshot* key. - -Finally, a compromise of the PyPI infrastructure MAY introduce malicious -updates to *recently-claimed* and *unclaimed* projects because the keys for -those roles are online. However, attackers cannot modify *claimed* projects in -such an event because *targets* and *claimed* metadata have been signed with -offline keys. Therefore, it is RECOMMENDED that high-value projects register -their developer keys with PyPI and sign for their own distributions. - - -In the Event of a Key Compromise --------------------------------- - -By a key compromise, we mean that the key as well as PyPI infrastructure has -been compromised and used to sign new metadata on PyPI. - -If a threshold number of developer keys of a project have been compromised, -then the project MUST take the following steps: - -1. The project metadata and targets MUST be restored to the last known good - consistent snapshot where the project was not known to be compromised. This - can be done by the developers repackaging and resigning all targets with the - new keys. - -2. The project delegated targets metadata MUST have their version numbers - incremented, expiry times suitably extended and signatures renewed. - -Whereas PyPI MUST take the following steps: - -1. Revoke the compromised developer keys from the delegation to the project by - the *recently-claimed* or *claimed* role. This is done by replacing the - compromised developer keys with newly issued developer keys. - -2. A new timestamped consistent snapshot MUST be issued. - -If a threshold number of *timestamp*, *consistent-snapshot*, *recently-claimed* -or *unclaimed* keys have been compromised, then PyPI MUST take the following -steps: - -1. Revoke the *timestamp*, *consistent-snapshot* and *targets* role keys from - the *root* role. This is done by replacing the compromised *timestamp*, - *consistent-snapshot* and *targets* keys with newly issued keys. - -2. Revoke the *recently-claimed* and *unclaimed* keys from the *targets* role - by replacing their keys with newly issued keys. 
Sign the new *targets* role - metadata and discard the new keys (because, as we explained earlier, this - increases the security of *targets* metadata). - -3. Clear all targets or delegations in the *recently-claimed* role and delete - all associated delegated targets metadata. Recently registered projects - SHOULD register their developer keys again with PyPI. - -4. All targets of the *recently-claimed* and *unclaimed* roles SHOULD be - compared with the last known good consistent snapshot where none of the - *timestamp*, *consistent-snapshot*, *recently-claimed* or *unclaimed* keys - were known to have been compromised. Added, updated or deleted targets in - the compromised consistent snapshot that do not match the last known good - consistent snapshot MAY be restored to their previous versions. After - ensuring the integrity of all *unclaimed* targets, the *unclaimed* metadata - MUST be regenerated. - -5. The *recently-claimed* and *unclaimed* metadata MUST have their version - numbers incremented, expiry times suitably extended and signatures renewed. - -6. A new timestamped consistent snapshot MUST be issued. - -This would preemptively protect all of these roles even though only one of them -may have been compromised. - -If a threshold number of the *targets* or *claimed* keys have been compromised, -then there is little that an attacker could do without the *timestamp* and -*consistent-snapshot* keys. In this case, PyPI MUST simply revoke the -compromised *targets* or *claimed* keys by replacing them with new keys in the -*root* and *targets* roles respectively. - -If a threshold number of the *timestamp*, *consistent-snapshot* and *claimed* -keys have been compromised, then PyPI MUST take the following steps in addition -to the steps taken when either the *timestamp* or *consistent-snapshot* keys -are compromised: - -1. Revoke the *claimed* role keys from the *targets* role and replace them with - newly issued keys. - -2. All project targets of the *claimed* roles SHOULD be compared with the last - known good consistent snapshot where none of the *timestamp*, - *consistent-snapshot* or *claimed* keys were known to have been compromised. - Added, updated or deleted targets in the compromised consistent snapshot - that do not match the last known good consistent snapshot MAY be restored to - their previous versions. After ensuring the integrity of all *claimed* - project targets, the *claimed* metadata MUST be regenerated. - -3. The *claimed* metadata MUST have their version numbers incremented, expiry - times suitably extended and signatures renewed. - -If a threshold number of the *timestamp*, *consistent-snapshot* and *targets* -keys have been compromised, then PyPI MUST take the union of the steps taken -when the *claimed*, *recently-claimed* and *unclaimed* keys have been -compromised. - -If a threshold number of the *root* keys have been compromised, then PyPI MUST -take the steps taken when the *targets* role has been compromised as well as -replace all of the *root* keys. - -It is also RECOMMENDED that PyPI sufficiently document compromises with -security bulletins. These security bulletins will be most informative when -users of pip with TUF are unable to install or update a project because the -keys for the *timestamp*, *consistent-snapshot* or *root* roles are no longer -valid. They could then visit the PyPI web site to consult security bulletins -that would help to explain why they are no longer able to install or update, -and then take action accordingly. 
When a threshold number of *root* keys have -not been revoked due to a compromise, then new *root* metadata may be safely -updated because a threshold number of existing *root* keys will be used to sign -for the integrity of the new *root* metadata so that TUF clients will be able -to verify the integrity of the new *root* metadata with a threshold number of -previously known *root* keys. This will be the common case. Otherwise, in the -worst case where a threshold number of *root* keys have been revoked due to a -compromise, an end-user may choose to update new *root* metadata with -`out-of-band`__ mechanisms. - -__ https://en.wikipedia.org/wiki/Out-of-band#Authentication - - -Appendix: Rejected Proposals -============================ - - -Alternative Proposals for Producing Consistent Snapshots --------------------------------------------------------- - -The complete file snapshot (CFS) scheme uses file system directories to store -efficient consistent snapshots over time. In this scheme, every consistent -snapshot will be stored in a separate directory, wherein files that are shared -with previous consistent snapshots will be `hard links`__ instead of copies. - -__ https://en.wikipedia.org/wiki/Hard_link - -The `differential file`__ snapshot (DFS) scheme is a variant of the CFS scheme, -wherein the next consistent snapshot directory will contain only the additions -of new files and updates to existing files of the previous consistent snapshot. -(The first consistent snapshot will contain a complete set of files known -then.) Deleted files will be marked as such in the next consistent snapshot -directory. This means that files will be resolved in this manner: First, set -the current consistent snapshot directory to be the latest consistent snapshot -directory. Then, any requested file will be seeked in the current consistent -snapshot directory. If the file exists in the current consistent snapshot -directory, then that file will be returned. If it has been marked as deleted -in the current consistent snapshot directory, then that file will be reported -as missing. Otherwise, the current consistent snapshot directory will be set -to the preceding consistent snapshot directory and the previous few steps will -be iterated until there is no preceding consistent snapshot to be considered, -at which point the file will be reported as missing. - -__ http://dl.acm.org/citation.cfm?id=320484 - -With the CFS scheme, the trade-off is the I/O costs of producing a consistent -snapshot with the file system. As of October 2013, we found that a fairly -modern computer with a 7200RPM hard disk drive required at least three minutes -to produce a consistent snapshot with the "cp -lr" command on the ext3__ file -system. Perhaps the I/O costs of this scheme may be ameliorated with advanced -tools or file systems such as ZFS__ or btrfs__. - -__ https://en.wikipedia.org/wiki/Ext3 -__ https://en.wikipedia.org/wiki/ZFS -__ https://en.wikipedia.org/wiki/Btrfs - -While the DFS scheme improves upon the CFS scheme in terms of producing faster -consistent snapshots, there are at least two trade-offs. The first is that a -web server will need to be modified to perform the "daisy chain" resolution of -a file. The second is that every now and then, the differential snapshots will -need to be "squashed" or merged together with the first consistent snapshot to -produce a new first consistent snapshot with the latest and complete set of -files. 
Although the merge cost may be amortized over time, this scheme is not -conceptually si - - - - -References -========== - -.. [1] https://pypi.python.org -.. [2] https://isis.poly.edu/~jcappos/papers/samuel_tuf_ccs_2010.pdf -.. [3] http://www.pip-installer.org -.. [4] https://wiki.python.org/moin/WikiAttack2013 -.. [5] https://github.com/theupdateframework/pip/wiki/Attacks-on-software-repositories -.. [6] https://mail.python.org/pipermail/distutils-sig/2013-April/020596.html -.. [7] https://mail.python.org/pipermail/distutils-sig/2013-May/020701.html -.. [8] https://mail.python.org/pipermail/distutils-sig/2013-July/022008.html -.. [9] PEP 381, Mirroring infrastructure for PyPI, Ziad?, L?wis - http://www.python.org/dev/peps/pep-0381/ -.. [10] https://mail.python.org/pipermail/distutils-sig/2013-September/022773.html -.. [11] https://mail.python.org/pipermail/distutils-sig/2013-May/020848.html -.. [12] PEP 449, Removal of the PyPI Mirror Auto Discovery and Naming Scheme, Stufft - http://www.python.org/dev/peps/pep-0449/ -.. [13] https://isis.poly.edu/~jcappos/papers/cappos_mirror_ccs_08.pdf -.. [14] https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html -.. [15] https://pypi.python.org/security -.. [16] https://github.com/theupdateframework/tuf/blob/develop/docs/tuf-spec.txt -.. [17] PEP 426, Metadata for Python Software Packages 2.0, Coghlan, Holth, Stufft - http://www.python.org/dev/peps/pep-0426/ -.. [18] https://en.wikipedia.org/wiki/Continuous_delivery -.. [19] https://mail.python.org/pipermail/distutils-sig/2013-August/022154.html -.. [20] https://en.wikipedia.org/wiki/RSA_%28algorithm%29 -.. [21] https://en.wikipedia.org/wiki/Key-recovery_attack -.. [22] http://csrc.nist.gov/publications/nistpubs/800-57/SP800-57-Part1.pdf -.. [23] https://www.openssl.org/ -.. [24] https://pypi.python.org/pypi/pycrypto -.. [25] http://ed25519.cr.yp.to/ - - -Acknowledgements -================ - -Nick Coghlan, Daniel Holth and the distutils-sig community in general for -helping us to think about how to usably and efficiently integrate TUF with -PyPI. - -Roger Dingledine, Sebastian Hahn, Nick Mathewson, Martin Peck and Justin -Samuel for helping us to design TUF from its predecessor Thandy of the Tor -project. - -Konstantin Andrianov, Geremy Condra, Vladimir Diaz, Zane Fisher, Justin Samuel, -Tian Tian, Santiago Torres, John Ward, and Yuyu Zheng for helping us to develop -TUF. - -Vladimir Diaz, Monzur Muhammad and Sai Teja Peddinti for helping us to review -this PEP. - -Zane Fisher for helping us to review and transcribe this PEP. - - -Copyright -========= - -This document has been placed in the public domain. +PEP: 458 +Title: Surviving a Compromise of PyPI +Version: $Revision$ +Last-Modified: $Date$ +Author: Trishank Karthik Kuppusamy , + Donald Stufft , + Justin Cappos +Discussions-To: Distutils SIG +Status: Draft +Type: Standards Track +Content-Type: text/x-rst +Created: 27-Sep-2013 + + +Abstract +======== + +This PEP describes how the Python Package Index (PyPI [1]_) may be integrated +with The Update Framework [2]_ (TUF). TUF was designed to be a plug-and-play +security add-on to a software updater or package manager. TUF provides +end-to-end security like SSL, but for software updates instead of HTTP +connections. The framework integrates best security practices such as +separating responsibilities, adopting the many-man rule for signing packages, +keeping signing keys offline, and revocation of expired or compromised signing +keys. 
+ +The proposed integration will render modern package managers such as pip [3]_ +more secure against various types of security attacks on PyPI and protect users +against them. Even in the worst case where an attacker manages to compromise +PyPI itself, the damage is controlled in scope and limited in duration. + +Specifically, this PEP will describe how PyPI processes should be adapted to +incorporate TUF metadata. It will not prescribe how package managers such as +pip should be adapted to install or update with TUF metadata projects from +PyPI. + + +Rationale +========= + +In January 2013, the Python Software Foundation (PSF) announced [4]_ that the +python.org wikis for Python, Jython, and the PSF were subjected to a security +breach which caused all of the wiki data to be destroyed on January 5 2013. +Fortunately, the PyPI infrastructure was not affected by this security breach. +However, the incident is a reminder that PyPI should take defensive steps to +protect users as much as possible in the event of a compromise. Attacks on +software repositories happen all the time [5]_. We must accept the possibility +of security breaches and prepare PyPI accordingly because it is a valuable +target used by thousands, if not millions, of people. + +Before the wiki attack, PyPI used MD5 hashes to tell package managers such as +pip whether or not a package was corrupted in transit. However, the absence of +SSL made it hard for package managers to verify transport integrity to PyPI. +It was easy to launch a man-in-the-middle attack between pip and PyPI to change +package contents arbitrarily. This can be used to trick users into installing +malicious packages. After the wiki attack, several steps were proposed (some +of which were implemented) to deliver a much higher level of security than was +previously the case: requiring SSL to communicate with PyPI [6]_, restricting +project names [7]_, and migrating from MD5 to SHA-2 hashes [8]_. + +These steps, though necessary, are insufficient because attacks are still +possible through other avenues. For example, a public mirror is trusted to +honestly mirror PyPI, but some mirrors may misbehave due to malice or accident. +Package managers such as pip are supposed to use signatures from PyPI to verify +packages downloaded from a public mirror [9]_, but none are known to actually +do so [10]_. Therefore, it is also wise to add more security measures to +detect attacks from public mirrors or content delivery networks [11]_ (CDNs). + +Even though official mirrors are being deprecated on PyPI [12]_, there remain a +wide variety of other attack vectors on package managers [13]_. Among other +things, these attacks can crash client systems, cause obsolete packages to be +installed, or even allow an attacker to execute arbitrary code. In September +2013, we showed how the latest version of pip then was susceptible to these +attacks and how TUF could protect users against them [14]_. + +Finally, PyPI allows for packages to be signed with GPG keys [15]_, although no +package manager is known to verify those signatures, thus negating much of the +benefits of having those signatures at all. Validating integrity through +cryptography is important, but issues such as immediate and secure key +revocation or specifying a required threshold number of signatures still +remain. Furthermore, GPG by itself does not immediately address the attacks +mentioned above. 
+ +In order to protect PyPI against infrastructure compromises, we propose +integrating PyPI with The Update Framework [2]_ (TUF). + + +Definitions +=========== + +The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", +"SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this document are to be +interpreted as described in RFC 2119__. + +__ http://www.ietf.org/rfc/rfc2119.txt + +In order to keep this PEP focused solely on the application of TUF on PyPI, the +reader is assumed to already be familiar with the design principles of +TUF [2]_. It is also strongly RECOMMENDED that the reader be familiar with the +TUF specification [16]_. + +* Projects: Projects are software components that are made available for + integration. Projects include Python libraries, frameworks, scripts, plugins, + applications, collections of data or other resources, and various + combinations thereof. Public Python projects are typically registered on the + Python Package Index [17]_. + +* Releases: Releases are uniquely identified snapshots of a project [17]_. + +* Distributions: Distributions are the packaged files which are used to publish + and distribute a release [17]_. + +* Simple index: The HTML page which contains internal links to the + distributions of a project [17]_. + +* Consistent snapshot: A set of TUF metadata and PyPI targets that capture the + complete state of all projects on PyPI as they were at some fixed point in + time. + +* The *consistent-snapshot* (*release*) role: In order to prevent confusion due + to the different meanings of the term "release" as employed by PEP 426 [17]_ + and the TUF specification [16]_, we rename the *release* role as the + *consistent-snapshot* role. + +* Continuous delivery: A set of processes with which PyPI produces consistent + snapshots that can safely coexist and deleted independently [18]_. + +* Developer: Either the owner or maintainer of a project who is allowed to + update the TUF metadata as well as distribution metadata and data for the + project. + +* Online key: A key that MUST be stored on the PyPI server infrastructure. + This is usually to allow automated signing with the key. However, this means + that an attacker who compromises PyPI infrastructure will be able to read + these keys. + +* Offline key: A key that MUST be stored off the PyPI infrastructure. This + prevents automated signing with the key. This means that an attacker who + compromises PyPI infrastructure will not be able to immediately read these + keys. + +* Developer key: A private key for which its corresponding public key is + registered with PyPI to say that it is responsible for directly signing for + or delegating the distributions belonging to a project. For the purposes of + this PEP, it is offline in the sense that the private key MUST not be stored + on PyPI. However, the project is free to require certain developer keys to + be online on its own infrastructure. + +* Threshold signature scheme: A role could increase its resilience to key + compromises by requiring that at least t out of n keys are REQUIRED to sign + its metadata. This means that a compromise of t-1 keys is insufficient to + compromise the role itself. We denote this property by saying that the role + requires (t, n) keys. + + +Overview +======== + +.. 
image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/figure1.png
+
+Figure 1: A simplified overview of the roles in PyPI with TUF
+
+Figure 1 shows a simplified overview of the roles that TUF metadata assumes on
+PyPI. The top-level *root* role signs for the keys of the top-level
+*timestamp*, *consistent-snapshot*, *targets* and *root* roles. The
+*timestamp* role signs for a new and consistent snapshot. The *consistent-
+snapshot* role signs for the *root*, *targets* and all delegated targets
+metadata. The *claimed* role signs for all projects that have registered their
+own developer keys with PyPI. The *recently-claimed* role signs for all
+projects that recently registered their own developer keys with PyPI. Finally,
+the *unclaimed* role signs for all projects that have not registered developer
+keys with PyPI. The *claimed*, *recently-claimed* and *unclaimed* roles are
+numbered 1, 2, 3 respectively because a project will be searched for in each of
+those roles in that descending order: first in *claimed*, then in
+*recently-claimed* if necessary, and finally in *unclaimed* if necessary.
+
+Every year, PyPI administrators are going to sign for *root* role keys. After
+that, automation will continuously sign for a timestamped, consistent snapshot
+of all projects. Every few months, PyPI administrators will move projects with
+vetted developer keys from the *recently-claimed* role to the *claimed* role.
+As we will soon see, they will sign the *claimed* role metadata for those
+projects with offline keys.
+
+This PEP does not require project developers to use TUF to secure their
+packages from attacks on PyPI. By default, all projects will be signed for by
+the *unclaimed* role. If a project desires stronger security guarantees, then
+the project is strongly RECOMMENDED to register developer keys with PyPI so
+that it may sign for its own distributions. After doing so, the project must
+remain a *recently-claimed* project until PyPI administrators have had an
+opportunity to vet the developer keys of the project, after which the project
+will be moved to the *claimed* role.
+
+This PEP has **not** been designed to be backward-compatible for package
+managers that do not use the TUF security protocol to install or update a
+project from the PyPI described here. Instead, it is RECOMMENDED that PyPI
+maintain a backward-compatible API of itself that does NOT offer TUF so that
+older package managers that do not use TUF will be able to install or update
+projects from PyPI as usual but without any of the security offered by TUF.
+For the rest of this PEP, we will assume that PyPI will simultaneously maintain
+a backward-incompatible API of itself for package managers that MUST use TUF to
+securely install or update projects. We think that this approach represents a
+reasonable trade-off: older package managers that do not use TUF will still be
+able to install or update projects without any TUF security from PyPI, and
+newer package managers that do use TUF will be able to securely install or
+update projects. At some point in the future, PyPI administrators MAY choose to
+permanently deprecate the backward-compatible version of itself that does not
+offer TUF metadata.
+
+Unless a mirror, CDN or the PyPI repository has been compromised, the end-user
+will not be able to discern whether or not a package manager is using TUF to
+install or update a project from PyPI. 
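The search order described above can be sketched as follows; this is purely illustrative, and the data structure is invented for exposition rather than being the TUF metadata format::

    DELEGATED_ROLE_SEARCH_ORDER = ("claimed", "recently-claimed", "unclaimed")

    def find_delegating_role(project_name, projects_by_role):
        """Return the first role, in search order, that delegates the given
        project, or None if the project is unknown to PyPI."""
        for role in DELEGATED_ROLE_SEARCH_ORDER:
            if project_name in projects_by_role.get(role, ()):
                return role
        return None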
+ + +Responsibility Separation +========================= + +Recall that TUF requires four top-level roles: *root*, *timestamp*, +*consistent-snapshot* and *targets*. The *root* role specifies the keys of all +the top-level roles (including itself). The *timestamp* role specifies the +latest consistent snapshot. The *consistent-snapshot* role specifies the +latest versions of all TUF metadata files (other than *timestamp*). The +*targets* role specifies available target files (in our case, it will be all +files on PyPI under the /simple and /packages directories). In this PEP, each +of these roles will serve their responsibilities without exception. + +Our proposal offers two levels of security to developers. If developers opt in +to secure their projects with their own developer keys, then their projects +will be very secure. Otherwise, TUF will still protect them in many cases: + +1. Minimum security (no action by a developer): protects *unclaimed* and + *recently-claimed* projects without developer keys from CDNs [19]_ or public + mirrors, but not from some PyPI compromises. This is because continuous + delivery requires some keys to be online. This level of security protects + projects from being accidentally or deliberately tampered with by a mirror + or a CDN because the mirror or CDN will not have any of the PyPI or + developer keys required to sign for projects. However, it would not protect + projects from attackers who have compromised PyPI because they will be able + to manipulate the TUF metadata for *unclaimed* projects with the appropriate + online keys. + +2. Maximum security (developer signs their project): protects projects with + developer keys not only from CDNs or public mirrors, but also from some PyPI + compromises. This is because many important keys will be offline. This + level of security protects projects from being accidentally or deliberately + tampered with by a mirror or a CDN for reasons identical to the minimum + security level. It will also protect projects (or at least mitigate + damages) from the most likely attacks on PyPI. For example: given access to + online keys after a PyPI compromise, attackers will be able to freeze the + distributions for these projects, but they will not be able to serve + malicious distributions for these projects (not without compromising other + offline keys which would entail more risk, time and energy). Details for + the exact level of security offered is discussed in the section on key + management. + +In order to complete support for continuous delivery, we propose three +delegated targets roles: + +1. *claimed*: Signs for the delegation of PyPI projects to their respective + developer keys. + +2. *recently-claimed*: This role is almost identical to the *claimed* role and + could technically be performed by the *unclaimed* role, but there are two + important reasons why it exists independently: the first reason is to + improve the performance of looking up projects in the *unclaimed* role (by + moving metadata to the *recently-claimed* role instead), and the second + reason is to make it easier for PyPI administrators to move + *recently-claimed* projects to the *claimed* role. + +3. *unclaimed*: Signs for PyPI projects without developer keys. + +The *targets* role MUST delegate all PyPI projects to the three delegated +targets roles in the order of appearance listed above. This means that when +pip downloads with TUF a distribution from a project on PyPI, it will first +consult the *claimed* role about it. 
If the *claimed* role has delegated the +project, then pip will trust the project developers (in order of delegation) +about the TUF metadata for the project. Otherwise, pip will consult the +*recently-claimed* role about the project. If the *recently-claimed* role has +delegated the project, then pip will trust the project developers (in order of +delegation) about the TUF metadata for the project. Otherwise, pip will +consult the *unclaimed* role about the TUF metadata for the project. If the +*unclaimed* role has not delegated the project, then the project is considered +to be non-existent on PyPI. + +A PyPI project MAY begin without registering a developer key. Therefore, the +project will be signed for by the *unclaimed* role. After registering +developer keys, the project will be removed from the *unclaimed* role and +delegated to the *recently-claimed* role. After a probation period and a +vetting process to verify the developer keys of the project, the project will +be removed from the *recently-claimed* role and delegated to the *claimed* +role. + +The *claimed* role offers maximum security, whereas the *recently-claimed* and +*unclaimed* role offer minimum security. All three roles support continuous +delivery of PyPI projects. + +The *unclaimed* role offers minimum security because PyPI will sign for +projects without developer keys with an online key in order to permit +continuous delivery. + +The *recently-claimed* role offers minimum security because while the project +developers will sign for their own distributions with offline developer keys, +PyPI will sign with an online key the delegation of the project to those +offline developer keys. The signing of the delegation with an online key +allows PyPI administrators to continuously deliver projects without having to +continuously sign the delegation whenever one of those projects registers +developer keys. + +Finally, the *claimed* role offers maximum security because PyPI will sign with +offline keys the delegation of a project to its offline developer keys. This +means that every now and then, PyPI administrators will vet developer keys and +sign the delegation of a project to those developer keys after being reasonably +sure about the ownership of the developer keys. The process for vetting +developer keys is out of the scope of this PEP. + + +Metadata Management +=================== + +In this section, we examine the TUF metadata that PyPI must manage by itself, +and other TUF metadata that must be safely delegated to projects. Examples of +the metadata described here may be seen at our testbed mirror of +`PyPI-with-TUF`__. + +__ http://mirror1.poly.edu/ + +The metadata files that change most frequently will be *timestamp*, +*consistent-snapshot* and delegated targets (*claimed*, *recently-claimed*, +*unclaimed*, project) metadata. The *timestamp* and *consistent-snapshot* +metadata MUST be updated whenever *root*, *targets* or delegated targets +metadata are updated. Observe, though, that *root* and *targets* metadata are +much less likely to be updated as often as delegated targets metadata. +Therefore, *timestamp* and *consistent-snapshot* metadata will most likely be +updated frequently (possibly every minute) due to delegated targets metadata +being updated frequently in order to drive continuous delivery of projects. + +Consequently, the processes with which PyPI updates projects will have to be +updated accordingly, the details of which are explained in the following +subsections. 
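The registration lifecycle described in the previous section, from *unclaimed* through *recently-claimed* to *claimed*, can be summarized with the following sketch; the transition table is invented for exposition and is not part of any PyPI implementation::

    # Allowed promotions as developer keys are registered and then vetted.
    PROMOTIONS = {
        "unclaimed": "recently-claimed",   # project registers developer keys
        "recently-claimed": "claimed",     # PyPI administrators vet the keys
        "claimed": None,                   # terminal: maximum security
    }

    def next_role(current_role):
        return PROMOTIONS[current_role]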
+
+
+Why Do We Need Consistent Snapshots?
+------------------------------------
+
+In an ideal world, metadata and data should be immediately updated and
+presented whenever a project is updated. In practice, there will be problems
+when there are many readers and writers who access the same metadata or data at
+the same time.
+
+An important example at the time of writing is that mirrors are very likely,
+as far as we can tell, to update in an inconsistent manner from PyPI as it is
+without TUF. Specifically, a mirror would update itself in such a way that
+project A would be from time T, whereas project B would be from time T+5,
+project C would be from time T+3, and so on, where T is the time that the
+mirror first began updating itself. There is no known way for a mirror to
+update itself such that it captures the state of all projects as they were at
+time T.
+
+Adding TUF to PyPI will not automatically solve the problem. Consider what we
+call the `"inverse replay" or "fast-forward" problem`__. Suppose that PyPI has
+timestamped a consistent snapshot at version 1. A mirror is later in the
+middle of copying PyPI at this snapshot. While the mirror is copying PyPI at
+this snapshot, PyPI timestamps a new snapshot at, say, version 2. Without
+accounting for consistency, the mirror would then find itself with a copy of
+PyPI in an inconsistent state which is indistinguishable from arbitrary
+metadata or target attacks. The problem would also apply when the mirror is
+substituted with a pip user.
+
+__ https://groups.google.com/forum/#!topic/theupdateframework/8mkR9iqivQA
+
+Therefore, the problem can be summarized as follows: there are problems of
+consistency on PyPI with or without TUF. TUF requires its metadata to be
+consistent with the data, but how would the metadata be kept consistent with
+projects that change all the time?
+
+As a result, we will solve for PyPI the problem of producing a consistent
+snapshot that captures the state of all known projects at a given time. Each
+consistent snapshot can safely coexist with any other consistent snapshot and
+be deleted independently without affecting any other consistent snapshot.
+
+The gist of the solution is that every metadata or data file written to disk
+MUST include in its filename the `cryptographic hash`__ of the file. How would
+this help clients which use the TUF protocol to securely and consistently
+install or update a project from PyPI?
+
+__ https://en.wikipedia.org/wiki/Cryptographic_hash_function
+
+Recall that the first step in the TUF protocol requires the client to download
+the latest *timestamp* metadata. However, the client would not know in advance
+the hash of the *timestamp* metadata file from the latest consistent snapshot.
+Therefore, PyPI MUST redirect all HTTP GET requests for *timestamp* metadata to
+the *timestamp* metadata file from the latest consistent snapshot. Since the
+*timestamp* metadata is the root of a tree of cryptographic hashes pointing to
+all of the other metadata and target files that are meant to exist together for
+consistency, the client is then able to retrieve any file from this consistent
+snapshot by deterministically including, in the request for the file, the hash
+of the file in the filename. Assuming infinite disk space and no `hash
+collisions`__, a client may safely read from one consistent snapshot while PyPI
+produces another consistent snapshot. 
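As a concrete sketch of including a file's hash in its filename, using the filename.digest.ext form that the next subsection recommends; the helper name is hypothetical::

    import hashlib
    import os

    def hash_qualified_name(path):
        """Return the filename with the hex digest of its SHA-256 hash
        inserted before the extension, e.g. targets.json becomes
        targets.<64 hex digits>.json."""
        with open(path, "rb") as f:
            digest = hashlib.sha256(f.read()).hexdigest()
        base, ext = os.path.splitext(path)
        return "{0}.{1}{2}".format(base, digest, ext)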
+
+__ https://en.wikipedia.org/wiki/Collision_(computer_science)
+
+In this simple but effective manner, we are able to capture a consistent
+snapshot of all projects and the associated metadata at a given time. The next
+subsection will explicate the implementation details of this idea.
+
+
+Producing Consistent Snapshots
+------------------------------
+
+Given a project, PyPI is responsible for updating, depending on the project,
+either the *claimed*, *recently-claimed* or *unclaimed* metadata as well as
+associated delegated targets metadata. Every project MUST upload its set of
+metadata and targets in a single transaction. We will call this set of files
+the project transaction. We will discuss later how PyPI MAY validate the files
+in a project transaction. For now, let us focus on how PyPI will respond to a
+project transaction. We will call this response the project transaction
+process. There will also be a consistent snapshot process that we will define
+momentarily; for now, it suffices to know that project transaction processes
+and the consistent snapshot process must coordinate with each other.
+
+Also, every metadata and target file MUST include in its filename the `hex
+digest`__ of its `SHA-256`__ hash. For this PEP, it is RECOMMENDED that PyPI
+adopt a simple convention of the form filename.digest.ext, where filename is
+the original filename without a copy of the hash, digest is the hex digest of
+the hash, and ext is the filename extension.
+
+__ http://docs.python.org/2/library/hashlib.html#hashlib.hash.hexdigest
+__ https://en.wikipedia.org/wiki/SHA-2
+
+When an *unclaimed* project uploads a new transaction, a project transaction
+process MUST add all new targets and relevant delegated *unclaimed* metadata.
+(We will see later in this section why the *unclaimed* role will delegate
+targets to a number of delegated *unclaimed* roles.) Finally, the project
+transaction process MUST inform the consistent snapshot process about new
+delegated *unclaimed* metadata.
+
+When a *recently-claimed* project uploads a new transaction, a project
+transaction process MUST add all new targets and delegated targets metadata for
+the project. If the project is new, then the project transaction process MUST
+also add new *recently-claimed* metadata with public keys and threshold number
+(which MUST be part of the transaction) for the project. Finally, the project
+transaction process MUST inform the consistent snapshot process about new
+*recently-claimed* metadata as well as the current set of delegated targets
+metadata for the project.
+
+The process for a *claimed* project is slightly different. The difference is
+that PyPI administrators will choose to move the project from the
+*recently-claimed* role to the *claimed* role. A project transaction process
+MUST then add new *recently-claimed* and *claimed* metadata to reflect this
+migration. As is the case for a *recently-claimed* project, the project
+transaction process MUST always add all new targets and delegated targets
+metadata for the *claimed* project. Finally, the project transaction process
+MUST inform the consistent snapshot process about new *recently-claimed* or
+*claimed* metadata as well as the current set of delegated targets metadata for
+the project.
+
+Project transaction processes SHOULD be automated, except when PyPI
+administrators move a project from the *recently-claimed* role to the *claimed*
+role. 
Project transaction processes MUST also be applied atomically: either +all metadata and targets, or none of them, are added. The project transaction +processes and consistent snapshot process SHOULD work concurrently. Finally, +project transaction processes SHOULD keep in memory the latest *claimed*, +*recently-claimed* and *unclaimed* metadata so that they will be correctly +updated in new consistent snapshots. + +All project transactions MAY be placed in a single queue and processed +serially. Alternatively, the queue MAY be processed concurrently in order of +appearance provided that the following rules are observed: + +1. No pair of project transaction processes must concurrently work on the same + project. + +2. No pair of project transaction processes must concurrently work on + *unclaimed* projects that belong to the same delegated *unclaimed* targets + role. + +3. No pair of project transaction processes must concurrently work on new + *recently-claimed* projects. + +4. No pair of project transaction processes must concurrently work on new + *claimed* projects. + +5. No project transaction process must work on a new *claimed* project while + another project transaction process is working on a new *recently-claimed* + project and vice versa. + +These rules MUST be observed so that metadata is not read from or written to +inconsistently. + +The consistent snapshot process is fairly simple and SHOULD be automated. The +consistent snapshot process MUST keep in memory the latest working set of +*root*, *targets* and delegated targets metadata. Every minute or so, the +consistent snapshot process will sign for this latest working set. (Recall +that project transaction processes continuously inform the consistent snapshot +process about the latest delegated targets metadata in a concurrency-safe +manner. The consistent snapshot process will actually sign for a copy of the +latest working set while the actual latest working set in memory will be +updated with information continuously communicated by project transaction +processes.) Next, the consistent snapshot process MUST generate and sign new +*timestamp* metadata that will vouch for the *consistent-snapshot* metadata +generated in the previous step. Finally, the consistent snapshot process MUST +add new *timestamp* and *consistent-snapshot* metadata representing the latest +consistent snapshot. + +A few implementation notes are now in order. So far, we have seen only that +new metadata and targets are added, but not that old metadata and targets are +removed. Practical constraints are such that eventually PyPI will run out of +disk space to produce a new consistent snapshot. In that case, PyPI MAY then +use something like a "mark-and-sweep" algorithm to delete sufficiently old +consistent snapshots: in order to preserve the latest consistent snapshot, PyPI +would walk objects beginning from the root (*timestamp*) of the latest +consistent snapshot, mark all visited objects, and delete all unmarked +objects. The last few consistent snapshots may be preserved in a similar +fashion. Deleting a consistent snapshot will cause clients to see nothing +thereafter but HTTP 404 responses to any request for a file in that consistent +snapshot. Clients SHOULD then retry their requests with the latest consistent +snapshot. + +We do **not** consider updates to any consistent snapshot because `hash +collisions`__ are out of the scope of this PEP. 
In case a hash collision is +observed, PyPI MAY wish to check that the file being added is identical to the +file already stored. (Should a hash collision be observed, it is far more +likely the case that the file is identical rather than being a genuine +`collision attack`__.) Otherwise, PyPI MAY either overwrite the existing file +or ignore any write operation to an existing file. + +__ https://en.wikipedia.org/wiki/Collision_(computer_science) +__ https://en.wikipedia.org/wiki/Collision_attack + +All clients, such as pip using the TUF protocol, MUST be modified to download +every metadata and target file (except for *timestamp* metadata) by including, +in the request for the file, the hash of the file in the filename. Following +the filename convention recommended earlier, a request for the file at +filename.ext will be transformed to the equivalent request for the file at +filename.digest.ext. + +Finally, PyPI SHOULD use a `transaction log`__ to record project transaction +processes and queues so that it will be easier to recover from errors after a +server failure. + +__ https://en.wikipedia.org/wiki/Transaction_log + + +Metadata Validation +------------------- + +A *claimed* or *recently-claimed* project will need to upload in its +transaction to PyPI not just targets (a simple index as well as distributions) +but also TUF metadata. The project MAY do so by uploading a ZIP file +containing two directories, /metadata/ (containing delegated targets metadata +files) and /targets/ (containing targets such as the project simple index and +distributions which are signed for by the delegated targets metadata). + +Whenever the project uploads metadata or targets to PyPI, PyPI SHOULD check the +project TUF metadata for at least the following properties: + +* A threshold number of the developers keys registered with PyPI by that + project MUST have signed for the delegated targets metadata file that + represents the "root" of targets for that project (e.g. metadata/targets/ + project.txt). + +* The signatures of delegated targets metadata files MUST be valid. + +* The delegated targets metadata files MUST NOT be expired. + +* The delegated targets metadata MUST be consistent with the targets. + +* A delegator MUST NOT delegate targets that were not delegated to itself by + another delegator. + +* A delegatee MUST NOT sign for targets that were not delegated to itself by a + delegator. + +* Every file MUST contain a unique copy of its hash in its filename following + the filename.digest.ext convention recommended earlier. + +If PyPI chooses to check the project TUF metadata, then PyPI MAY choose to +reject publishing any set of metadata or targets that do not meet these +requirements. + +PyPI MUST enforce access control by ensuring that each project can only write +to the TUF metadata for which it is responsible. It MUST do so by ensuring +that project transaction processes write to the correct metadata as well as +correct locations within those metadata. For example, a project transaction +process for an *unclaimed* project MUST write to the correct target paths in +the correct delegated *unclaimed* metadata for the targets of the project. + +On rare occasions, PyPI MAY wish to extend the TUF metadata format for projects +in a backward-incompatible manner. 
Note that PyPI will NOT be able to automatically rewrite existing TUF metadata
on behalf of projects in order to upgrade the metadata to the new
backward-incompatible format, because doing so would invalidate the signatures
of the metadata as signed by developer keys.  Instead, package managers SHOULD
be written to recognize and handle multiple incompatible versions of TUF
metadata, so that *claimed* and *recently-claimed* projects can be offered a
reasonable time to migrate their metadata to newer but backward-incompatible
formats.

The details of how each project manages its TUF metadata are beyond the scope
of this PEP.


Mirroring Protocol
------------------

The mirroring protocol as described in PEP 381 [9]_ SHOULD change to mirror
PyPI with TUF.

A mirror SHOULD maintain for its clients only one consistent snapshot, which
represents the latest consistent snapshot from PyPI known to the mirror.  The
mirror would then serve all HTTP requests for metadata or targets by reading
directly from this consistent snapshot directory.

The mirroring protocol itself is fairly simple.  The mirror asks PyPI for the
*timestamp* metadata of the latest consistent snapshot and proceeds to copy
the entire consistent snapshot from the *timestamp* metadata onwards.  If the
mirror fails to copy any metadata or target file while copying the consistent
snapshot, it SHOULD retry resuming the copy of that particular consistent
snapshot.  If PyPI has deleted that consistent snapshot, then the mirror
SHOULD delete the failed consistent snapshot and try downloading the latest
consistent snapshot instead.

The mirror SHOULD point users to a previous consistent snapshot directory
while it is copying the latest consistent snapshot from PyPI.  Only after the
latest consistent snapshot has been completely copied SHOULD the mirror switch
clients to the latest consistent snapshot.  The mirror MAY then delete the
previous consistent snapshot once it finds that no client is reading from the
previous consistent snapshot.

The mirror MAY use extant file transfer software such as rsync__ to mirror
PyPI.  In that case, the mirror MUST first obtain the latest known timestamp
metadata from PyPI.  The mirror MUST NOT immediately publish the latest known
timestamp metadata from PyPI.  Instead, the mirror MUST first iteratively
transfer all new files from PyPI until there are no new files left to
transfer.  Finally, the mirror MUST publish the latest known timestamp it
fetched from PyPI so that package managers such as pip may be directed to the
latest consistent snapshot known to the mirror.

__ https://rsync.samba.org/


Backup Process
--------------

In order to be able to safely restore from static snapshots later in the event
of a compromise, PyPI SHOULD maintain a small number of its own mirrors to
copy PyPI consistent snapshots according to some schedule.  The mirroring
protocol can be used immediately for this purpose.  The mirrors must be
secured and isolated such that they are responsible only for mirroring PyPI.
The mirrors can be checked against one another to detect accidental or
malicious failures.


Metadata Expiry Times
---------------------

The *root* and *targets* role metadata SHOULD expire in a year, because these
metadata files are expected to change very rarely.

The *claimed* role metadata SHOULD expire in three to six months, because this
metadata is expected to be refreshed in that time frame.  This time frame was
chosen to simplify the administration process for PyPI.
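Regardless of the specific lifetimes chosen, clients reject metadata whose
signed expiration time has passed.  Assuming the ISO 8601 UTC ``expires``
field used by TUF metadata, a minimal expiry check could look like the
following sketch (the dictionary shown is a simplified stand-in for the signed
portion of a metadata file)::

    import datetime

    def is_expired(signed, now=None):
        """Return True if the metadata's 'expires' timestamp is in the past."""
        now = now or datetime.datetime.utcnow()
        expires = datetime.datetime.strptime(signed["expires"],
                                             "%Y-%m-%dT%H:%M:%SZ")
        return now >= expires

    # Metadata that expired at the start of 2014 would be rejected.
    print(is_expired({"expires": "2014-01-01T00:00:00Z"}))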
The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed*
role metadata SHOULD expire in a day, because a CDN or mirror SHOULD
synchronize itself with PyPI every day.  Furthermore, this generous time frame
also takes into account client clocks that are highly skewed or adrift.

The expiry times for the delegated targets metadata of a project are beyond
the scope of this PEP.


Metadata Scalability
--------------------

Due to the growing number of projects and distributions, the TUF metadata will
also grow correspondingly.

For example, consider the *unclaimed* role.  In August 2013, we found that the
size of the *unclaimed* role metadata was about 42MB if the *unclaimed* role
itself signed for about 220K PyPI targets (which are simple indices and
distributions).  We will not delve into details in this PEP, but TUF features
a so-called "`lazy bin walk`__" scheme which splits a large targets or
delegated targets metadata file into many small ones.  This allows a TUF
client updater to intelligently download only a small number of TUF metadata
files in order to update any project signed for by the *unclaimed* role.  For
example, applying this scheme to the previous repository resulted in pip
downloading between 1.3KB and 111KB to install or upgrade a PyPI project via
TUF.

__ https://github.com/theupdateframework/tuf/issues/39

From our findings as of the time of writing, PyPI SHOULD split all targets in
the *unclaimed* role by delegating them to 1024 delegated targets roles, each
of which would sign for PyPI targets whose hashes fall into that "bin" or
delegated targets role.  We found that 1024 bins would result in the
*unclaimed* role metadata and each of its binned delegated targets role
metadata being about the same size (40-50KB) for about 220K PyPI targets
(simple indices and distributions).

It is possible to make the TUF metadata more compact by representing it in a
binary format as opposed to the JSON text format.  Nevertheless, we believe
that a sufficiently large number of projects and distributions will induce
scalability challenges at some point, and therefore the *unclaimed* role will
still need delegations in order to address the problem.  Furthermore, the JSON
format is an open and well-known standard for data interchange.

Due to the large number of delegated targets metadata files, compressed
versions of the *consistent-snapshot* metadata SHOULD also be made available.


Key Management
==============

In this section, we examine the kind of keys required to sign for TUF roles on
PyPI.  TUF is agnostic with respect to choices of digital signature
algorithms.  For the purpose of discussion, we will assume that most digital
signatures will be produced with the well-tested and tried RSA algorithm
[20]_.  Nevertheless, we do NOT recommend any particular digital signature
algorithm in this PEP because there are a few important constraints: firstly,
cryptography changes over time; secondly, package managers such as pip may
wish to perform signature verification in Python, without resorting to a
compiled C library, in order to be able to run on as many systems as Python
supports; finally, TUF recommends diversity of keys for certain applications,
and we will soon discuss these exceptions.
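For illustration only, signing and verifying a metadata file with a 3072-bit
RSA key might look as follows with a recent version of the ``cryptography``
library; this is a sketch under those assumptions, not a recommendation of any
particular library or algorithm::

    from cryptography.hazmat.primitives import hashes
    from cryptography.hazmat.primitives.asymmetric import padding, rsa

    metadata_bytes = b'{"signed": {"_type": "Targets"}}'  # illustrative payload

    private_key = rsa.generate_private_key(public_exponent=65537, key_size=3072)
    pss = padding.PSS(mgf=padding.MGF1(hashes.SHA256()),
                      salt_length=padding.PSS.MAX_LENGTH)

    signature = private_key.sign(metadata_bytes, pss, hashes.SHA256())

    # Verification raises InvalidSignature if the metadata was tampered with.
    private_key.public_key().verify(signature, metadata_bytes, pss,
                                    hashes.SHA256())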
Number Of Keys
--------------

The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed*
roles will need to support continuous delivery.  Even though their respective
keys will then need to be online, we will require that the keys be independent
of each other.  This allows each of the keys to be placed on separate servers
if need be, and prevents side channel attacks that compromise one key from
automatically compromising the rest of the keys.  Therefore, each of the
*timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* roles
MUST require (1, 1) keys.

The *unclaimed* role MAY delegate targets in an automated manner to a number
of roles called "bins", as we discussed in the previous section.  Each of the
"bin" roles SHOULD share the same key as the *unclaimed* role, both for the
space efficiency of the metadata and because there is no security advantage in
requiring separate keys.

The *root* role is critical for security and should very rarely be used.  It
is primarily used for key revocation, and it is the root of trust for all of
PyPI.  The *root* role signs for the keys that are authorized for each of the
top-level roles (including itself).  The keys belonging to the *root* role are
intended to be very well-protected and used with the least frequency of all
keys.  We propose that every PSF board member own a (strong) root key.  A
majority of them can then constitute the quorum to revoke or endow trust in
all top-level keys.  Alternatively, the system administrators of PyPI (instead
of PSF board members) could be responsible for signing for the *root* role.
Therefore, the *root* role SHOULD require (t, n) keys, where n is the number
of either all PyPI administrators or all PSF board members, and t > 1 (so that
at least two members must sign the *root* role).

The *targets* role will be used only to sign for the static delegation of all
targets to the *claimed*, *recently-claimed* and *unclaimed* roles.  Since
these target delegations must be secured against attacks in the event of a
compromise, the keys for the *targets* role MUST be offline and independent
from other keys.  For simplicity of key management without sacrificing
security, it is RECOMMENDED that the keys of the *targets* role be permanently
discarded as soon as they have been created and used to sign for the role.
Therefore, the *targets* role SHOULD require (1, 1) keys.  Again, this is
because the keys are going to be permanently discarded, and more offline keys
will not help against key recovery attacks [21]_ unless diversity of keys is
maintained.

Similarly, the *claimed* role will be used only to sign for the dynamic
delegation of projects to their respective developer keys.  Since these target
delegations must be secured against attacks in the event of a compromise, the
keys for the *claimed* role MUST be offline and independent from other keys.
Therefore, the *claimed* role SHOULD require (t, n) keys, where n is the
number of all PyPI administrators (in order to keep it manageable), and t >= 1
(so that at least one member MUST sign the *claimed* role).  While a stronger
threshold would indeed render the role more robust against a compromise of the
*claimed* keys (which is highly unlikely assuming that the keys are
independent and securely kept offline), we think that this trade-off is
acceptable for the important purpose of keeping the maintenance overhead for
PyPI administrators as low as possible.  At the time of writing, we are
keeping this point open for discussion by the distutils-sig community.
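In all of these cases, metadata signed by a (t, n) role is accepted only if at
least t distinct trusted keys produced valid signatures over it.
Schematically, and with the actual cryptographic verification left to a
caller-supplied function, the check is::

    def meets_threshold(metadata_bytes, signatures, trusted_keys, threshold,
                        verify_fn):
        """Count valid signatures from distinct trusted keys.

        `signatures` is a list of (keyid, signature) pairs, `trusted_keys`
        maps keyids to public keys, and `verify_fn(key, data, sig)` returns
        True for a valid signature.
        """
        valid = set()
        for keyid, signature in signatures:
            key = trusted_keys.get(keyid)
            if key is not None and verify_fn(key, metadata_bytes, signature):
                valid.add(keyid)
        return len(valid) >= threshold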
The number of developer keys is project-specific and thus beyond the scope of
this PEP.


Online and Offline Keys
-----------------------

In order to support continuous delivery, the *timestamp*,
*consistent-snapshot*, *recently-claimed* and *unclaimed* role keys MUST be
online.

As explained in the previous section, the *root*, *targets* and *claimed* role
keys MUST be offline for maximum security.  Developer keys will be offline in
the sense that the private keys MUST NOT be stored on PyPI, though some of
them may be online on the private infrastructure of the project.


Key Strength
------------

At the time of writing, we recommend that all RSA keys (both offline and
online) SHOULD have a minimum key size of 3072 bits for data-protection
lifetimes beyond 2030 [22]_.


Diversity Of Keys
-----------------

Due to the threats of weak key generation and implementation weaknesses [2]_,
the types of keys, as well as the libraries used to generate them, should vary
within TUF on PyPI.  Our current implementation of TUF supports multiple
digital signature algorithms such as RSA (with OpenSSL [23]_ or PyCrypto
[24]_) and ed25519 [25]_.  Furthermore, TUF supports the binding of other
cryptographic libraries that it does not immediately support "out of the box",
and so one MAY generate keys using other cryptographic libraries and use them
for TUF on PyPI.

As such, the *root* role keys SHOULD be generated by a variety of digital
signature algorithms as implemented by different cryptographic libraries.


Key Compromise Analysis
-----------------------

.. image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/table1.png

Table 1: Attacks possible by compromising certain combinations of role keys

Table 1 summarizes the kinds of attacks rendered possible by compromising a
threshold number of keys belonging to the TUF roles on PyPI.  Except for the
*timestamp* and *consistent-snapshot* roles, the pairwise interaction of role
compromises may be found by taking the union of both rows.

In September 2013, we showed how the latest version of pip at the time was
susceptible to these attacks and how TUF could protect users against them
[14]_.

An attacker who compromises developer keys for a project, and who is able to
somehow upload malicious metadata and targets to PyPI, will be able to serve
malicious updates to users of that project (and that project alone).  Note
that compromising *targets* or any delegated targets role (except for project
targets metadata) does not immediately endow the attacker with the ability to
serve malicious updates.  The attacker must also compromise the *timestamp*
and *consistent-snapshot* roles (which are both online and therefore more
likely to be compromised).  This means that in order to launch any attack, one
must not only be able to act as a man-in-the-middle but also compromise the
*timestamp* key (or the *root* keys and sign a new *timestamp* key).  To
launch any attack other than a freeze attack, one must also compromise the
*consistent-snapshot* key.

Finally, a compromise of the PyPI infrastructure MAY introduce malicious
updates to *recently-claimed* and *unclaimed* projects, because the keys for
those roles are online.  However, attackers cannot modify *claimed* projects
in such an event because *targets* and *claimed* metadata have been signed
with offline keys.
Therefore, it is RECOMMENDED that high-value projects register +their developer keys with PyPI and sign for their own distributions. + + +In the Event of a Key Compromise +-------------------------------- + +By a key compromise, we mean that the key as well as PyPI infrastructure has +been compromised and used to sign new metadata on PyPI. + +If a threshold number of developer keys of a project have been compromised, +then the project MUST take the following steps: + +1. The project metadata and targets MUST be restored to the last known good + consistent snapshot where the project was not known to be compromised. This + can be done by the developers repackaging and resigning all targets with the + new keys. + +2. The project delegated targets metadata MUST have their version numbers + incremented, expiry times suitably extended and signatures renewed. + +Whereas PyPI MUST take the following steps: + +1. Revoke the compromised developer keys from the delegation to the project by + the *recently-claimed* or *claimed* role. This is done by replacing the + compromised developer keys with newly issued developer keys. + +2. A new timestamped consistent snapshot MUST be issued. + +If a threshold number of *timestamp*, *consistent-snapshot*, *recently-claimed* +or *unclaimed* keys have been compromised, then PyPI MUST take the following +steps: + +1. Revoke the *timestamp*, *consistent-snapshot* and *targets* role keys from + the *root* role. This is done by replacing the compromised *timestamp*, + *consistent-snapshot* and *targets* keys with newly issued keys. + +2. Revoke the *recently-claimed* and *unclaimed* keys from the *targets* role + by replacing their keys with newly issued keys. Sign the new *targets* role + metadata and discard the new keys (because, as we explained earlier, this + increases the security of *targets* metadata). + +3. Clear all targets or delegations in the *recently-claimed* role and delete + all associated delegated targets metadata. Recently registered projects + SHOULD register their developer keys again with PyPI. + +4. All targets of the *recently-claimed* and *unclaimed* roles SHOULD be + compared with the last known good consistent snapshot where none of the + *timestamp*, *consistent-snapshot*, *recently-claimed* or *unclaimed* keys + were known to have been compromised. Added, updated or deleted targets in + the compromised consistent snapshot that do not match the last known good + consistent snapshot MAY be restored to their previous versions. After + ensuring the integrity of all *unclaimed* targets, the *unclaimed* metadata + MUST be regenerated. + +5. The *recently-claimed* and *unclaimed* metadata MUST have their version + numbers incremented, expiry times suitably extended and signatures renewed. + +6. A new timestamped consistent snapshot MUST be issued. + +This would preemptively protect all of these roles even though only one of them +may have been compromised. + +If a threshold number of the *targets* or *claimed* keys have been compromised, +then there is little that an attacker could do without the *timestamp* and +*consistent-snapshot* keys. In this case, PyPI MUST simply revoke the +compromised *targets* or *claimed* keys by replacing them with new keys in the +*root* and *targets* roles respectively. 
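The comparisons against the last known good consistent snapshot called for
above amount to diffing two mappings from target paths to hashes.  A simple
sketch, assuming each snapshot is summarized as a ``{target_path:
sha256_hex}`` dictionary, is::

    def diff_snapshots(last_known_good, current):
        """Report targets added, modified, or deleted relative to a good snapshot."""
        added = sorted(set(current) - set(last_known_good))
        deleted = sorted(set(last_known_good) - set(current))
        modified = sorted(path for path in set(current) & set(last_known_good)
                          if current[path] != last_known_good[path])
        return added, modified, deleted

Any target reported by such a comparison is a candidate for restoration to its
previous version before the affected metadata is regenerated.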
+ +If a threshold number of the *timestamp*, *consistent-snapshot* and *claimed* +keys have been compromised, then PyPI MUST take the following steps in addition +to the steps taken when either the *timestamp* or *consistent-snapshot* keys +are compromised: + +1. Revoke the *claimed* role keys from the *targets* role and replace them with + newly issued keys. + +2. All project targets of the *claimed* roles SHOULD be compared with the last + known good consistent snapshot where none of the *timestamp*, + *consistent-snapshot* or *claimed* keys were known to have been compromised. + Added, updated or deleted targets in the compromised consistent snapshot + that do not match the last known good consistent snapshot MAY be restored to + their previous versions. After ensuring the integrity of all *claimed* + project targets, the *claimed* metadata MUST be regenerated. + +3. The *claimed* metadata MUST have their version numbers incremented, expiry + times suitably extended and signatures renewed. + +If a threshold number of the *timestamp*, *consistent-snapshot* and *targets* +keys have been compromised, then PyPI MUST take the union of the steps taken +when the *claimed*, *recently-claimed* and *unclaimed* keys have been +compromised. + +If a threshold number of the *root* keys have been compromised, then PyPI MUST +take the steps taken when the *targets* role has been compromised as well as +replace all of the *root* keys. + +It is also RECOMMENDED that PyPI sufficiently document compromises with +security bulletins. These security bulletins will be most informative when +users of pip with TUF are unable to install or update a project because the +keys for the *timestamp*, *consistent-snapshot* or *root* roles are no longer +valid. They could then visit the PyPI web site to consult security bulletins +that would help to explain why they are no longer able to install or update, +and then take action accordingly. When a threshold number of *root* keys have +not been revoked due to a compromise, then new *root* metadata may be safely +updated because a threshold number of existing *root* keys will be used to sign +for the integrity of the new *root* metadata so that TUF clients will be able +to verify the integrity of the new *root* metadata with a threshold number of +previously known *root* keys. This will be the common case. Otherwise, in the +worst case where a threshold number of *root* keys have been revoked due to a +compromise, an end-user may choose to update new *root* metadata with +`out-of-band`__ mechanisms. + +__ https://en.wikipedia.org/wiki/Out-of-band#Authentication + + +Appendix: Rejected Proposals +============================ + + +Alternative Proposals for Producing Consistent Snapshots +-------------------------------------------------------- + +The complete file snapshot (CFS) scheme uses file system directories to store +efficient consistent snapshots over time. In this scheme, every consistent +snapshot will be stored in a separate directory, wherein files that are shared +with previous consistent snapshots will be `hard links`__ instead of copies. + +__ https://en.wikipedia.org/wiki/Hard_link + +The `differential file`__ snapshot (DFS) scheme is a variant of the CFS scheme, +wherein the next consistent snapshot directory will contain only the additions +of new files and updates to existing files of the previous consistent snapshot. +(The first consistent snapshot will contain a complete set of files known +then.) 
Deleted files will be marked as such in the next consistent snapshot
directory.  This means that files will be resolved in the following manner:
first, set the current consistent snapshot directory to be the latest
consistent snapshot directory.  Then, any requested file will be sought in the
current consistent snapshot directory.  If the file exists in the current
consistent snapshot directory, then that file will be returned.  If it has
been marked as deleted in the current consistent snapshot directory, then that
file will be reported as missing.  Otherwise, the current consistent snapshot
directory will be set to the preceding consistent snapshot directory and the
previous few steps will be repeated until there is no preceding consistent
snapshot to be considered, at which point the file will be reported as
missing.

__ http://dl.acm.org/citation.cfm?id=320484

With the CFS scheme, the trade-off is the I/O cost of producing a consistent
snapshot with the file system.  As of October 2013, we found that a fairly
modern computer with a 7200RPM hard disk drive required at least three minutes
to produce a consistent snapshot with the "cp -lr" command on the ext3__ file
system.  Perhaps the I/O costs of this scheme may be ameliorated with advanced
tools or file systems such as ZFS__ or btrfs__.

__ https://en.wikipedia.org/wiki/Ext3
__ https://en.wikipedia.org/wiki/ZFS
__ https://en.wikipedia.org/wiki/Btrfs

While the DFS scheme improves upon the CFS scheme in terms of producing faster
consistent snapshots, there are at least two trade-offs.  The first is that a
web server will need to be modified to perform the "daisy chain" resolution of
a file.  The second is that every now and then, the differential snapshots
will need to be "squashed" or merged together with the first consistent
snapshot to produce a new first consistent snapshot with the latest and
complete set of files.  Although the merge cost may be amortized over time,
this scheme is not conceptually simple.


References
==========

.. [1] https://pypi.python.org
.. [2] https://isis.poly.edu/~jcappos/papers/samuel_tuf_ccs_2010.pdf
.. [3] http://www.pip-installer.org
.. [4] https://wiki.python.org/moin/WikiAttack2013
.. [5] https://github.com/theupdateframework/pip/wiki/Attacks-on-software-repositories
.. [6] https://mail.python.org/pipermail/distutils-sig/2013-April/020596.html
.. [7] https://mail.python.org/pipermail/distutils-sig/2013-May/020701.html
.. [8] https://mail.python.org/pipermail/distutils-sig/2013-July/022008.html
.. [9] PEP 381, Mirroring infrastructure for PyPI, Ziadé, Löwis
   http://www.python.org/dev/peps/pep-0381/
.. [10] https://mail.python.org/pipermail/distutils-sig/2013-September/022773.html
.. [11] https://mail.python.org/pipermail/distutils-sig/2013-May/020848.html
.. [12] PEP 449, Removal of the PyPI Mirror Auto Discovery and Naming Scheme, Stufft
    http://www.python.org/dev/peps/pep-0449/
.. [13] https://isis.poly.edu/~jcappos/papers/cappos_mirror_ccs_08.pdf
.. [14] https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html
.. [15] https://pypi.python.org/security
.. [16] https://github.com/theupdateframework/tuf/blob/develop/docs/tuf-spec.txt
.. [17] PEP 426, Metadata for Python Software Packages 2.0, Coghlan, Holth, Stufft
    http://www.python.org/dev/peps/pep-0426/
.. [18] https://en.wikipedia.org/wiki/Continuous_delivery
.. [19] https://mail.python.org/pipermail/distutils-sig/2013-August/022154.html
..
[20] https://en.wikipedia.org/wiki/RSA_%28algorithm%29 +.. [21] https://en.wikipedia.org/wiki/Key-recovery_attack +.. [22] http://csrc.nist.gov/publications/nistpubs/800-57/SP800-57-Part1.pdf +.. [23] https://www.openssl.org/ +.. [24] https://pypi.python.org/pypi/pycrypto +.. [25] http://ed25519.cr.yp.to/ + + +Acknowledgements +================ + +Nick Coghlan, Daniel Holth and the distutils-sig community in general for +helping us to think about how to usably and efficiently integrate TUF with +PyPI. + +Roger Dingledine, Sebastian Hahn, Nick Mathewson, Martin Peck and Justin +Samuel for helping us to design TUF from its predecessor Thandy of the Tor +project. + +Konstantin Andrianov, Geremy Condra, Vladimir Diaz, Zane Fisher, Justin Samuel, +Tian Tian, Santiago Torres, John Ward, and Yuyu Zheng for helping us to develop +TUF. + +Vladimir Diaz, Monzur Muhammad and Sai Teja Peddinti for helping us to review +this PEP. + +Zane Fisher for helping us to review and transcribe this PEP. + + +Copyright +========= + +This document has been placed in the public domain. -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 19 12:44:54 2014 From: python-checkins at python.org (nick.coghlan) Date: Wed, 19 Nov 2014 11:44:54 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Split_PEP_458_into_two_distin?= =?utf-8?q?ct_PEPs?= Message-ID: <20141119114314.109162.47437@psf.io> https://hg.python.org/peps/rev/58644fa78931 changeset: 5602:58644fa78931 user: Nick Coghlan date: Wed Nov 19 21:43:04 2014 +1000 summary: Split PEP 458 into two distinct PEPs PEP 458 now focuses on content security (rather than the current transport-only security) between PyPI and end users. PEP 480 builds on PEP 458 to also provide end-to-end security that can fully handle a compromise of PyPI. files: pep-0458.txt | 1680 +++++++++++++++++++------------------ pep-0480.txt | 890 ++++++++++++++++++++ 2 files changed, 1737 insertions(+), 833 deletions(-) diff --git a/pep-0458.txt b/pep-0458.txt --- a/pep-0458.txt +++ b/pep-0458.txt @@ -2,10 +2,11 @@ Title: Surviving a Compromise of PyPI Version: $Revision$ Last-Modified: $Date$ -Author: Trishank Karthik Kuppusamy , - Donald Stufft , - Justin Cappos -Discussions-To: Distutils SIG +Author: Trishank Karthik Kuppusamy , + Vladimir Diaz , + Donald Stufft , Justin Cappos +BDFL-Delegate: Richard Jones +Discussions-To: DistUtils mailing list Status: Draft Type: Standards Track Content-Type: text/x-rst @@ -15,491 +16,632 @@ Abstract ======== -This PEP describes how the Python Package Index (PyPI [1]_) may be integrated -with The Update Framework [2]_ (TUF). TUF was designed to be a plug-and-play -security add-on to a software updater or package manager. TUF provides -end-to-end security like SSL, but for software updates instead of HTTP -connections. The framework integrates best security practices such as -separating responsibilities, adopting the many-man rule for signing packages, -keeping signing keys offline, and revocation of expired or compromised signing -keys. +This PEP proposes how the Python Package Index (PyPI [1]_) should be integrated +with The Update Framework [2]_ (TUF). TUF was designed to be a flexible +security add-on to a software updater or package manager. The framework +integrates best security practices such as separating role responsibilities, +adopting the many-man rule for signing packages, keeping signing keys offline, +and revocation of expired or compromised signing keys. 
For example, attackers +would have to steal multiple signing keys stored independently to compromise +a role responsible for specifying a repository's available files. Another role +responsible for indicating the latest snapshot of the repository may have to be +similarly compromised, and independent of the first compromised role. -The proposed integration will render modern package managers such as pip [3]_ -more secure against various types of security attacks on PyPI and protect users -against them. Even in the worst case where an attacker manages to compromise -PyPI itself, the damage is controlled in scope and limited in duration. +The proposed integration will allow modern package managers such as pip [3]_ to +be more secure against various types of security attacks on PyPI and protect +users from such attacks. Specifically, this PEP describes how PyPI processes +should be adapted to generate and incorporate TUF metadata (i.e., the minimum +security model). The minimum security model supports verification of PyPI +distributions that are signed with keys stored on PyPI: distributions uploaded +by developers are signed by PyPI, require no action from developers (other than +uploading the distribution), and are immediately available for download. The +minimum security model also minimizes PyPI administrative responsibilities by +automating much of the signing process. -Specifically, this PEP will describe how PyPI processes should be adapted to -incorporate TUF metadata. It will not prescribe how package managers such as -pip should be adapted to install or update with TUF metadata projects from -PyPI. +This PEP does not prescribe how package managers such as pip should be adapted +to install or update projects from PyPI with TUF metadata. Package managers +interested in adopting TUF on the client side may consult TUF's `library +documentation`__, which exists for this purpose. Support for project +distributions that are signed by developers (maximum security model) is also +not discussed in this PEP, but is outlined in the appendix as a possible future +extension and covered in detail in PEP X [VD: Link to PEP once it is +completed]. The PEP X extension focuses on the maximum security model, which +requires more PyPI administrative work (none by clients), but it also proposes +an easy-to-use key management solution for developers, how to interface with a +potential future build farm on PyPI infrastructure, and discusses the +feasibility of end-to-end signing. +__ https://github.com/theupdateframework/tuf/tree/develop/tuf/client#updaterpy -Rationale -========= + +Motivation +========== In January 2013, the Python Software Foundation (PSF) announced [4]_ that the python.org wikis for Python, Jython, and the PSF were subjected to a security -breach which caused all of the wiki data to be destroyed on January 5 2013. +breach that caused all of the wiki data to be destroyed on January 5, 2013. Fortunately, the PyPI infrastructure was not affected by this security breach. However, the incident is a reminder that PyPI should take defensive steps to protect users as much as possible in the event of a compromise. Attacks on -software repositories happen all the time [5]_. We must accept the possibility -of security breaches and prepare PyPI accordingly because it is a valuable -target used by thousands, if not millions, of people. +software repositories happen all the time [5]_. 
The PSF must accept the +possibility of security breaches and prepare PyPI accordingly because it is a +valuable resource used by thousands, if not millions, of people. -Before the wiki attack, PyPI used MD5 hashes to tell package managers such as -pip whether or not a package was corrupted in transit. However, the absence of -SSL made it hard for package managers to verify transport integrity to PyPI. -It was easy to launch a man-in-the-middle attack between pip and PyPI to change -package contents arbitrarily. This can be used to trick users into installing -malicious packages. After the wiki attack, several steps were proposed (some -of which were implemented) to deliver a much higher level of security than was -previously the case: requiring SSL to communicate with PyPI [6]_, restricting -project names [7]_, and migrating from MD5 to SHA-2 hashes [8]_. +Before the wiki attack, PyPI used MD5 hashes to tell package managers, such as +pip, whether or not a package was corrupted in transit. However, the absence +of SSL made it hard for package managers to verify transport integrity to PyPI. +It was therefore easy to launch a man-in-the-middle attack between pip and +PyPI, and change package content arbitrarily. Users could be tricked into +installing malicious packages with man-in-the-middle attacks. After the wiki +attack, several steps were proposed (some of which were implemented) to deliver +a much higher level of security than was previously the case: requiring SSL to +communicate with PyPI [6]_, restricting project names [7]_, and migrating from +MD5 to SHA-2 hashes [8]_. These steps, though necessary, are insufficient because attacks are still possible through other avenues. For example, a public mirror is trusted to honestly mirror PyPI, but some mirrors may misbehave due to malice or accident. Package managers such as pip are supposed to use signatures from PyPI to verify packages downloaded from a public mirror [9]_, but none are known to actually -do so [10]_. Therefore, it is also wise to add more security measures to +do so [10]_. Therefore, it would be wise to add more security measures to detect attacks from public mirrors or content delivery networks [11]_ (CDNs). Even though official mirrors are being deprecated on PyPI [12]_, there remain a -wide variety of other attack vectors on package managers [13]_. Among other -things, these attacks can crash client systems, cause obsolete packages to be -installed, or even allow an attacker to execute arbitrary code. In September -2013, we showed how the latest version of pip then was susceptible to these -attacks and how TUF could protect users against them [14]_. +wide variety of other attack vectors on package managers [13]_. These attacks +can crash client systems, cause obsolete packages to be installed, or even +allow an attacker to execute arbitrary code. In `September 2013`__, a post was +made to the Distutils mailing list showing that the latest version of pip (at +the time) was susceptible to such attacks, and how TUF could protect users +against them [14]_. Specifically, testing was done to see how pip would +respond to these attacks with and without TUF. Attacks tested included replay +and freeze, arbitrary packages, slow retrieval, and endless data. The post +also included a demonstration of how pip would respond if PyPI were +compromised. 
-Finally, PyPI allows for packages to be signed with GPG keys [15]_, although no -package manager is known to verify those signatures, thus negating much of the -benefits of having those signatures at all. Validating integrity through -cryptography is important, but issues such as immediate and secure key -revocation or specifying a required threshold number of signatures still -remain. Furthermore, GPG by itself does not immediately address the attacks -mentioned above. +__ https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html -In order to protect PyPI against infrastructure compromises, we propose -integrating PyPI with The Update Framework [2]_ (TUF). +With the intent to protect PyPI against infrastructure compromises, this PEP +proposes integrating PyPI with The Update Framework [2]_ (TUF). TUF helps +secure new or existing software update systems. Software update systems are +vulnerable to many known attacks, including those that can result in clients +being compromised or crashed. TUF solves these problems by providing a flexible +security framework that can be added to software updaters. + + +Threat Model +============ + +The threat model assumes the following: + +* Offline keys are safe and securely stored. + +* Attackers can compromise at least one of PyPI's trusted keys stored online, + and may do so at once or over a period of time. + +* Attackers can respond to client requests. + +An attacker is considered successful if they can cause a client to install (or +leave installed) something other than the most up-to-date version of the +software the client is updating. If the attacker is preventing the installation +of updates, they want clients to not realize there is anything wrong. Definitions =========== -The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", +The keywords "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this document are to be interpreted as described in RFC 2119__. __ http://www.ietf.org/rfc/rfc2119.txt -In order to keep this PEP focused solely on the application of TUF on PyPI, the -reader is assumed to already be familiar with the design principles of -TUF [2]_. It is also strongly RECOMMENDED that the reader be familiar with the -TUF specification [16]_. +This PEP focuses on integrating TUF with PyPI; however, the reader is +encouraged to read about TUF's design principles [2]_. It is also RECOMMENDED +that the reader be familiar with the TUF specification [16]_. + +Terms used in this PEP are defined as follows: * Projects: Projects are software components that are made available for - integration. Projects include Python libraries, frameworks, scripts, plugins, - applications, collections of data or other resources, and various + integration. Projects include Python libraries, frameworks, scripts, + plugins, applications, collections of data or other resources, and various combinations thereof. Public Python projects are typically registered on the Python Package Index [17]_. * Releases: Releases are uniquely identified snapshots of a project [17]_. -* Distributions: Distributions are the packaged files which are used to publish +* Distributions: Distributions are the packaged files that are used to publish and distribute a release [17]_. -* Simple index: The HTML page which contains internal links to the +* Simple index: The HTML page that contains internal links to the distributions of a project [17]_. 
+ +* Roles: There is one *root* role in PyPI. There are multiple roles whose + responsibilities are delegated to them directly or indirectly by the *root* + role. The term top-level role refers to the *root* role and any role + delegated by the *root* role. Each role has a single metadata file that it is + trusted to provide. + +* Metadata: Metadata are signed files that describe roles, other metadata, and + target files. + +* Repository: A repository is a resource compromised of named metadata and + target files. Clients request metadata and target files stored on a + repository. * Consistent snapshot: A set of TUF metadata and PyPI targets that capture the - complete state of all projects on PyPI as they were at some fixed point in + complete state of all projects on PyPI as they existed at some fixed point in time. -* The *consistent-snapshot* (*release*) role: In order to prevent confusion due - to the different meanings of the term "release" as employed by PEP 426 [17]_ - and the TUF specification [16]_, we rename the *release* role as the - *consistent-snapshot* role. - -* Continuous delivery: A set of processes with which PyPI produces consistent - snapshots that can safely coexist and deleted independently [18]_. - +* The *snapshot* (*release*) role: In order to prevent confusion due to the + different meanings of the term "release" used in PEP 426 [17]_ and the TUF + specification [16]_, the *release* role is renamed as the *snapshot* role. + * Developer: Either the owner or maintainer of a project who is allowed to - update the TUF metadata as well as distribution metadata and data for the + update the TUF metadata as well as distribution metadata and files for the project. -* Online key: A key that MUST be stored on the PyPI server infrastructure. - This is usually to allow automated signing with the key. However, this means - that an attacker who compromises PyPI infrastructure will be able to read - these keys. +* Online key: A private cryptographic key that MUST be stored on the PyPI + server infrastructure. This is usually to allow automated signing with the + key. However, an attacker who compromises the PyPI infrastructure will be + able to read these keys. -* Offline key: A key that MUST be stored off the PyPI infrastructure. This - prevents automated signing with the key. This means that an attacker who - compromises PyPI infrastructure will not be able to immediately read these - keys. +* Offline key: A private cryptographic key that MUST be stored independent of + the PyPI server infrastructure. This prevents automated signing with the + key. An attacker who compromises the PyPI infrastructure will not be able to + immediately read these keys. -* Developer key: A private key for which its corresponding public key is - registered with PyPI to say that it is responsible for directly signing for - or delegating the distributions belonging to a project. For the purposes of - this PEP, it is offline in the sense that the private key MUST not be stored - on PyPI. However, the project is free to require certain developer keys to - be online on its own infrastructure. +* Threshold signature scheme: A role can increase its resilience to key + compromises by specifying that at least t out of n keys are REQUIRED to sign + its metadata. A compromise of t-1 keys is insufficient to compromise the + role itself. Saying that a role requires (t, n) keys denotes the threshold + signature property. 
-* Threshold signature scheme: A role could increase its resilience to key - compromises by requiring that at least t out of n keys are REQUIRED to sign - its metadata. This means that a compromise of t-1 keys is insufficient to - compromise the role itself. We denote this property by saying that the role - requires (t, n) keys. +Overview of TUF +=============== -Overview -======== +At its highest level, TUF provides applications with a secure method of +obtaining files and knowing when new versions of files are available. On the +surface, this all sounds simple. The basic steps for updating applications are: -.. image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/figure1.png +* Knowing when an update exists. -Figure 1: A simplified overview of the roles in PyPI with TUF +* Downloading a correct copy of the latest version of an updated file. -Figure 1 shows a simplified overview of the roles that TUF metadata assume on -PyPI. The top-level *root* role signs for the keys of the top-level -*timestamp*, *consistent-snapshot*, *targets* and *root* roles. The -*timestamp* role signs for a new and consistent snapshot. The *consistent- -snapshot* role signs for the *root*, *targets* and all delegated targets -metadata. The *claimed* role signs for all projects that have registered their -own developer keys with PyPI. The *recently-claimed* role signs for all -projects that recently registered their own developer keys with PyPI. Finally, -the *unclaimed* role signs for all projects that have not registered developer -keys with PyPI. The *claimed*, *recently-claimed* and *unclaimed* roles are -numbered 1, 2, 3 respectively because a project will be searched for in each of -those roles in that descending order: first in *claimed*, then in -*recently-claimed* if necessary, and finally in *unclaimed* if necessary. +The problem is that updating applications is only simple when there are no +malicious activities in the picture. If an attacker is trying to interfere with +these seemingly simple steps, there is plenty they can do. -Every year, PyPI administrators are going to sign for *root* role keys. After -that, automation will continuously sign for a timestamped, consistent snapshot -of all projects. Every few months, PyPI administrators will move projects with -vetted developer keys from the *recently-claimed* role to the *claimed* role. -As we will soon see, they will sign for *claimed* with projects with offline -keys. +Assume a software updater takes the approach of most systems (at least the ones +that try to be secure). It downloads both the file it wants and a cryptographic +signature of the file. The software updater already knows which key it trusts +to make the signature. It checks that the signature is correct and was made by +this trusted key. Unfortunately, the software updater is still at risk in many +ways, including: -This PEP does not require project developers to use TUF to secure their -packages from attacks on PyPI. By default, all projects will be signed for by -the *unclaimed* role. If a project wishes stronger security guarantees, then -the project is strongly RECOMMENDED to register developer keys with PyPI so -that it may sign for its own distributions. By doing so, the project must -remain as a *recently-claimed* project until PyPI administrators have had an -opportunity to vet the developer keys of the project, after which the project -will be moved to the *claimed* role. 
+* An attacker keeps giving the software updater the same update file, so it + never realizes there is an update. -This PEP has **not** been designed to be backward-compatible for package -managers that do not use the TUF security protocol to install or update a -project from the PyPI described here. Instead, it is RECOMMENDED that PyPI -maintain a backward-compatible API of itself that does NOT offer TUF so that -older package managers that do not use TUF will be able to install or update -projects from PyPI as usual but without any of the security offered by TUF. -For the rest of this PEP, we will assume that PyPI will simultaneously maintain -a backward-incompatible API of itself for package managers that MUST use TUF to -securely install or update projects. We think that this approach represents a -reasonable trade-off: older package managers that do not TUF will still be able -to install or update projects without any TUF security from PyPI, and newer -package managers that do use TUF will be able to securely install or update -projects. At some point in the future, PyPI administrators MAY choose to -permanently deprecate the backward-compatible version of itself that does not -offer TUF metadata. +* An attacker gives the software updater an older, insecure version of a file + that it already has, so it downloads that one and blindly uses it thinking it + is newer. -Unless a mirror, CDN or the PyPI repository has been compromised, the end-user -will not be able to discern whether or not a package manager is using TUF to -install or update a project from PyPI. +* An attacker gives the software updater a newer version of a file it has but + it is not the newest one. The file is newer to the software updater, but it + may be insecure and exploitable by the attacker. +* An attacker compromises the key used to sign these files and now the software + updater downloads a malicious file that is properly signed. -Responsibility Separation +TUF is designed to address these attacks, and others, by adding signed metadata +(text files that describe the repository's files) to the repository and +referencing the metadata files during the update procedure. Repository files +are verified against the information included in the metadata before they are +handed off to the software update system. The framework also provides +multi-signature trust, explicit and implicit revocation of cryptograhic keys, +responsibility separation of the metadata, and minimizes key risk. For a full +list and outline of the repository attacks and software updater weaknesses +addressed by TUF, see Appendix A. + + +Integrating TUF with PyPI ========================= -Recall that TUF requires four top-level roles: *root*, *timestamp*, -*consistent-snapshot* and *targets*. The *root* role specifies the keys of all -the top-level roles (including itself). The *timestamp* role specifies the -latest consistent snapshot. The *consistent-snapshot* role specifies the -latest versions of all TUF metadata files (other than *timestamp*). The -*targets* role specifies available target files (in our case, it will be all -files on PyPI under the /simple and /packages directories). In this PEP, each -of these roles will serve their responsibilities without exception. +A software update system must complete two main tasks to integrate with TUF. +First, it must add the framework to the client side of the update system. For +example, TUF MAY be integrated with the pip package manager. 
Second, the +repository on the server side MUST be modified to provide signed TUF metadata. +This PEP is concerned with the second part of the integration, and the changes +required on PyPI to support software updates with TUF. -Our proposal offers two levels of security to developers. If developers opt in -to secure their projects with their own developer keys, then their projects -will be very secure. Otherwise, TUF will still protect them in many cases: -1. Minimum security (no action by a developer): protects *unclaimed* and - *recently-claimed* projects without developer keys from CDNs [19]_ or public - mirrors, but not from some PyPI compromises. This is because continuous - delivery requires some keys to be online. This level of security protects - projects from being accidentally or deliberately tampered with by a mirror - or a CDN because the mirror or CDN will not have any of the PyPI or - developer keys required to sign for projects. However, it would not protect - projects from attackers who have compromised PyPI because they will be able - to manipulate the TUF metadata for *unclaimed* projects with the appropriate - online keys. +What Additional Repository Files are Required on PyPI? +------------------------------------------------------ -2. Maximum security (developer signs their project): protects projects with - developer keys not only from CDNs or public mirrors, but also from some PyPI - compromises. This is because many important keys will be offline. This - level of security protects projects from being accidentally or deliberately - tampered with by a mirror or a CDN for reasons identical to the minimum - security level. It will also protect projects (or at least mitigate - damages) from the most likely attacks on PyPI. For example: given access to - online keys after a PyPI compromise, attackers will be able to freeze the - distributions for these projects, but they will not be able to serve - malicious distributions for these projects (not without compromising other - offline keys which would entail more risk, time and energy). Details for - the exact level of security offered is discussed in the section on key - management. +In order for package managers like pip to download and verify packages with +TUF, a few extra files MUST exist on PyPI. These extra repository files are +called TUF metadata. TUF metadata contains information such as which keys are +trustable, the cryptographic hashes of files, signatures to the metadata, +metadata version numbers, and the date after which the metadata should be +considered expired. -In order to complete support for continuous delivery, we propose three -delegated targets roles: +When a package manager wants to check for updates, it asks TUF to do the work. +That is, a package manager never has to deal with this additional metadata or +understand what's going on underneath. If TUF reports back that there are +updates available, a package manager can then ask TUF to download these files +from PyPI. TUF downloads them and checks them against the TUF metadata that it +also downloads from the repository. If the downloaded target files are +trustworthy, TUF then hands them over to the package manager. -1. *claimed*: Signs for the delegation of PyPI projects to their respective - developer keys. +The `Metadata`__ document provides information about each of the required +metadata and their expected content. The next section covers the different +kinds of metadata RECOMMENDED for PyPI. -2. 
*recently-claimed*: This role is almost identical to the *claimed* role and - could technically be performed by the *unclaimed* role, but there are two - important reasons why it exists independently: the first reason is to - improve the performance of looking up projects in the *unclaimed* role (by - moving metadata to the *recently-claimed* role instead), and the second - reason is to make it easier for PyPI administrators to move - *recently-claimed* projects to the *claimed* role. +__ https://github.com/theupdateframework/tuf/blob/develop/METADATA.md -3. *unclaimed*: Signs for PyPI projects without developer keys. -The *targets* role MUST delegate all PyPI projects to the three delegated -targets roles in the order of appearance listed above. This means that when -pip downloads with TUF a distribution from a project on PyPI, it will first -consult the *claimed* role about it. If the *claimed* role has delegated the -project, then pip will trust the project developers (in order of delegation) -about the TUF metadata for the project. Otherwise, pip will consult the -*recently-claimed* role about the project. If the *recently-claimed* role has -delegated the project, then pip will trust the project developers (in order of -delegation) about the TUF metadata for the project. Otherwise, pip will -consult the *unclaimed* role about the TUF metadata for the project. If the -*unclaimed* role has not delegated the project, then the project is considered -to be non-existent on PyPI. +PyPI and TUF Metadata +===================== -A PyPI project MAY begin without registering a developer key. Therefore, the -project will be signed for by the *unclaimed* role. After registering -developer keys, the project will be removed from the *unclaimed* role and -delegated to the *recently-claimed* role. After a probation period and a -vetting process to verify the developer keys of the project, the project will -be removed from the *recently-claimed* role and delegated to the *claimed* -role. +TUF metadata provides information that clients can use to make update +decisions. For example, a *targets* metadata lists the available distributions +on PyPI and includes the distribution's signatures, cryptographic hashes, and +file sizes. Different metadata files provide different information. The +various metadata files are signed by different roles, which are indicated by +the *root* role. The concept of roles allows TUF to delegate responsibilities +to multiple roles and minimizes the impact of a compromised role. -The *claimed* role offers maximum security, whereas the *recently-claimed* and -*unclaimed* role offer minimum security. All three roles support continuous -delivery of PyPI projects. +TUF requires four top-level roles. These are *root*, *timestamp*, *snapshot*, +and *targets*. The *root* role specifies the public cryptographic keys of the +top-level roles (including its own). The *timestamp* role references the +latest *snapshot* and can signify when a new snapshot of the repository is +available. The *snapshot* role indicates the latest version of all the TUF +metadata files (other than *timestamp*). The *targets* role lists the +available target files (in our case, it will be all files on PyPI under the +/simple and /packages directories). Each top-level role will serve its +responsibilities without exception. Figure 1 provides a table of the roles +used in TUF. 
-The *unclaimed* role offers minimum security because PyPI will sign for -projects without developer keys with an online key in order to permit -continuous delivery. +.. image:: figure1.png -The *recently-claimed* role offers minimum security because while the project -developers will sign for their own distributions with offline developer keys, -PyPI will sign with an online key the delegation of the project to those -offline developer keys. The signing of the delegation with an online key -allows PyPI administrators to continuously deliver projects without having to -continuously sign the delegation whenever one of those projects registers -developer keys. +Figure 1: An overview of the TUF roles. -Finally, the *claimed* role offers maximum security because PyPI will sign with -offline keys the delegation of a project to its offline developer keys. This -means that every now and then, PyPI administrators will vet developer keys and -sign the delegation of a project to those developer keys after being reasonably -sure about the ownership of the developer keys. The process for vetting -developer keys is out of the scope of this PEP. +Signing Metadata and Repository Management +------------------------------------------ -Metadata Management -=================== +The top-level *root* role signs for the keys of the top-level *timestamp*, +*snapshot*, *targets*, and *root* roles. The *timestamp* role signs for every +new snapshot of the repository metadata. The *snapshot* role signs for *root*, +*targets*, and all delegated roles. The *bins* roles (delegated roles) sign +for all distributions belonging to registered PyPI projects. -In this section, we examine the TUF metadata that PyPI must manage by itself, -and other TUF metadata that must be safely delegated to projects. Examples of -the metadata described here may be seen at our testbed mirror of -`PyPI-with-TUF`__. +Figure 2 provides an overview of the roles available within PyPI, which +includes the top-level roles and the roles delegated by *targets*. The figure +also indicates the types of keys used to sign each role and which roles are +trusted to sign for files available on PyPI. The next two sections cover the +details of signing repository files and the types of keys used for each role. -__ http://mirror1.poly.edu/ +.. image:: figure2.png -The metadata files that change most frequently will be *timestamp*, -*consistent-snapshot* and delegated targets (*claimed*, *recently-claimed*, -*unclaimed*, project) metadata. The *timestamp* and *consistent-snapshot* -metadata MUST be updated whenever *root*, *targets* or delegated targets -metadata are updated. Observe, though, that *root* and *targets* metadata are -much less likely to be updated as often as delegated targets metadata. -Therefore, *timestamp* and *consistent-snapshot* metadata will most likely be -updated frequently (possibly every minute) due to delegated targets metadata -being updated frequently in order to drive continuous delivery of projects. +Figure 2: An overview of the role metadata available on PyPI. -Consequently, the processes with which PyPI updates projects will have to be -updated accordingly, the details of which are explained in the following -subsections. +The roles that change most frequently are *timestamp*, *snapshot* and delegated +roles (*bins* and its delegated roles). The *timestamp* and *snapshot* +metadata MUST be updated whenever *root*, *targets* or delegated metadata are +updated. 
Observe, though, that *root* and *targets* metadata are much less
+likely to be updated as often as delegated metadata.  Therefore, *timestamp*
+and *snapshot* metadata will most likely be updated frequently (possibly every
+minute) due to delegated metadata being updated frequently in order to support
+continuous delivery of projects.  Continuous delivery is a set of processes
+that PyPI uses to produce snapshots that can safely coexist and be deleted
+independently of other snapshots [18]_.
+
+Every year, PyPI administrators SHOULD sign for *root* and *targets* role keys.
+Automation will continuously sign for a timestamped snapshot of all projects.
+A `repository management`__ tool is available that can sign metadata files,
+generate cryptographic keys, and manage a TUF repository.

-Why Do We Need Consistent Snapshots?
-------------------------------------

+__ https://github.com/theupdateframework/tuf/tree/develop/tuf#repository-management

-In an ideal world, metadata and data should be immediately updated and
-presented whenever a project is updated.  In practice, there will be problems
-when there are many readers and writers who access the same metadata or data at
-the same time.

-An important example at the time of writing is that, mirrors are very likely,
-as far as we can tell, to update in an inconsistent manner from PyPI as it is
-without TUF.  Specifically, a mirror would update itself in such a way that
-project A would be from time T, whereas project B would be from time T+5,
-project C would be from time T+3, and so on where T is the time that the mirror
-first begun updating itself.  There is no known way for a mirror to update
-itself such that it captures the state of all projects as they were at time T.

+How to Establish Initial Trust in the PyPI Root Keys
+----------------------------------------------------

-Adding TUF to PyPI will not automatically solve the problem.  Consider what we
-call the `"inverse replay" or "fast-forward" problem`__.  Suppose that PyPI has
-timestamped a consistent snapshot at version 1.  A mirror is later in the
-middle of copying PyPI at this snapshot.  While the mirror is copying PyPI at
-this snapshot, PyPI timestamps a new snapshot at, say, version 2.  Without
-accounting for consistency, the mirror would then find itself with a copy of
-PyPI in an inconsistent state which is indistinguishable from arbitrary
-metadata or target attacks.  The problem would also apply when the mirror is
-substituted with a pip user.

+Package managers like pip need to ship a file called "root.json" with the
+installation files that users initially download.  This includes information
+about the keys trusted for certain roles, as well as the root keys themselves.
+Any new version of "root.json" that clients may download is verified against
+the root keys that clients initially trust.  If a root key is compromised, but
+a threshold of keys are still secured, the PyPI administrator MUST push a new
+release that revokes trust in the compromised keys.  If a threshold of root
+keys are compromised, then "root.json" should be updated out-of-band; however,
+the threshold should be chosen so that this is extremely unlikely.  The TUF
+client library does not require manual intervention if root keys are revoked
+or added: the update process handles the cases where "root.json" has changed.

-__ https://groups.google.com/forum/#!topic/theupdateframework/8mkR9iqivQA

+To bundle the software, "root.json" MUST be included in the version of pip
+shipped with CPython (via ensurepip).
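As a point of reference only, the sketch below gives a rough idea of the shape
of such a bundled "root.json": it lists the public keys trusted for each
top-level role and the threshold of signatures each role requires, and it is
itself signed by the root keys.  The exact field names and layout are fixed by
the TUF metadata specification rather than by this PEP, and every key
identifier and key value below is a placeholder::

    # Abridged, illustrative sketch of a bundled "root.json" (placeholder
    # values; the authoritative format is defined by the TUF specification).
    ROOT_METADATA = {
        "signed": {
            "_type": "Root",
            "version": 1,
            "expires": "2015-11-01T00:00:00Z",  # root SHOULD expire in one year
            "keys": {
                # keyid -> public key, for every key referenced below
                "ROOT_KEYID_1":    {"keytype": "rsa", "keyval": {"public": "..."}},
                "ROOT_KEYID_2":    {"keytype": "rsa", "keyval": {"public": "..."}},
                "TIMESTAMP_KEYID": {"keytype": "rsa", "keyval": {"public": "..."}},
                "SNAPSHOT_KEYID":  {"keytype": "rsa", "keyval": {"public": "..."}},
                "TARGETS_KEYID":   {"keytype": "rsa", "keyval": {"public": "..."}},
            },
            "roles": {
                # which keys may sign each top-level role, and how many must
                "root":      {"keyids": ["ROOT_KEYID_1", "ROOT_KEYID_2"],
                              "threshold": 2},
                "timestamp": {"keyids": ["TIMESTAMP_KEYID"], "threshold": 1},
                "snapshot":  {"keyids": ["SNAPSHOT_KEYID"], "threshold": 1},
                "targets":   {"keyids": ["TARGETS_KEYID"], "threshold": 1},
            },
        },
        # signatures over "signed", made by a threshold of the root keys
        "signatures": [
            {"keyid": "ROOT_KEYID_1", "sig": "..."},
            {"keyid": "ROOT_KEYID_2", "sig": "..."},
        ],
    }

A client that already trusts this file accepts a newer "root.json" only if the
new file carries at least the listed threshold of valid signatures from root
keys the client already trusts.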
The TUF client library then loads the
+root metadata and downloads the rest of the roles, including updating
+"root.json" if it has changed.  An `outline of the update process`__ is
+available.

-Therefore, the problem can be summarized as such: there are problems of
-consistency on PyPI with or without TUF.  TUF requires its metadata to be
-consistent with the data, but how would the metadata be kept consistent with
-projects that change all the time?

+__ https://github.com/theupdateframework/tuf/tree/develop/tuf/client#overview-of-the-update-process

-As a result, we will solve for PyPI the problem of producing a consistent

+
+Minimum Security Model
+----------------------
+
+There are two security models to consider when integrating TUF with PyPI.  The
+one proposed in this PEP is the minimum security model, which supports
+verification of PyPI distributions that are signed with private cryptographic
+keys stored on PyPI.  Distributions uploaded by developers are signed by PyPI
+and immediately available for download.  A possible future extension to this
+PEP, discussed in Appendix B, proposes the maximum security model and allows a
+developer to sign for his/her project.  Developer keys are not stored online:
+therefore, projects are safe from PyPI compromises.
+
+The minimum security model requires no action from a developer and protects
+against malicious CDNs [19]_ and public mirrors.  To support continuous
+delivery of uploaded packages, PyPI signs for projects with an online key.
+This level of security prevents projects from being accidentally or
+deliberately tampered with by a mirror or a CDN because the mirror or CDN will
+not have any of the keys required to sign for projects.  However, it does not
+protect projects from attackers who have compromised PyPI, since attackers can
+manipulate TUF metadata using the keys stored online.
+
+This PEP proposes that the *bins* role (and its delegated roles) sign for all
+PyPI projects with an online key.  The *targets* role, which only signs with an
+offline key, MUST delegate all PyPI projects to the *bins* role.  This means
+that when a package manager such as pip (i.e., using TUF) downloads a
+distribution from a project on PyPI, it will consult the *bins* role about the
+TUF metadata for the project.  If no bin roles delegated by *bins* specify the
+project's distribution, then the project is considered to be non-existent on
+PyPI.
+
+
+Metadata Expiry Times
+---------------------
+
+The *root* and *targets* role metadata SHOULD expire in one year, because these
+two metadata files are expected to change very rarely.
+
+The *timestamp*, *snapshot*, and *bins* metadata SHOULD expire in one day
+because a CDN or mirror SHOULD synchronize itself with PyPI every day.
+Furthermore, this generous time frame also takes into account client clocks
+that are highly skewed or adrift.
+
+
+Metadata Scalability
+--------------------
+
+Due to the growing number of projects and distributions, TUF metadata will also
+grow correspondingly.  For example, consider the *bins* role.  In August 2013,
+it was found that the size of the *bins* metadata was about 42MB if the *bins*
+role itself signed for about 220K PyPI targets (which are simple indices and
+distributions).  This PEP does not delve into the details, but TUF features a
+so-called "`lazy bin walk`__" scheme that splits a large targets metadata file
+into many small ones.
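To make the idea of hash-partitioned bins concrete, here is a minimal sketch of
how a target path might be assigned to one of a fixed number of bin roles.  The
helper name, the bin-naming scheme, and the use of a simple modulus over the
hash are illustrative assumptions; only the general approach (route each target
to a small bin metadata file by the hash of its path) is taken from this
proposal::

    import hashlib

    NUMBER_OF_BINS = 1024   # the number of delegated bin roles recommended below

    def bin_for_target(target_path):
        """Map a target (e.g. a simple index or distribution path) to the
        delegated bin role that signs for it, using its SHA-256 hash."""
        digest = hashlib.sha256(target_path.encode("utf-8")).hexdigest()
        bin_index = int(digest, 16) % NUMBER_OF_BINS
        return "bin-{:04d}".format(bin_index)

    # Every target whose hash falls into the same bin lands in the same small
    # metadata file, so a client only has to fetch the one bin it needs.
    print(bin_for_target("packages/source/f/foo/foo-1.0.tar.gz"))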
+This splitting allows a TUF client updater to intelligently
+download only a small number of TUF metadata files in order to update any
+project signed for by the *bins* role.  For example, applying this scheme to
+the previous repository resulted in pip downloading between 1.3KB and 111KB to
+install or upgrade a PyPI project via TUF.
+
+__ https://github.com/theupdateframework/tuf/issues/39
+
+Based on our findings as of the time of writing, PyPI SHOULD split all targets
+in the *bins* role by delegating them to 1024 delegated roles, each of which
+would sign for PyPI targets whose hashes fall into that "bin" or delegated role
+(see Figure 2).  It was found that 1024 bins would result in the *bins*
+metadata, and each of its delegated roles, being about the same size (40-50KB)
+for about 220K PyPI targets (simple indices and distributions).
+
+It is possible to make TUF metadata more compact by representing it in a binary
+format as opposed to the JSON text format.  Nevertheless, a sufficiently large
+number of projects and distributions will introduce scalability challenges at
+some point, and therefore the *bins* role will still need delegations (as
+outlined in Figure 2) in order to address the problem.  Furthermore, the JSON
+format is an open and well-known standard for data interchange.  Due to the
+large number of delegated metadata files, compressed versions of *snapshot*
+metadata SHOULD also be made available to clients.
+
+
+PyPI and Key Requirements
+=========================
+
+In this section, the kinds of keys required to sign for TUF roles on PyPI are
+examined.  TUF is agnostic with respect to choices of digital signature
+algorithms.  For the purpose of discussion, it is assumed that most digital
+signatures will be produced with the well-tested and tried RSA algorithm [20]_.
+Nevertheless, we do NOT recommend any particular digital signature algorithm in
+this PEP because there are a few important constraints: first, cryptography
+changes over time; second, package managers such as pip may wish to perform
+signature verification in Python, without resorting to a compiled C library, in
+order to be able to run on as many systems as Python supports; and third, TUF
+recommends diversity of keys for certain applications.
+
+
+Number Of Keys Recommended
+--------------------------
+
+The *timestamp*, *snapshot*, and *bins* roles require continuous delivery.
+Even though their respective keys MUST be online, this PEP requires that the
+keys be independent of each other.  Different keys for online roles allow each
+of the keys to be placed on separate servers if need be, and prevent side
+channel attacks that compromise one key from automatically compromising the
+rest of the keys.  Therefore, each of the *timestamp*, *snapshot*, and *bins*
+roles MUST require (1, 1) keys.
+
+The *bins* role MAY delegate targets in an automated manner to a number of
+roles called "bins", as discussed in the previous section.  Each of the "bin"
+roles SHOULD share the same key as the *bins* role, due to space efficiency,
+and because there is no security advantage to requiring separate keys.
+
+The *root* role key is critical for security and should very rarely be used.
+It is primarily used for key revocation, and it is the locus of trust for all
+of PyPI.  The *root* role signs for the keys that are authorized for each of
+the top-level roles (including its own).  Keys belonging to the *root* role are
+intended to be very well-protected and used with the least frequency of all
+keys.
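Threshold requirements of this kind can be checked mechanically.  The
following sketch is a generic illustration, not an existing API:
``verify_signature`` is a caller-supplied stand-in for a real cryptographic
check of one signature over the role's signed content::

    def signed_by_threshold(role, signatures, verify_signature):
        """Return True if at least role["threshold"] distinct trusted keys
        produced a valid signature.

        `role` is a dict such as {"keyids": [...], "threshold": 2};
        `signatures` is a list of {"keyid": ..., "sig": ...} entries;
        `verify_signature(keyid, sig)` must perform the actual check.
        """
        valid_keyids = set()
        for signature in signatures:
            keyid = signature["keyid"]
            if keyid in role["keyids"] and verify_signature(keyid, signature["sig"]):
                valid_keyids.add(keyid)   # each trusted key counts only once
        return len(valid_keyids) >= role["threshold"]

For example, a role with a threshold of two is accepted only when two distinct
trusted keys have signed the same metadata.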
It is RECOMMENDED that every PSF board member own a (strong) root key.
+A majority of them can then constitute a quorum to revoke or endow trust in all
+top-level keys.  Alternatively, the system administrators of PyPI could be
+given responsibility for signing for the *root* role.  Therefore, the *root*
+role SHOULD require (t, n) keys, where n is the number of either all PyPI
+administrators or all PSF board members, and t > 1 (so that at least two
+members must sign the *root* role).
+
+The *targets* role will be used only to sign for the static delegation of all
+targets to the *bins* role.  Since these target delegations must be secured
+against attacks in the event of a compromise, the keys for the *targets* role
+MUST be offline and independent of other keys.  For simplicity of key
+management, without sacrificing security, it is RECOMMENDED that the keys of
+the *targets* role be permanently discarded as soon as they have been created
+and used to sign for the role.  Therefore, the *targets* role SHOULD require
+(1, 1) keys.  Again, this is because the keys are going to be permanently
+discarded and more offline keys will not help resist key recovery attacks [21]_
+unless diversity of keys is maintained.
+
+
+Online and Offline Keys Recommended for Each Role
+-------------------------------------------------
+
+In order to support continuous delivery, the *timestamp*, *snapshot*, and
+*bins* role keys MUST be online.
+
+As explained in the previous section, the *root* and *targets* role keys MUST
+be offline for maximum security: these keys will be offline in the sense that
+their private keys MUST NOT be stored on PyPI, though some of them MAY be
+online in the private infrastructure of the project.
+
+
+How Should Metadata be Generated?
+=================================
+
+Project developers expect the distributions they upload to PyPI to be
+immediately available for download.  Unfortunately, there will be problems when
+many readers and writers simultaneously access the same metadata and
+distributions.  That is, there needs to be a way to ensure consistency of
+metadata and repository files when multiple developers simultaneously change
+the same metadata or distributions.  There are also issues with consistency on
+PyPI without TUF, but the problem is more severe with signed metadata that MUST
+keep track of the files available on PyPI in real-time.
+
+Suppose that PyPI generates a *snapshot*, which indicates the latest version of
+all metadata except *timestamp*, at version 1, and a client requests this
+*snapshot* from PyPI.  While the client is busy downloading this *snapshot*,
+PyPI then timestamps a new snapshot at, say, version 2.  Without ensuring
+consistency of metadata, the client would find itself with a copy of *snapshot*
+that disagrees with what is available on PyPI, which is indistinguishable from
+arbitrary metadata injected by an attacker.  The problem would also occur for
+mirrors attempting to sync with PyPI.
+
+
+Consistent Snapshots
+--------------------
+
+There are problems with consistency on PyPI with or without TUF.  TUF requires
+that its metadata be consistent with the repository files, but how would the
+metadata be kept consistent with projects that change all the time?  As a
+result, this proposal MUST address the problem of producing a consistent
 snapshot that captures the state of all known projects at a given time.
Each -consistent snapshot can safely coexist with any other consistent snapshot and -deleted independently without affecting any other consistent snapshot. +snapshot should safely coexist with any other snapshot, and be able to be +deleted independently, without affecting any other snapshot. -The gist of the solution is that every metadata or data file written to disk -MUST include in its filename the `cryptographic hash`__ of the file. How would -this help clients which use the TUF protocol to securely and consistently -install or update a project from PyPI? +The solution presented in this PEP is that every metadata or data file managed +by PyPI and written to disk MUST include in its filename the `cryptographic +hash`__ of the file. How would this help clients that use the TUF protocol to +securely and consistently install or update a project from PyPI? __ https://en.wikipedia.org/wiki/Cryptographic_hash_function -Recall that the first step in the TUF protocol requires the client to download -the latest *timestamp* metadata. However, the client would not know in advance -the hash of the *timestamp* metadata file from the latest consistent snapshot. -Therefore, PyPI MUST redirect all HTTP GET requests for *timestamp* metadata to -the *timestamp* metadata file from the latest consistent snapshot. Since the -*timestamp* metadata is the root of a tree of cryptographic hashes pointing to -every other metadata or target file that are meant to exist together for -consistency, the client is then able to retrieve any file from this consistent -snapshot by deterministically including, in the request for the file, the hash -of the file in the filename. Assuming infinite disk space and no `hash -collisions`__, a client may safely read from one consistent snapshot while PyPI -produces another consistent snapshot. +The first step in the TUF protocol requires the client to download the latest +*timestamp* metadata. However, the client would not know in advance the hash +of the *timestamp* associated with the latest snapshot. Therefore, PyPI MUST +redirect all HTTP GET requests for *timestamp* to the *timestamp* referenced in +the latest snapshot. The *timestamp* role is the root of a tree of +cryptographic hashes that points to every other metadata that is meant to exist +together (i.e., clients request metadata in timestamp -> snapshot -> root -> +targets order). Clients are able to retrieve any file from this snapshot +by deterministically including, in the request for the file, the hash of the +file in the filename. Assuming infinite disk space and no `hash collisions`__, +a client may safely read from one snapshot while PyPI produces another +snapshot. __ https://en.wikipedia.org/wiki/Collision_(computer_science) -In this simple but effective manner, we are able to capture a consistent +In this simple but effective manner, PyPI is able to capture a consistent snapshot of all projects and the associated metadata at a given time. The next -subsection will explicate the implementation details of this idea. +subsection provides implementation details of this idea. + +Note: This PEP does not prohibit using advanced file systems or tools to +produce consistent snapshots. There are two important reasons for why this PEP +proposes the simple solution. First, the solution does not mandate that PyPI +use any particular file system or tool. Second, the generic file-system based +approach allows mirrors to use extant file transfer tools such as rsync to +efficiently transfer consistent snapshots from PyPI. 
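A minimal sketch of this hash-based naming, assuming the digest.filename
convention recommended in the next subsection and SHA-256 as the hash (the
helper names are illustrative)::

    import hashlib

    def consistent_filename(file_contents, filename):
        """Name a metadata or target file inside a consistent snapshot by
        prefixing the original filename with the hex digest of its contents."""
        digest = hashlib.sha256(file_contents).hexdigest()
        return "{}.{}".format(digest, filename)

    # A client already knows the expected hash of the file it wants (its
    # parent metadata lists it), so it can rewrite its request deterministically:
    def request_path(expected_digest, filename):
        return "{}.{}".format(expected_digest, filename)

    snapshot_bytes = b'{"signed": {"_type": "Snapshot"}, "signatures": []}'
    name = consistent_filename(snapshot_bytes, "snapshot.json")
    assert name == request_path(name.split(".", 1)[0], "snapshot.json")

Only requests for the *timestamp* metadata omit the digest, since its hash
cannot be known in advance; PyPI redirects those requests to the copy in the
latest snapshot, as described above.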
Producing Consistent Snapshots ------------------------------ -Given a project, PyPI is responsible for updating, depending on the project, -either the *claimed*, *recently-claimed* or *unclaimed* metadata as well as -associated delegated targets metadata. Every project MUST upload its set of -metadata and targets in a single transaction. We will call this set of files -the project transaction. We will discuss later how PyPI MAY validate the files -in a project transaction. For now, let us focus on how PyPI will respond to a -project transaction. We will call this response the project transaction -process. There will also be a consistent snapshot process that we will define -momentarily; for now, it suffices to know that project transaction processes -and the consistent snapshot process must coordinate with each other. +Given a project, PyPI is responsible for updating the *bins* metadata (roles +delegated by the *bins* role and signed with an online key). Every project +MUST upload its release in a single transaction. The uploaded set of files is +called the "project transaction". How PyPI MAY validate the files in a project +transaction is discussed in a later section. For now, the focus is on how PyPI +will respond to a project transaction. -Also, every metadata and target file MUST include in its filename the `hex -digest`__ of its `SHA-256`__ hash. For this PEP, it is RECOMMENDED that PyPI -adopt a simple convention of the form filename.digest.ext, where filename is -the original filename without a copy of the hash, digest is the hex digest of -the hash, and ext is the filename extension. +Every metadata and target file MUST include in its filename the `hex digest`__ +of its `SHA-256`__ hash. For this PEP, it is RECOMMENDED that PyPI adopt a +simple convention of the form: digest.filename, where filename is the original +filename without a copy of the hash, and digest is the hex digest of the hash. __ http://docs.python.org/2/library/hashlib.html#hashlib.hash.hexdigest __ https://en.wikipedia.org/wiki/SHA-2 -When an *unclaimed* project uploads a new transaction, a project transaction -process MUST add all new targets and relevant delegated *unclaimed* metadata. -(We will see later in this section why the *unclaimed* role will delegate -targets to a number of delegated *unclaimed* roles.) Finally, the project -transaction process MUST inform the consistent snapshot process about new -delegated *unclaimed* metadata. +When a project uploads a new transaction, the project transaction process MUST +add all new targets and relevant delegated *bins* metadata. (It is shown later +in this section why the *bins* role will delegate targets to a number of +delegated *bins* roles.) Finally, the project transaction process MUST inform +the snapshot process about new delegated *bins* metadata. -When a *recently-claimed* project uploads a new a transaction, a project -transaction process MUST add all new targets and delegated targets metadata for -the project. If the project is new, then the project transaction process MUST -also add new *recently-claimed* metadata with public keys and threshold number -(which MUST be part of the transaction) for the project. Finally, the project -transaction process MUST inform the consistent snapshot process about new -*recently-claimed* metadata as well as the current set of delegated targets -metadata for the project. - -The process for a *claimed* project is slightly different. 
The difference is -that PyPI administrators will choose to move the project from the -*recently-claimed* role to the *claimed* role. A project transaction process -MUST then add new *recently-claimed* and *claimed* metadata to reflect this -migration. As is the case for a *recently-claimed* project, the project -transaction process MUST always add all new targets and delegated targets -metadata for the *claimed* project. Finally, the project transaction process -MUST inform the consistent snapshot process about new *recently-claimed* or -*claimed* metadata as well as the current set of delegated targets metadata for -the project. - -Project transaction processes SHOULD be automated, except when PyPI -administrators move a project from the *recently-claimed* role to the *claimed* -role. Project transaction processes MUST also be applied atomically: either -all metadata and targets, or none of them, are added. The project transaction -processes and consistent snapshot process SHOULD work concurrently. Finally, -project transaction processes SHOULD keep in memory the latest *claimed*, -*recently-claimed* and *unclaimed* metadata so that they will be correctly -updated in new consistent snapshots. +Project transaction processes SHOULD be automated and MUST also be applied +atomically: either all metadata and targets -- or none of them -- are added. +The project transaction and snapshot processes SHOULD work concurrently. +Finally, project transaction processes SHOULD keep in memory the latest *bins* +metadata so that they will be correctly updated in new consistent snapshots. All project transactions MAY be placed in a single queue and processed serially. Alternatively, the queue MAY be processed concurrently in order of -appearance provided that the following rules are observed: +appearance, provided that the following rules are observed: 1. No pair of project transaction processes must concurrently work on the same project. 2. No pair of project transaction processes must concurrently work on - *unclaimed* projects that belong to the same delegated *unclaimed* targets + *bins* projects that belong to the same delegated *bins* targets role. -3. No pair of project transaction processes must concurrently work on new - *recently-claimed* projects. - -4. No pair of project transaction processes must concurrently work on new - *claimed* projects. - -5. No project transaction process must work on a new *claimed* project while - another project transaction process is working on a new *recently-claimed* - project and vice versa. - These rules MUST be observed so that metadata is not read from or written to inconsistently. -The consistent snapshot process is fairly simple and SHOULD be automated. The -consistent snapshot process MUST keep in memory the latest working set of -*root*, *targets* and delegated targets metadata. Every minute or so, the -consistent snapshot process will sign for this latest working set. (Recall -that project transaction processes continuously inform the consistent snapshot -process about the latest delegated targets metadata in a concurrency-safe -manner. The consistent snapshot process will actually sign for a copy of the -latest working set while the actual latest working set in memory will be -updated with information continuously communicated by project transaction -processes.) Next, the consistent snapshot process MUST generate and sign new -*timestamp* metadata that will vouch for the *consistent-snapshot* metadata -generated in the previous step. 
Finally, the consistent snapshot process MUST -add new *timestamp* and *consistent-snapshot* metadata representing the latest -consistent snapshot. + +Snapshot Process +---------------- + +The snapshot process is fairly simple and SHOULD be automated. The snapshot +process MUST keep in memory the latest working set of *root*, *targets*, and +delegated roles. Every minute or so, the snapshot process will sign for this +latest working set. (Recall that project transaction processes continuously +inform the snapshot process about the latest delegated metadata in a +concurrency-safe manner. The snapshot process will actually sign for a copy of +the latest working set while the latest working set in memory will be updated +with information that is continuously communicated by the project transaction +processes.) The snapshot process MUST generate and sign new *timestamp* +metadata that will vouch for the metadata (*root*, *targets*, and delegated +roles) generated in the previous step. Finally, the snapshot process MUST make +available to clients the new *timestamp* and *snapshot* metadata representing +the latest snapshot. A few implementation notes are now in order. So far, we have seen only that new metadata and targets are added, but not that old metadata and targets are @@ -508,30 +650,19 @@ use something like a "mark-and-sweep" algorithm to delete sufficiently old consistent snapshots: in order to preserve the latest consistent snapshot, PyPI would walk objects beginning from the root (*timestamp*) of the latest -consistent snapshot, mark all visited objects, and delete all unmarked -objects. The last few consistent snapshots may be preserved in a similar -fashion. Deleting a consistent snapshot will cause clients to see nothing -thereafter but HTTP 404 responses to any request for a file in that consistent -snapshot. Clients SHOULD then retry their requests with the latest consistent +consistent snapshot, mark all visited objects, and delete all unmarked objects. +The last few consistent snapshots may be preserved in a similar fashion. +Deleting a consistent snapshot will cause clients to see nothing except HTTP +404 responses to any request for a file within that consistent snapshot. +Clients SHOULD then retry (as before) their requests with the latest consistent snapshot. -We do **not** consider updates to any consistent snapshot because `hash -collisions`__ are out of the scope of this PEP. In case a hash collision is -observed, PyPI MAY wish to check that the file being added is identical to the -file already stored. (Should a hash collision be observed, it is far more -likely the case that the file is identical rather than being a genuine -`collision attack`__.) Otherwise, PyPI MAY either overwrite the existing file -or ignore any write operation to an existing file. - -__ https://en.wikipedia.org/wiki/Collision_(computer_science) -__ https://en.wikipedia.org/wiki/Collision_attack - All clients, such as pip using the TUF protocol, MUST be modified to download every metadata and target file (except for *timestamp* metadata) by including, -in the request for the file, the hash of the file in the filename. Following -the filename convention recommended earlier, a request for the file at -filename.ext will be transformed to the equivalent request for the file at -filename.digest.ext. +in the request for the file, the cryptographic hash of the file in the +filename. 
Following the filename convention recommended earlier, a request for
+the file at filename.ext will be transformed to the equivalent request for the
+file at digest.filename.

 Finally, PyPI SHOULD use a `transaction log`__ to record project transaction
 processes and queues so that it will be easier to recover from errors after a
@@ -540,487 +671,367 @@

 __ https://en.wikipedia.org/wiki/Transaction_log

-Metadata Validation
--------------------
+Key Compromise Analysis
+=======================

-A *claimed* or *recently-claimed* project will need to upload in its
-transaction to PyPI not just targets (a simple index as well as distributions)
-but also TUF metadata.  The project MAY do so by uploading a ZIP file
-containing two directories, /metadata/ (containing delegated targets metadata
-files) and /targets/ (containing targets such as the project simple index and
-distributions which are signed for by the delegated targets metadata).

+This PEP has covered the minimum security model, the TUF roles that should be
+added to support continuous delivery of distributions, and how to generate and
+sign the metadata of each role.  The remaining sections discuss how PyPI
+SHOULD audit repository metadata, and the methods PyPI can use to detect and
+recover from a PyPI compromise.

-Whenever the project uploads metadata or targets to PyPI, PyPI SHOULD check the
-project TUF metadata for at least the following properties:

+Table 1 summarizes a few of the attacks possible when a threshold number of
+private cryptographic keys (belonging to any of the PyPI roles) are
+compromised.  The leftmost column lists the roles (or a combination of roles)
+that have been compromised, and the columns to its right show whether the
+compromised roles leave clients susceptible to malicious updates, a freeze
+attack, or metadata inconsistency attacks.

-* A threshold number of the developers keys registered with PyPI by that
-  project MUST have signed for the delegated targets metadata file that
-  represents the "root" of targets for that project (e.g. metadata/targets/
-  project.txt).
++-----------------+-------------------+----------------+--------------------------------+ +| Role Compromise | Malicious Updates | Freeze Attack | Metadata Inconsistency Attacks | ++=================+===================+================+================================+ +| timestamp | NO | YES | NO | +| | snapshot and | limited by | snapshot needs to cooperate | +| | targets or any | earliest root, | | +| | of the bins need | targets, or | | +| | to cooperate | bin expiry | | +| | | time | | ++-----------------+-------------------+----------------+--------------------------------+ +| snapshot | NO | NO | NO | +| | timestamp and | timestamp | timestamp needs to cooperate | +| | targets or any of | needs to | | +| | the bins need to | cooperate | | +| | cooperate | | | ++-----------------+-------------------+----------------+--------------------------------+ +| timestamp | NO | YES | YES | +| **AND** | targets or any | limited by | limited by earliest root, | +| snapshot | of the bins need | earliest root, | targets, or bin metadata | +| | to cooperate | targets, or | expiry time | +| | | bin metadata | | +| | | expiry time | | ++-----------------+-------------------+----------------+--------------------------------+ +| targets | NO | NOT APPLICABLE | NOT APPLICABLE | +| **OR** | timestamp and | need timestamp | need timestamp and snapshot | +| bin | snapshot need to | and snapshot | | +| | cooperate | | | ++-----------------+-------------------+----------------+--------------------------------+ +| timestamp | YES | YES | YES | +| **AND** | | limited by | limited by earliest root, | +| snapshot | | earliest root, | targets, or bin metadata | +| **AND** | | targets, or | expiry time | +| bin | | bin metadata | | +| | | expiry time | | ++-----------------+-------------------+----------------+--------------------------------+ +| root | YES | YES | YES | ++-----------------+-------------------+----------------+--------------------------------+ -* The signatures of delegated targets metadata files MUST be valid. +Table 1: Attacks possible by compromising certain combinations of role keys. +In `September 2013`__, it was shown how the latest version (at the time) of pip +was susceptible to these attacks and how TUF could protect users against them +[14]_. -* The delegated targets metadata files MUST NOT be expired. +__ https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html -* The delegated targets metadata MUST be consistent with the targets. - -* A delegator MUST NOT delegate targets that were not delegated to itself by - another delegator. - -* A delegatee MUST NOT sign for targets that were not delegated to itself by a - delegator. - -* Every file MUST contain a unique copy of its hash in its filename following - the filename.digest.ext convention recommended earlier. - -If PyPI chooses to check the project TUF metadata, then PyPI MAY choose to -reject publishing any set of metadata or targets that do not meet these -requirements. - -PyPI MUST enforce access control by ensuring that each project can only write -to the TUF metadata for which it is responsible. It MUST do so by ensuring -that project transaction processes write to the correct metadata as well as -correct locations within those metadata. For example, a project transaction -process for an *unclaimed* project MUST write to the correct target paths in -the correct delegated *unclaimed* metadata for the targets of the project. 
- -On rare occasions, PyPI MAY wish to extend the TUF metadata format for projects -in a backward-incompatible manner. Note that PyPI will NOT be able to -automatically rewrite existing TUF metadata on behalf of projects in order to -upgrade the metadata to the new backward-incompatible format because this would -invalidate the signatures of the metadata as signed by developer keys. -Instead, package managers SHOULD be written to recognize and handle multiple -incompatible versions of TUF metadata so that *claimed* and *recently-claimed* -projects could be offered a reasonable time to migrate their metadata to newer -but backward-incompatible formats. - -The details of how each project manages its TUF metadata is beyond the scope of -this PEP. - - -Mirroring Protocol ------------------- - -The mirroring protocol as described in PEP 381 [9]_ SHOULD change to mirror -PyPI with TUF. - -A mirror SHOULD have to maintain for its clients only one consistent snapshot -which would represent the latest consistent snapshot from PyPI known to the -mirror. The mirror would then serve all HTTP requests for metadata or targets -by simply reading directly from this consistent snapshot directory. - -The mirroring protocol itself is fairly simple. The mirror would ask PyPI for -*timestamp* metadata from the latest consistent snapshot and proceed to copy -the entire consistent snapshot from the *timestamp* metadata onwards. If the -mirror encounters a failure to copy any metadata or target file while copying -the consistent snapshot, it SHOULD retrying resuming the copy of that -particular consistent snapshot. If PyPI has deleted that consistent snapshot, -then the mirror SHOULD delete the failed consistent snapshot and try -downloading the latest consistent snapshot instead. - -The mirror SHOULD point users to a previous consistent snapshot directory while -it is copying the latest consistent snapshot from PyPI. Only after the latest -consistent snapshot has been completely copied SHOULD the mirror switch clients -to the latest consistent snapshot. The mirror MAY then delete the previous -consistent snapshot once it finds that no client is reading from the previous -consistent snapshot. - -The mirror MAY use extant file transfer software such as rsync__ to mirror -PyPI. In that case, the mirror MUST first obtain the latest known timestamp -metadata from PyPI. The mirror MUST NOT immediately publish the latest known -timestamp metadata from PyPI. Instead, the mirror MUST first iteratively -transfer all new files from PyPI until there are no new files left to transfer. -Finally, the mirror MUST publish the latest known timestamp it fetched from -PyPI so that package managers such as pip may be directed to the latest -consistent snapshot known to the mirror. - -__ https://rsync.samba.org/ - - -Backup Process --------------- - -In order to be able to safely restore from static snapshots later in the event -of a compromise, PyPI SHOULD maintain a small number of its own mirrors to copy -PyPI consistent snapshots according to some schedule. The mirroring protocol -can be used immediately for this purpose. The mirrors must be secured and -isolated such that they are responsible only for mirroring PyPI. The mirrors -can be checked against one another to detect accidental or malicious failures. - - -Metadata Expiry Times ---------------------- - -The *root* and *targets* role metadata SHOULD expire in a year, because these -metadata files are expected to change very rarely. 
- -The *claimed* role metadata SHOULD expire in three to six months, because this -metadata is expected to be refreshed in that time frame. This time frame was -chosen to induce an easier administration process for PyPI. - -The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* role -metadata SHOULD expire in a day because a CDN or mirror SHOULD synchronize -itself with PyPI every day. Furthermore, this generous time frame also takes -into account client clocks that are highly skewed or adrift. - -The expiry times for the delegated targets metadata of a project is beyond the -scope of this PEP. - - -Metadata Scalability --------------------- - -Due to the growing number of projects and distributions, the TUF metadata will -also grow correspondingly. - -For example, consider the *unclaimed* role. In August 2013, we found that the -size of the *unclaimed* role metadata was about 42MB if the *unclaimed* role -itself signed for about 220K PyPI targets (which are simple indices and -distributions). We will not delve into details in this PEP, but TUF features a -so-called "`lazy bin walk`__" scheme which splits a large targets or delegated -targets metadata file into many small ones. This allows a TUF client updater -to intelligently download only a small number of TUF metadata files in order to -update any project signed for by the *unclaimed* role. For example, applying -this scheme to the previous repository resulted in pip downloading between -1.3KB and 111KB to install or upgrade a PyPI project via TUF. - -__ https://github.com/theupdateframework/tuf/issues/39 - -From our findings as of the time of writing, PyPI SHOULD split all targets in -the *unclaimed* role by delegating it to 1024 delegated targets role, each of -which would sign for PyPI targets whose hashes fall into that "bin" or -delegated targets role. We found that 1024 bins would result in the -*unclaimed* role metadata and each of its binned delegated targets role -metadata to be about the same size (40-50KB) for about 220K PyPI targets -(simple indices and distributions). - -It is possible to make the TUF metadata more compact by representing it in a -binary format as opposed to the JSON text format. Nevertheless, we believe -that a sufficiently large number of project and distributions will induce -scalability challenges at some point, and therefore the *unclaimed* role will -then still need delegations in order to address the problem. Furthermore, the -JSON format is an open and well-known standard for data interchange. - -Due to the large number of delegated target metadata files, compressed versions -of *consistent-snapshot* metadata SHOULD also be made available. - - -Key Management -============== - -In this section, we examine the kind of keys required to sign for TUF roles on -PyPI. TUF is agnostic with respect to choices of digital signature algorithms. -For the purpose of discussion, we will assume that most digital signatures will -be produced with the well-tested and tried RSA algorithm [20]_. Nevertheless, -we do NOT recommend any particular digital signature algorithm in this PEP -because there are a few important constraints: firstly, cryptography changes -over time; secondly, package managers such as pip may wish to perform signature -verification in Python, without resorting to a compiled C library, in order to -be able to run on as many systems as Python supports; finally, TUF recommends -diversity of keys for certain applications, and we will soon discuss these -exceptions. 
- - -Number Of Keys --------------- - -The *timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* -roles will need to support continuous delivery. Even though their respective -keys will then need to be online, we will require that the keys be independent -of each other. This allows for each of the keys to be placed on separate -servers if need be, and prevents side channel attacks that compromise one key -from automatically compromising the rest of the keys. Therefore, each of the -*timestamp*, *consistent-snapshot*, *recently-claimed* and *unclaimed* roles -MUST require (1, 1) keys. - -The *unclaimed* role MAY delegate targets in an automated manner to a number of -roles called "bins", as we discussed in the previous section. Each of the -"bin" roles SHOULD share the same key as the *unclaimed* role, due -simultaneously to space efficiency of metadata and because there is no security -advantage in requiring separate keys. - -The *root* role is critical for security and should very rarely be used. It is -primarily used for key revocation, and it is the root of trust for all of PyPI. -The *root* role signs for the keys that are authorized for each of the -top-level roles (including itself). The keys belonging to the *root* role are -intended to be very well-protected and used with the least frequency of all -keys. We propose that every PSF board member own a (strong) root key. A -majority of them can then constitute the quorum to revoke or endow trust in all -top-level keys. Alternatively, the system administrators of PyPI (instead of -PSF board members) could be responsible for signing for the *root* role. -Therefore, the *root* role SHOULD require (t, n) keys, where n is the number of -either all PyPI administrators or all PSF board members, and t > 1 (so that at -least two members must sign the *root* role). - -The *targets* role will be used only to sign for the static delegation of all -targets to the *claimed*, *recently-claimed* and *unclaimed* roles. Since -these target delegations must be secured against attacks in the event of a -compromise, the keys for the *targets* role MUST be offline and independent -from other keys. For simplicity of key management without sacrificing -security, it is RECOMMENDED that the keys of the *targets* role are permanently -discarded as soon as they have been created and used to sign for the role. -Therefore, the *targets* role SHOULD require (1, 1) keys. Again, this is -because the keys are going to be permanently discarded, and more offline keys -will not help against key recovery attacks [21]_ unless diversity of keys is -maintained. - -Similarly, the *claimed* role will be used only to sign for the dynamic -delegation of projects to their respective developer keys. Since these target -delegations must be secured against attacks in the event of a compromise, the -keys for the *claimed* role MUST be offline and independent from other keys. -Therefore, the *claimed* role SHOULD require (t, n) keys, where n is the number -of all PyPI administrators (in order to keep it manageable), and t ? 1 (so that -at least one member MUST sign the *claimed* role). While a stronger threshold -would indeed render the role more robust against a compromise of the *claimed* -keys (which is highly unlikely assuming that the keys are independent and -securely kept offline), we think that this trade-off is acceptable for the -important purpose of keeping the maintenance overhead for PyPI administrators -as little as possible. 
At the time of writing, we are keeping this point open -for discussion by the distutils-sig community. - -The number of developer keys is project-specific and thus beyond the scope of -this PEP. - - -Online and Offline Keys ------------------------ - -In order to support continuous delivery, the *timestamp*, -*consistent-snapshot*, *recently-claimed* and *unclaimed* role keys MUST be -online. - -As explained in the previous section, the *root*, *targets* and *claimed* role -keys MUST be offline for maximum security. Developers keys will be offline in -the sense that the private keys MUST NOT be stored on PyPI, though some of them -may be online on the private infrastructure of the project. - - -Key Strength ------------- - -At the time of writing, we recommend that all RSA keys (both offline and -online) SHOULD have a minimum key size of 3072 bits for data-protection -lifetimes beyond 2030 [22]_. - - -Diversity Of Keys ------------------ - -Due to the threats of weak key generation and implementation weaknesses [2]_, -the types of keys as well as the libraries used to generate them should vary -within TUF on PyPI. Our current implementation of TUF supports multiple -digital signature algorithms such as RSA (with OpenSSL [23]_ or PyCrypto [24]_) -and ed25519 [25]_. Furthermore, TUF supports the binding of other -cryptographic libraries that it does not immediately support "out of the box", -and so one MAY generate keys using other cryptographic libraries and use them -for TUF on PyPI. - -As such, the root role keys SHOULD be generated by a variety of digital -signature algorithms as implemented by different cryptographic libraries. - - -Key Compromise Analysis ------------------------ - -.. image:: https://raw.github.com/theupdateframework/pep-on-pypi-with-tuf/master/table1.png - -Table 1: Attacks possible by compromising certain combinations of role keys - - -Table 1 summarizes the kinds of attacks rendered possible by compromising a -threshold number of keys belonging to the TUF roles on PyPI. Except for the -*timestamp* and *consistent-snapshot* roles, the pairwise interaction of role -compromises may be found by taking the union of both rows. - -In September 2013, we showed how the latest version of pip then was susceptible -to these attacks and how TUF could protect users against them [14]_. - -An attacker who compromises developer keys for a project and who is able to -somehow upload malicious metadata and targets to PyPI will be able to serve -malicious updates to users of that project (and that project alone). Note that -compromising *targets* or any delegated targets role (except for project -targets metadata) does not immediately endow the attacker with the ability to -serve malicious updates. The attacker must also compromise the *timestamp* and -*consistent-snapshot* roles (which are both online and therefore more likely to -be compromised). This means that in order to launch any attack, one must be -not only be able to act as a man-in-the-middle but also compromise the -*timestamp* key (or the *root* keys and sign a new *timestamp* key). To launch -any attack other than a freeze attack, one must also compromise the -*consistent-snapshot* key. +Note that compromising *targets* or any delegated role (except for project +targets metadata) does not immediately allow an attacker to serve malicious +updates. The attacker must also compromise the *timestamp* and *snapshot* +roles (which are both online and therefore more likely to be compromised). 
+This means that in order to launch any attack, one must not only be able to +act as a man-in-the-middle but also compromise the *timestamp* key (or +compromise the *root* keys and sign a new *timestamp* key). To launch any +attack other than a freeze attack, one must also compromise the *snapshot* key. Finally, a compromise of the PyPI infrastructure MAY introduce malicious -updates to *recently-claimed* and *unclaimed* projects because the keys for -those roles are online. However, attackers cannot modify *claimed* projects in -such an event because *targets* and *claimed* metadata have been signed with -offline keys. Therefore, it is RECOMMENDED that high-value projects register -their developer keys with PyPI and sign for their own distributions. +updates to *bins* projects because the keys for these roles are online. The +maximum security model discussed in the appendix addresses this issue. PEP X +[VD: Link to PEP once it is completed] also covers the maximum security model +and goes into more detail on generating developer keys and signing uploaded +distributions. In the Event of a Key Compromise -------------------------------- -By a key compromise, we mean that the key as well as PyPI infrastructure has -been compromised and used to sign new metadata on PyPI. +A key compromise means that a threshold of keys (belonging to the metadata +roles on PyPI), as well as the PyPI infrastructure, have been compromised and +used to sign new metadata on PyPI. -If a threshold number of developer keys of a project have been compromised, -then the project MUST take the following steps: +If a threshold number of *timestamp*, *snapshot*, or *bins* keys have +been compromised, then PyPI MUST take the following steps: -1. The project metadata and targets MUST be restored to the last known good - consistent snapshot where the project was not known to be compromised. This - can be done by the developers repackaging and resigning all targets with the - new keys. +1. Revoke the *timestamp*, *snapshot* and *targets* role keys from + the *root* role. This is done by replacing the compromised *timestamp*, + *snapshot* and *targets* keys with newly issued keys. -2. The project delegated targets metadata MUST have their version numbers - incremented, expiry times suitably extended and signatures renewed. +2. Revoke the *bins* keys from the *targets* role by replacing their keys with + newly issued keys. Sign the new *targets* role metadata and discard the new + keys (because, as explained earlier, this increases the security of + *targets* metadata). -Whereas PyPI MUST take the following steps: - -1. Revoke the compromised developer keys from the delegation to the project by - the *recently-claimed* or *claimed* role. This is done by replacing the - compromised developer keys with newly issued developer keys. - -2. A new timestamped consistent snapshot MUST be issued. - -If a threshold number of *timestamp*, *consistent-snapshot*, *recently-claimed* -or *unclaimed* keys have been compromised, then PyPI MUST take the following -steps: - -1. Revoke the *timestamp*, *consistent-snapshot* and *targets* role keys from - the *root* role. This is done by replacing the compromised *timestamp*, - *consistent-snapshot* and *targets* keys with newly issued keys. - -2. Revoke the *recently-claimed* and *unclaimed* keys from the *targets* role - by replacing their keys with newly issued keys. 
Sign the new *targets* role - metadata and discard the new keys (because, as we explained earlier, this - increases the security of *targets* metadata). - -3. Clear all targets or delegations in the *recently-claimed* role and delete - all associated delegated targets metadata. Recently registered projects - SHOULD register their developer keys again with PyPI. - -4. All targets of the *recently-claimed* and *unclaimed* roles SHOULD be - compared with the last known good consistent snapshot where none of the - *timestamp*, *consistent-snapshot*, *recently-claimed* or *unclaimed* keys +3. All targets of the *bins* roles SHOULD be compared with the last known + good consistent snapshot where none of the *timestamp*, *snapshot*, or + *bins* keys were known to have been compromised. Added, updated or deleted targets in the compromised consistent snapshot that do not match the last known good consistent snapshot MAY be restored to their previous versions. After - ensuring the integrity of all *unclaimed* targets, the *unclaimed* metadata + ensuring the integrity of all *bins* targets, the *bins* metadata MUST be regenerated. -5. The *recently-claimed* and *unclaimed* metadata MUST have their version - numbers incremented, expiry times suitably extended and signatures renewed. +4. The *bins* metadata MUST have their version numbers incremented, expiry + times suitably extended, and signatures renewed. -6. A new timestamped consistent snapshot MUST be issued. +5. A new timestamped consistent snapshot MUST be issued. -This would preemptively protect all of these roles even though only one of them -may have been compromised. +Following these steps would preemptively protect all of these roles even though +only one of them may have been compromised. -If a threshold number of the *targets* or *claimed* keys have been compromised, -then there is little that an attacker could do without the *timestamp* and -*consistent-snapshot* keys. In this case, PyPI MUST simply revoke the -compromised *targets* or *claimed* keys by replacing them with new keys in the -*root* and *targets* roles respectively. - -If a threshold number of the *timestamp*, *consistent-snapshot* and *claimed* -keys have been compromised, then PyPI MUST take the following steps in addition -to the steps taken when either the *timestamp* or *consistent-snapshot* keys -are compromised: - -1. Revoke the *claimed* role keys from the *targets* role and replace them with - newly issued keys. - -2. All project targets of the *claimed* roles SHOULD be compared with the last - known good consistent snapshot where none of the *timestamp*, - *consistent-snapshot* or *claimed* keys were known to have been compromised. - Added, updated or deleted targets in the compromised consistent snapshot - that do not match the last known good consistent snapshot MAY be restored to - their previous versions. After ensuring the integrity of all *claimed* - project targets, the *claimed* metadata MUST be regenerated. - -3. The *claimed* metadata MUST have their version numbers incremented, expiry - times suitably extended and signatures renewed. - -If a threshold number of the *timestamp*, *consistent-snapshot* and *targets* -keys have been compromised, then PyPI MUST take the union of the steps taken -when the *claimed*, *recently-claimed* and *unclaimed* keys have been -compromised. 
- -If a threshold number of the *root* keys have been compromised, then PyPI MUST -take the steps taken when the *targets* role has been compromised as well as -replace all of the *root* keys. +If a threshold number of *root* keys have been compromised, then PyPI MUST take +the steps taken when the *targets* role has been compromised. All of the +*root* keys must also be replaced. It is also RECOMMENDED that PyPI sufficiently document compromises with security bulletins. These security bulletins will be most informative when -users of pip with TUF are unable to install or update a project because the -keys for the *timestamp*, *consistent-snapshot* or *root* roles are no longer -valid. They could then visit the PyPI web site to consult security bulletins -that would help to explain why they are no longer able to install or update, -and then take action accordingly. When a threshold number of *root* keys have -not been revoked due to a compromise, then new *root* metadata may be safely -updated because a threshold number of existing *root* keys will be used to sign -for the integrity of the new *root* metadata so that TUF clients will be able -to verify the integrity of the new *root* metadata with a threshold number of -previously known *root* keys. This will be the common case. Otherwise, in the -worst case where a threshold number of *root* keys have been revoked due to a +users of pip-with-TUF are unable to install or update a project because the +keys for the *timestamp*, *snapshot* or *root* roles are no longer valid. They +could then visit the PyPI web site to consult security bulletins that would +help to explain why they are no longer able to install or update, and then take +action accordingly. When a threshold number of *root* keys have not been +revoked due to a compromise, then new *root* metadata may be safely updated +because a threshold number of existing *root* keys will be used to sign for the +integrity of the new *root* metadata. TUF clients will be able to verify the +integrity of the new *root* metadata with a threshold number of previously +known *root* keys. This will be the common case. Otherwise, in the worst +case, where a threshold number of *root* keys have been revoked due to a compromise, an end-user may choose to update new *root* metadata with `out-of-band`__ mechanisms. __ https://en.wikipedia.org/wiki/Out-of-band#Authentication -Appendix: Rejected Proposals -============================ +Auditing Snapshots +------------------ +If a malicious party compromises PyPI, they can sign arbitrary files with any +of the online keys. The roles with offline keys (i.e., *root* and *targets*) +are still protected. To safely recover from a repository compromise, snapshots +should be audited to ensure files are only restored to trusted versions. -Alternative Proposals for Producing Consistent Snapshots --------------------------------------------------------- +When a repository compromise has been detected, the integrity of three types of +information must be validated: -The complete file snapshot (CFS) scheme uses file system directories to store -efficient consistent snapshots over time. In this scheme, every consistent -snapshot will be stored in a separate directory, wherein files that are shared -with previous consistent snapshots will be `hard links`__ instead of copies. +1. If the online keys of the repository have been compromised, they can be + revoked by having the *targets* role sign new metadata delegating to a new + key. 
-__ https://en.wikipedia.org/wiki/Hard_link +2. If the role metadata on the repository has been changed, this would impact + the metadata that is signed by online keys. Any role information created + since the last period should be discarded. As a result, developers of new + projects will need to re-register their projects. -The `differential file`__ snapshot (DFS) scheme is a variant of the CFS scheme, -wherein the next consistent snapshot directory will contain only the additions -of new files and updates to existing files of the previous consistent snapshot. -(The first consistent snapshot will contain a complete set of files known -then.) Deleted files will be marked as such in the next consistent snapshot -directory. This means that files will be resolved in this manner: First, set -the current consistent snapshot directory to be the latest consistent snapshot -directory. Then, any requested file will be seeked in the current consistent -snapshot directory. If the file exists in the current consistent snapshot -directory, then that file will be returned. If it has been marked as deleted -in the current consistent snapshot directory, then that file will be reported -as missing. Otherwise, the current consistent snapshot directory will be set -to the preceding consistent snapshot directory and the previous few steps will -be iterated until there is no preceding consistent snapshot to be considered, -at which point the file will be reported as missing. +3. If the packages themselves may have been tampered with, they can be + validated using the stored hash information for packages that existed at the + time of the last period. -__ http://dl.acm.org/citation.cfm?id=320484 +In order to safely restore snapshots in the event of a compromise, PyPI SHOULD +maintain a small number of its own mirrors to copy PyPI snapshots according to +some schedule. The mirroring protocol can be used immediately for this +purpose. The mirrors must be secured and isolated such that they are +responsible only for mirroring PyPI. The mirrors can be checked against one +another to detect accidental or malicious failures. -With the CFS scheme, the trade-off is the I/O costs of producing a consistent -snapshot with the file system. As of October 2013, we found that a fairly -modern computer with a 7200RPM hard disk drive required at least three minutes -to produce a consistent snapshot with the "cp -lr" command on the ext3__ file -system. Perhaps the I/O costs of this scheme may be ameliorated with advanced -tools or file systems such as ZFS__ or btrfs__. +Another approach is to generate the cryptographic hash of *snapshot* +periodically and tweet it. Perhaps a user comes forward with the actual +metadata and the repository maintainers can verify the metadata's cryptographic +hash. Alternatively, PyPI may periodically archive its own versions of +*snapshot* rather than rely on externally provided metadata. In this case, +PyPI SHOULD take the cryptographic hash of every package on the repository and +store this data on an offline device. If any package hash has changed, this +indicates an attack. -__ https://en.wikipedia.org/wiki/Ext3 -__ https://en.wikipedia.org/wiki/ZFS -__ https://en.wikipedia.org/wiki/Btrfs +As for attacks that serve different versions of metadata, or freeze a version +of a package at a specific version, they can be handled by TUF with techniques +like implicit key revocation and metadata mismatch detection [81]. 
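For illustration, the offline hash record described above can be as simple as
a manifest generated on a trusted machine and re-checked later. The directory
layout, file names, and manifest format in this sketch are assumptions made
for the example, not part of the PEP::

    import hashlib
    import json
    from pathlib import Path

    PACKAGE_DIR = Path("packages")          # local copy of the repository's targets
    MANIFEST = Path("package-hashes.json")  # written once, then moved offline

    def sha256_of(path):
        digest = hashlib.sha256()
        with path.open("rb") as f:
            for block in iter(lambda: f.read(8192), b""):
                digest.update(block)
        return digest.hexdigest()

    def write_manifest():
        # Hash every package once and store the result on an offline device.
        hashes = {str(p): sha256_of(p)
                  for p in sorted(PACKAGE_DIR.rglob("*")) if p.is_file()}
        MANIFEST.write_text(json.dumps(hashes, indent=2, sort_keys=True))

    def audit(manifest_path=MANIFEST):
        # Later, re-hash the live repository and flag anything that changed.
        recorded = json.loads(manifest_path.read_text())
        for name, old_digest in sorted(recorded.items()):
            path = Path(name)
            if not path.exists() or sha256_of(path) != old_digest:
                print("possible tampering:", name)

Running ``write_manifest()`` before archiving the manifest, and ``audit()``
during a post-compromise review, reproduces the check described above; a
mismatch only shows that a file changed, and deciding whether the change was
legitimate still requires the last known good consistent snapshot.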
-While the DFS scheme improves upon the CFS scheme in terms of producing faster
-consistent snapshots, there are at least two trade-offs. The first is that a
-web server will need to be modified to perform the "daisy chain" resolution of
-a file. The second is that every now and then, the differential snapshots will
-need to be "squashed" or merged together with the first consistent snapshot to
-produce a new first consistent snapshot with the latest and complete set of
-files. Although the merge cost may be amortized over time, this scheme is not
-conceptually si
+Appendix A: Repository Attacks Prevented by TUF
+===============================================
+
+* **Arbitrary software installation**: An attacker installs anything they want
+  on the client system. That is, an attacker can provide arbitrary files in
+  response to download requests and the files will not be detected as
+  illegitimate.
+
+* **Rollback attacks**: An attacker presents a software update system with
+  older files than those the client has already seen, causing the client to use
+  files older than those the client knows about.
+
+* **Indefinite freeze attacks**: An attacker continues to present a software
+  update system with the same files the client has already seen. The result is
+  that the client does not know that new files are available.
+
+* **Endless data attacks**: An attacker responds to a file download request
+  with an endless stream of data, causing harm to clients (e.g., a disk
+  partition filling up or memory exhaustion).
+
+* **Slow retrieval attacks**: An attacker responds to clients with a very slow
+  stream of data that essentially results in the client never continuing the
+  update process.
+
+* **Extraneous dependencies attacks**: An attacker indicates to clients that in
+  order to install the software they wanted, they also need to install
+  unrelated software. This unrelated software can be from a trusted source
+  but may have known vulnerabilities that are exploitable by the attacker.
+
+* **Mix-and-match attacks**: An attacker presents clients with a view of a
+  repository that includes files that never existed together on the repository
+  at the same time. This can result in, for example, outdated versions of
+  dependencies being installed.
+
+* **Wrong software installation**: An attacker provides a client with a trusted
+  file that is not the one the client wanted.
+
+* **Malicious mirrors preventing updates**: An attacker in control of one
+  repository mirror is able to prevent users from obtaining updates from
+  other, good mirrors.
+
+* **Vulnerability to key compromises**: An attacker who is able to compromise a
+  single key or less than a given threshold of keys can compromise clients.
+  This includes relying on a single online key (such as only being protected
+  by SSL) or a single offline key (such as most software update systems use
+  to sign files).
+
+
+Appendix B: Extension to the Minimum Security Model
+===================================================
+
+The maximum security model and end-to-end signing have been intentionally
+excluded from this PEP. Although both improve PyPI's ability to survive a
+repository compromise and allow developers to sign their distributions, they
+have been postponed for review as a potential future extension to PEP 458. PEP
+X [VD: Link to PEP once it is completed], which discusses the extension in
+detail, is available for review to those developers interested in the
+end-to-end signing option.
The maximum security model and end-to-end signing +are briefly covered in subsections that follow. + +There are several reasons for not initially supporting the features discussed +in this section: + +1. A build farm (distribution wheels on supported platforms are generated for + each project on PyPI infrastructure) may possibly complicate matters. PyPI + wants to support a build farm in the future. Unfortunately, if wheels are + auto-generated externally, developer signatures for these wheels are + unlikely. However, there might still be a benefit to generating wheels from + source distributions that are signed by developers (provided that + reproducible wheels are possible). Another possibility is to optionally + delegate trust of these wheels to an online role. + +2. An easy-to-use key management solution is needed for developers. + `miniLock`__ is one likely candidate for management and generation of keys. + Although developer signatures can remain optional, this approach may be + inadequate due to the great number of potentially unsigned dependencies each + distribution may have. If any one of these dependencies is unsigned, it + negates any benefit the project gains from signing its own distribution + (i.e., attackers would only need to compromise one of the unsigned + dependencies to attack end-users). Requiring developers to manually sign + distributions and manage keys is expected to render key signing an unused + feature. + + __ https://minilock.io/ + +3. A two-phase approach, where the minimum security model is implemented first + followed by the maximum security model, can simplify matters and give PyPI + administrators time to review the feasibility of end-to-end signing. + + +Maximum Security Model +---------------------- + +The maximum security model relies on developers signing their projects and +uploading signed metadata to PyPI. If the PyPI infrastructure were to be +compromised, attackers would be unable to serve malicious versions of claimed +projects without access to the project's developer key. Figure 3 depicts the +changes made to figure 2, namely that developer roles are now supported and +that three new delegated roles exist: *claimed*, *recently-claimed*, and +*unclaimed*. The *bins* role has been renamed *unclaimed* and can contain any +projects that have not been added to *claimed*. The strength of this model +(over the minimum security model) is in the offline keys provided by +developers. Although the minimum security model supports continuous delivery, +all of the projects are signed by an online key. An attacker can corrupt +packages in the minimum security model, but not in the maximum model without +also compromising a developer's key. + +.. image:: figure3.png + +Figure 3: An overview of the metadata layout in the maximum security model. +The maximum security model supports continuous delivery and survivable key +compromise. + + +End-to-End Signing +------------------ + +End-to-End signing allows both PyPI and developers to sign for the metadata +downloaded by clients. PyPI is trusted to make uploaded projects available to +clients (they sign the metadata for this part of the process), and developers +can sign the distributions that they upload. + +PEP X [VD: Link to PEP once it is completed] discusses the tools available to +developers who sign the distributions that they upload to PyPI. 
To summarize +PEP X, developers generate cryptographic keys and sign metadata in some +automated fashion, where the metadata includes the information required to +verify the authenticity of the distribution. The metadata is then uploaded to +PyPI by the client, where it will be available for download by package managers +such as pip (i.e., package managers that support TUF metadata). The entire +process is transparent to clients (using a package manager that supports TUF) +who download distributions from PyPI. + + +Appendix C: PEP 470 and Projects Hosted Externally +================================================== + +How should TUF handle distributions that are not hosted on PyPI? According to +`PEP 470`__, projects may opt to host their distributions externally and are +only required to provide PyPI a link to its external index, which package +managers like pip can use to find the project's distributions. PEP 470 does +not mention whether externally hosted projects are considered unverified by +default, as projects that use this option are not required to submit any +information about their distributions (e.g., file size and cryptographic hash) +when the project is registered, nor include a cryptographic hash of the file +in download links. + +__ http://www.python.org/dev/peps/pep-0470/ + +Potentional approaches that PyPI administrators MAY consider to handle +projects hosted externally: + +1. Download external distributions but do not verify them. The targets + metadata will not include information for externally hosted projects. + +2. PyPI will periodically download information from the external index. PyPI + will gather the external distribution's file size and hashes and generate + appropriate TUF metadata. + +3. External projects MUST submit to PyPI the file size and cryptographic hash + for a distribution. + +4. External projects MUST upload to PyPI a developer public key for the + index. The distribution MUST create TUF metadata that is stored at the + index, and signed with the developer's corresponding private key. The + client will fetch the external TUF metadata as part of the package + update process. + +5. External projects MUST upload to PyPI signed TUF metadata (as allowed by + the maximum security model) about the distributions that they host + externally, and a developer public key. Package managers verify + distributions by consulting the signed metadata uploaded to PyPI. + +Only one of the options listed above should be implemented on PyPI. Option +(4) or (5) is RECOMMENDED because external distributions are signed by +developers. External distributions that are forged (due to a compromised +PyPI account or external host) may be detected if external developers are +required to sign metadata, although this requirement is likely only practical +if an easy-to-use key management solution and developer scripts are provided +by PyPI. References @@ -1055,27 +1066,30 @@ .. [24] https://pypi.python.org/pypi/pycrypto .. [25] http://ed25519.cr.yp.to/ - Acknowledgements ================ -Nick Coghlan, Daniel Holth and the distutils-sig community in general for -helping us to think about how to usably and efficiently integrate TUF with +This material is based upon work supported by the National Science Foundation +under Grants No. CNS-1345049 and CNS-0959138. Any opinions, findings, and +conclusions or recommendations expressed in this material are those of the +author(s) and do not necessarily reflect the views of the National Science +Foundation. 
+ +We thank Nick Coghlan, Daniel Holth and the distutils-sig community in general +for helping us to think about how to usably and efficiently integrate TUF with PyPI. -Roger Dingledine, Sebastian Hahn, Nick Mathewson, Martin Peck and Justin -Samuel for helping us to design TUF from its predecessor Thandy of the Tor -project. +Roger Dingledine, Sebastian Hahn, Nick Mathewson, Martin Peck and Justin Samuel +helped us to design TUF from its predecessor Thandy of the Tor project. -Konstantin Andrianov, Geremy Condra, Vladimir Diaz, Zane Fisher, Justin Samuel, -Tian Tian, Santiago Torres, John Ward, and Yuyu Zheng for helping us to develop -TUF. +We appreciate the efforts of Konstantin Andrianov, Geremy Condra, Zane Fisher, +Justin Samuel, Tian Tian, Santiago Torres, John Ward, and Yuyu Zheng to to +develop TUF. -Vladimir Diaz, Monzur Muhammad and Sai Teja Peddinti for helping us to review -this PEP. +Vladimir Diaz, Monzur Muhammad and Sai Teja Peddinti helped us to review this +PEP. -Zane Fisher for helping us to review and transcribe this PEP. - +Zane Fisher helped us to review and transcribe this PEP. Copyright ========= diff --git a/pep-0480.txt b/pep-0480.txt new file mode 100644 --- /dev/null +++ b/pep-0480.txt @@ -0,0 +1,890 @@ +PEP: 480 +Title: Surviving a Compromise of PyPI: The Maximum Security Model +Version: $Revision$ +Last-Modified: $Date$ +Author: Trishank Karthik Kuppusamy , + Vladimir Diaz , Donald Stufft , + Justin Cappos +BDFL-Delegate: Richard Jones +Discussions-To: DistUtils mailing list +Status: Draft +Type: Standards Track +Content-Type: text/x-rst +Requires: 458 +Created: 8-Oct-2014 + + +Abstract +======== + +Proposed is an extension to PEP 458 that adds support for end-to-end signing +and the maximum security model. End-to-end signing allows both PyPI and +developers to sign for the distributions that are downloaded by clients. The +minimum security model proposed by PEP 458 supports continuous delivery of +distributions (because they are signed by online keys), but that model does not +protect distributions in the event that PyPI is compromised. In the minimum +security model, attackers may sign for malicious distributions by compromising +the signing keys stored on PyPI infrastructure. The maximum security model, +described in this PEP, retains the benefits of PEP 458 (e.g., immediate +availability of distributions that are uploaded to PyPI), but additionally +ensures that end-users are not at risk of installing forged software if PyPI is +compromised. + +This PEP discusses the changes made to PEP 458 but excludes its informational +elements to primarily focus on the maximum security model. For example, an +overview of The Update Framework or the basic mechanisms in PEP 458 are not +covered here. The changes to PEP 458 include modifications to the snapshot +process, key compromise analysis, auditing snapshots, and the steps that should +be taken in the event of a PyPI compromise. The signing and key management +process that PyPI MAY RECOMMEND is discussed but not strictly defined. How the +release process should be implemented to manage keys and metadata is left to +the implementors of the signing tools. That is, this PEP delineates the +expected cryptographic key type and signature format included in metadata that +MUST be uploaded by developers in order to support end-to-end verification of +distributions. + + +Rationale +========= + +PEP 458 [1]_ proposes how PyPI should be integrated with The Update Framework +(TUF) [2]_. 
It explains how modern package managers like pip can be made more +secure, and the types of attacks that can be prevented if PyPI is modified on +the server side to include TUF metadata. Package managers can reference the +TUF metadata available on PyPI to download distributions more securely. + +PEP 458 also describes the metadata layout of the PyPI repository and employs +the minimum security model, which supports continuous delivery of projects and +uses online cryptographic keys to sign the distributions uploaded by +developers. Although the minimum security model guards against most attacks on +software updaters [5]_ [7]_, such as mix-and-match and extraneous dependencies +attacks, it can be improved to support end-to-end signing and to prohibit +forged distributions in the event that PyPI is compromised. + +The main strength of PEP 458 and the minimum security model is the automated +and simplified release process: developers may upload distributions and then +have PyPI sign for their distributions. Much of the release process is handled +in an automated fashion by online roles and this approach requires storing +cryptographic signing keys on the PyPI infrastructure. Unfortunately, +cryptographic keys that are stored online are vulnerable to theft. The maximum +security model, proposed in this PEP, permits developers to sign for the +distributions that they make available to PyPI users, and does not put +end-users at risk of downloading malicious distributions if the online keys +stored on PyPI infrastructure are compromised. + + +Threat Model +============ + +The threat model assumes the following: + +* Offline keys are safe and securely stored. + +* Attackers can compromise at least one of PyPI's trusted keys that are stored + online, and may do so at once or over a period of time. + +* Attackers can respond to client requests. + +* Attackers may control any number of developer keys for projects a client does + not want to install. + +Attackers are considered successful if they can cause a client to install (or +leave installed) something other than the most up-to-date version of the +software the client is updating. When an attacker is preventing the +installation of updates, the attacker's goal is that clients not realize that +anything is wrong. + + +Definitions +=========== + +The keywords "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT", "SHOULD", +"SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this document are to be +interpreted as described in RFC `2119`__. + +__ http://www.ietf.org/rfc/rfc2119.txt + +This PEP focuses on integrating TUF with PyPI; however, the reader is +encouraged to read about TUF's design principles [2]_. It is also RECOMMENDED +that the reader be familiar with the TUF specification [3]_, and PEP 458 [1]_ +(which this PEP is extending). + +Terms used in this PEP are defined as follows: + +* Projects: Projects are software components that are made available for + integration. Projects include Python libraries, frameworks, scripts, + plugins, applications, collections of data or other resources, and various + combinations thereof. Public Python projects are typically registered on the + Python Package Index [4]_. + +* Releases: Releases are uniquely identified snapshots of a project [4]_. + +* Distributions: Distributions are the packaged files that are used to publish + and distribute a release. + +* Simple index: The HTML page that contains internal links to the + distributions of a project [4]_. + +* Roles: There is one *root* role in PyPI. 
There are multiple roles whose + responsibilities are delegated to them directly or indirectly by the *root* + role. The term "top-level role" refers to the *root* role and any role + delegated by the *root* role. Each role has a single metadata file that it is + trusted to provide. + +* Metadata: Metadata are files that describe roles, other metadata, and target + files. + +* Repository: A repository is a resource comprised of named metadata and target + files. Clients request metadata and target files stored on a repository. + +* Consistent snapshot: A set of TUF metadata and PyPI targets that capture the + complete state of all projects on PyPI as they existed at some fixed point in + time. + +* The *snapshot* (*release*) role: In order to prevent confusion due to the + different meanings of the term "release" used in PEP 426 [1]_ and the TUF + specification [3]_, the *release* role is renamed to the *snapshot* role. + +* Developer: Either the owner or maintainer of a project who is allowed to + update TUF metadata, as well as distribution metadata and files for a given + project. + +* Online key: A private cryptographic key that MUST be stored on the PyPI + server infrastructure. This usually allows automated signing with the key. + An attacker who compromises the PyPI infrastructure will be able to + immediately read these keys. + +* Offline key: A private cryptographic key that MUST be stored independent of + the PyPI server infrastructure. This prevents automated signing with the + key. An attacker who compromises the PyPI infrastructure will not be able to + immediately read these keys. + +* Threshold signature scheme: A role can increase its resilience to key + compromises by specifying that at least t out of n keys are REQUIRED to sign + its metadata. A compromise of t-1 keys is insufficient to compromise the + role itself. Saying that a role requires (t, n) keys denotes the threshold + signature property. + + +Maximum Security Model +====================== + +The maximum security model permits developers to sign their projects and to +upload signed metadata to PyPI. If the PyPI infrastructure were compromised, +attackers would be unable to serve malicious versions of a *claimed* project +without having access to that project's developer key. Figure 1 depicts the +changes made to the metadata layout of the minimum security model, namely that +developer roles are now supported and that three new delegated roles exist: +*claimed*, *recently-claimed*, and *unclaimed*. The *bins* role from the +minimum security model has been renamed *unclaimed* and can contain any +projects that have not been added to *claimed*. The *unclaimed* role functions +just as before (i.e., as explained in PEP 458, projects added to this role are +signed by PyPI with an online key). Offline keys provided by developers ensure +the strength of the maximum security model over the minimum model. Although +the minimum security model supports continuous delivery of projects, all +projects are signed by an online key. That is, an attacker is able to corrupt +packages in the minimum security model, but not in the maximum model, without +also compromising a developer's key. + +.. image:: figure1.png + +Figure 1: An overview of the metadata layout in the maximum security model. +The maximum security model supports continuous delivery and survivable key +compromise. + +Projects that are signed by developers and uploaded to PyPI for the first time +are added to the *recently-claimed* role. 
The *recently-claimed* role uses an +online key, so projects uploaded for the first time are immediately available +to clients. After some time has passed, PyPI administrators MAY periodically +move (e.g., every month) projects listed in *recently-claimed* to the *claimed* +role for maximum security. The *claimed* role uses an offline key, thus +projects added to this role cannot be easily forged if PyPI is compromised. + +The *recently-claimed* role is separate from the *unclaimed* role for usability +and efficiency, not security. If new project delegations were prepended to +*unclaimed* metadata, *unclaimed* would need to be re-downloaded every time a +project obtained a key. By separating out new projects, the amount of data +retrieved is reduced. From a usability standpoint, it also makes it easier for +administrators to see which projects are now claimed. This information is +needed when moving keys from *recently-claimed* to *claimed*, which is +discussed in more detail in the "Producing Consistent Snapshots" section. + + +End-to-End Signing +================== + +End-to-end signing allows both PyPI and developers to sign for the metadata +downloaded by clients. PyPI is trusted to make uploaded projects available to +clients (PyPI signs the metadata for this part of the process), and developers +sign the distributions that they upload to PyPI. + +In order to delegate trust to a project, developers are required to submit a +public key to PyPI. PyPI takes the project's public key and adds it to parent +metadata that PyPI then signs. After the initial trust is established, +developers are required to sign distributions that they upload to PyPI using +the public key's corresponding private key. The signed TUF metadata that +developers upload to PyPI includes information like the distribution's file +size and hash, which package managers use to verify distributions that are +downloaded. + +The practical implications of end-to-end signing is the extra administrative +work needed to delegate trust to a project, and the signed metadata that +developers MUST upload to PyPI along with the distribution. Specifically, PyPI +is expected to periodically sign metadata with an offline key by adding +projects to the *claimed* metadata file and signing it. In contrast, projects +are only ever signed with an online key in the minimum security model. +End-to-end signing does require manual intervention to delegate trust (i.e., to +sign metadata with an offline key), but this is a one-time cost and projects +have stronger protections against PyPI compromises thereafter. + + +Metadata Signatures, Key Management, and Signing Distributions +============================================================== + +This section discusses the tools, signature scheme, and signing methods that +PyPI MAY recommend to implementors of the signing tools. Developers are +expected to use these tools to sign and upload distributions to PyPI. To +summarize the RECOMMENDED tools and schemes discussed in the subsections below, +developers MAY generate cryptographic keys and sign metadata (with the Ed25519 +signature scheme) in some automated fashion, where the metadata includes the +information required to verify the authenticity of the distribution. +Developers then upload metadata to PyPI, where it will be available for +download by package managers such as pip (i.e., package managers that support +TUF metadata). 
The entire process is transparent to the end-users (using a +package manager that supports TUF) that download distributions from PyPI. + +The first three subsections (Cryptographic Signature Scheme, Cryptographic Key +Files, and Key Management) cover the cryptographic components of the developer +release process. That is, which key type PyPI supports, how keys may be +stored, and how keys may be generated. The two subsections that follow the +first three discuss the PyPI modules that SHOULD be modified to support TUF +metadata. For example, Twine and Distutils are two projects that SHOULD be +modified. Finally, the last subsection goes over the automated key management +and signing solution that is RECOMMENDED for the signing tools. + +TUF's design is flexible with respect to cryptographic key types, signatures, +and signing methods. The tools, modification, and methods discussed in the +following sections are RECOMMENDATIONS for the implementors of the signing +tools. + + +Cryptographic Signature Scheme: Ed25519 +--------------------------------------- + +The package manager (pip) shipped with CPython MUST work on non-CPython +interpreters and cannot have dependencies that have to be compiled (i.e., the +PyPI+TUF integration MUST NOT require compilation of C extensions in order to +verify cryptographic signatures). Verification of signatures MUST be done in +Python, and verifying RSA [11]_ signatures in pure-Python may be impractical due +to speed. Therefore, PyPI MAY use the `Ed25519`__ signature scheme. + +__ http://ed25519.cr.yp.to/ + +Ed25519 [12]_ is a public-key signature system that uses small cryptographic +signatures and keys. A `pure-Python implementation`__ of the Ed25519 signature +scheme is available. Verification of Ed25519 signatures is fast even when +performed in Python. + +__ https://github.com/pyca/ed25519 + + +Cryptographic Key Files +----------------------- + +The implementation MAY encrypt key files with AES-256-CTR-Mode and strengthen +passwords with PBKDF2-HMAC-SHA256 (100K iterations by default, but this may be +overridden by the developer). The current Python implementation of TUF can use +any cryptographic library (support for PyCA cryptography will be added in the +future), may override the default number of PBKDF2 iterations, and the KDF +tweaked to taste. + + +Key Management: miniLock +------------------------ + +An easy-to-use key management solution is needed. One solution is to derive a +private key from a password so that developers do not have to manage +cryptographic key files across multiple computers. `miniLock`__ is an example +of how this can be done. Developers may view the cryptographic key as a +secondary password. miniLock also works well with a signature scheme like +Ed25519, which only needs a very small key. + +__ https://github.com/kaepora/miniLock#-minilock + + +Third-party Upload Tools: Twine +------------------------------- + +Third-party tools like `Twine`__ MAY be modified (if they wish to support +distributions that include TUF metadata) to sign and upload developer projects +to PyPI. Twine is a utility for interacting with PyPI that uses TLS to upload +distributions, and prevents MITM attacks on usernames and passwords. + +__ https://github.com/pypa/twine + + +Distutils +--------- + +`Distutils`__ MAY be modified to sign metadata and to upload signed distributions +to PyPI. Distutils comes packaged with CPython and is the most widely-used +tool for uploading distributions to PyPI. 
+ +__ https://docs.python.org/2/distutils/index.html#distutils-index + + +Automated Signing Solution +-------------------------- + +An easy-to-use key management solution is RECOMMENDED for developers. One +approach is to generate a cryptographic private key from a user password, akin +to miniLock. Although developer signatures can remain optional, this approach +may be inadequate due to the great number of potentially unsigned dependencies +each distribution may have. If any one of these dependencies is unsigned, it +negates any benefit the project gains from signing its own distribution (i.e., +attackers would only need to compromise one of the unsigned dependencies to +attack end-users). Requiring developers to manually sign distributions and +manage keys is expected to render key signing an unused feature. + +A default, PyPI-mediated key management and package signing solution that is +`transparent`__ to developers and does not require a key escrow (sharing of +encrypted private keys with PyPI) is RECOMMENDED for the signing tools. +Additionally, the signing tools SHOULD circumvent the sharing of private keys +across multiple machines of each developer. + +__ https://en.wikipedia.org/wiki/Transparency_%28human%E2%80%93computer_interaction%29 + +The following outlines an automated signing solution that a new developer MAY +follow to upload a distribution to PyPI: + +1. Register a PyPI project. +2. Enter a secondary password (independent of the PyPI user account password). +3. Optional: Add a new identity to the developer's PyPI user account from a + second machine (after a password prompt). +4. Upload project. + +Step 1 is the normal procedure followed by developers to `register a PyPI +project`__. + +__ https://pypi.python.org/pypi?:action=register_form + +Step 2 generates an encrypted key file (private), uploads an Ed25519 public key +to PyPI, and signs the TUF metadata that is generated for the distribution. + +Optionally adding a new identity from a second machine, by simply entering a +password, in step 3 also generates an encrypted private key file and uploads an +Ed25519 public key to PyPI. Separate identities MAY be created to allow a +developer, or other project maintainers, to sign releases on multiple machines. +An existing verified identity (its public key is contained in project metadata +or has been uploaded to PyPI) signs for new identities. By default, project +metadata has a signature threshold of "1" and other verified identities may +create new releases to satisfy the threshold. + +Step 4 uploads the distribution file and TUF metadata to PyPI. The "Snapshot +Process" section discusses in detail the procedure followed by developers to +upload a distribution to PyPI. + +Generation of cryptographic files and signatures is transparent to the +developers in the default case: developers need not be aware that packages are +automatically signed. However, the signing tools should be flexible; a single +project key may also be shared between multiple machines if manual key +management is preferred (e.g., ssh-copy-id). + +The `repository`__ and `developer`__ TUF tools currently support all of the +recommendations previously mentioned, except for the automated signing +solution, which SHOULD be added to Distutils, Twine, and other third-party +signing tools. The automated signing solution calls available repository tool +functions to sign metadata and to generate the cryptographic key files. 
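As a rough sketch of what the password-derived signing step might do under
the hood, the key derivation and metadata signature could look like the
following. PyNaCl is used here only as a stand-in Ed25519 implementation, and
the salt handling, metadata shape, and upload step are illustrative
assumptions rather than choices made by this PEP::

    import hashlib
    import json

    from nacl.signing import SigningKey  # stand-in Ed25519 implementation

    def signing_key_from_password(password, salt, iterations=100000):
        # PBKDF2-HMAC-SHA256 stretches the secondary password into a
        # 32-byte seed suitable for an Ed25519 signing key.
        seed = hashlib.pbkdf2_hmac("sha256", password.encode("utf-8"),
                                   salt, iterations, dklen=32)
        return SigningKey(seed)

    def sign_metadata(key, metadata):
        # Canonicalize the targets metadata and sign it; the signature and
        # the public key would accompany the upload to PyPI.
        payload = json.dumps(metadata, sort_keys=True,
                             separators=(",", ":")).encode("utf-8")
        return key.sign(payload).signature.hex()

    key = signing_key_from_password("secondary password", b"per-project-salt")
    metadata = {"targets": {"example-1.0.tar.gz": {"length": 1024}}}
    print(sign_metadata(key, metadata))
    print(key.verify_key.encode().hex())  # public key registered with PyPI

Because the key is recomputable from the password and salt, no key file has
to be copied between machines, which is the miniLock-style property referred
to above; a second machine can instead register a separate identity as
described in step 3.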
+ +__ https://github.com/theupdateframework/tuf/blob/develop/tuf/README.md +__ https://github.com/theupdateframework/tuf/blob/develop/tuf/README-developer-tools.md + + +Snapshot Process +---------------- + +The snapshot process is fairly simple and SHOULD be automated. The snapshot +process MUST keep in memory the latest working set of *root*, *targets*, and +delegated roles. Every minute or so the snapshot process will sign for this +latest working set. (Recall that project transaction processes continuously +inform the snapshot process about the latest delegated metadata in a +concurrency-safe manner. The snapshot process will actually sign for a copy of +the latest working set while the latest working set in memory will be updated +with information that is continuously communicated by the project transaction +processes.) The snapshot process MUST generate and sign new *timestamp* +metadata that will vouch for the metadata (*root*, *targets*, and delegated +roles) generated in the previous step. Finally, the snapshot process MUST make +available to clients the new *timestamp* and *snapshot* metadata representing +the latest snapshot. + +A *claimed* or *recently-claimed* project will need to upload in its +transaction to PyPI not just targets (a simple index as well as distributions) +but also TUF metadata. The project MAY do so by uploading a ZIP file containing +two directories, /metadata/ (containing delegated targets metadata files) and +/targets/ (containing targets such as the project simple index and +distributions that are signed by the delegated targets metadata). + +Whenever the project uploads metadata or targets to PyPI, PyPI SHOULD check the +project TUF metadata for at least the following properties: + +* A threshold number of the developers keys registered with PyPI by that + project MUST have signed for the delegated targets metadata file that + represents the "root" of targets for that project (e.g. metadata/targets/ + project.txt). +* The signatures of delegated targets metadata files MUST be valid. +* The delegated targets metadata files MUST NOT have expired. +* The delegated targets metadata MUST be consistent with the targets. +* A delegator MUST NOT delegate targets that were not delegated to itself by + another delegator. +* A delegatee MUST NOT sign for targets that were not delegated to itself by a + delegator. + +If PyPI chooses to check the project TUF metadata, then PyPI MAY choose to +reject publishing any set of metadata or targets that do not meet these +requirements. + +PyPI MUST enforce access control by ensuring that each project can only write +to the TUF metadata for which it is responsible. It MUST do so by ensuring that +project transaction processes write to the correct metadata as well as correct +locations within those metadata. For example, a project transaction process for +an unclaimed project MUST write to the correct target paths in the correct +delegated unclaimed metadata for the targets of the project. + +On rare occasions, PyPI MAY wish to extend the TUF metadata format for projects +in a backward-incompatible manner. Note that PyPI will NOT be able to +automatically rewrite existing TUF metadata on behalf of projects in order to +upgrade the metadata to the new backward-incompatible format because this would +invalidate the signatures of the metadata as signed by developer keys. 
+Instead, package managers SHOULD be written to recognize and handle multiple +incompatible versions of TUF metadata so that claimed and recently-claimed +projects could be offered a reasonable time to migrate their metadata to newer +but backward-incompatible formats. + +If PyPI eventually runs out of disk space to produce a new consistent snapshot, +then PyPI MAY then use something like a "mark-and-sweep" algorithm to delete +sufficiently outdated consistent snapshots. That is, only outdated metadata +like *timestamp* and *snapshot* that are no longer used are deleted. +Specifically, in order to preserve the latest consistent snapshot, PyPI would +walk objects -- beginning from the root (*timestamp*) -- of the latest +consistent snapshot, mark all visited objects, and delete all unmarked objects. +The last few consistent snapshots may be preserved in a similar fashion. +Deleting a consistent snapshot will cause clients to see nothing except HTTP +404 responses to any request for a target of the deleted consistent snapshot. +Clients SHOULD then retry (as before) their requests with the latest consistent +snapshot. + +All package managers that support TUF metadata MUST be modified to download +every metadata and target file (except for *timestamp* metadata) by including, +in the request for the file, the cryptographic hash of the file in the +filename. Following the filename convention RECOMMENDED in the next +subsection, a request for the file at filename.ext will be transformed to the +equivalent request for the file at digest.filename. + +Finally, PyPI SHOULD use a `transaction log`__ to record project transaction +processes and queues so that it will be easier to recover from errors after a +server failure. + +__ https://en.wikipedia.org/wiki/Transaction_log + + +Producing Consistent Snapshots +------------------------------ + +PyPI is responsible for updating, depending on the project, either the +*claimed*, *recently-claimed*, or *unclaimed* metadata and associated delegated +metadata. Every project MUST upload its set of metadata and targets in a single +transaction. The uploaded set of files is called the "project transaction." +How PyPI MAY validate files in a project transaction is discussed in a later +section. The focus of this section is on how PyPI will respond to a project +transaction. + +Every metadata and target file MUST include in its filename the `hex digest`__ +of its `SHA-256`__ hash, which PyPI may prepend to filenames after the files +have been uploaded. For this PEP, it is RECOMMENDED that PyPI adopt a simple +convention of the form: *digest.filename*, where filename is the original +filename without a copy of the hash, and digest is the hex digest of the hash. + +__ http://docs.python.org/2/library/hashlib.html#hashlib.hash.hexdigest +__ https://en.wikipedia.org/wiki/SHA-2 + +When an unclaimed project uploads a new transaction, a project transaction +process MUST add all new targets and relevant delegated unclaimed metadata. +The project transaction process MUST inform the snapshot process about new +delegated unclaimed metadata. + +When a *recently-claimed* project uploads a new transaction, a project +transaction process MUST add all new targets and delegated targets metadata for +the project. If the project is new, then the project transaction process MUST +also add new *recently-claimed* metadata with the public keys (which MUST be +part of the transaction) for the project. 
*recently-claimed* projects have a +threshold value of "1" set by the transaction process. Finally, the project +transaction process MUST inform the snapshot process about new +*recently-claimed* metadata, as well as the current set of delegated targets +metadata for the project. + +The transaction process for a claimed project is slightly different in that +PyPI administrators periodically move (a manual process that MAY occur every +two weeks to a month) projects from the *recently-claimed* role to the +*claimed* role. (Moving a project from *recently-claimed* to *claimed* is a +manual process because PyPI administrators have to use an offline key to sign +the claimed project's distribution.) A project transaction process MUST then +add new *recently-claimed* and *claimed* metadata to reflect this migration. As +is the case for a *recently-claimed* project, the project transaction process +MUST always add all new targets and delegated targets metadata for the claimed +project. Finally, the project transaction process MUST inform the consistent +snapshot process about new *recently-claimed* or *claimed* metadata, as well as +the current set of delegated targets metadata for the project. + +Project transaction processes SHOULD be automated, except when PyPI +administrators move a project from the *recently-claimed* role to the *claimed* +role. Project transaction processes MUST also be applied atomically: either all +metadata and targets -- or none of them -- are added. The project transaction +processes and snapshot process SHOULD work concurrently. Finally, project +transaction processes SHOULD keep in memory the latest *claimed*, +*recently-claimed*, and *unclaimed* metadata so that they will be correctly +updated in new consistent snapshots. + +The queue MAY be processed concurrently in order of appearance, provided that +the following rules are observed: + +1. No pair of project transaction processes may concurrently work on the same + project. + +2. No pair of project transaction processes may concurrently work on + *unclaimed* projects that belong to the same delegated *unclaimed* role. + +3. No pair of project transaction processes may concurrently work on new + recently-claimed projects. + +4. No pair of project transaction processes may concurrently work on new + claimed projects. + +5. No project transaction process may work on a new claimed project while + another project transaction process is working on a new recently-claimed + project and vice versa. + +These rules MUST be observed to ensure that metadata is not read from or +written to inconsistently. + + +Auditing Snapshots +------------------ + +If a malicious party compromises PyPI, they can sign arbitrary files with any +of the online keys. The roles with offline keys (i.e., *root* and *targets*) +are still protected. To safely recover from a repository compromise, snapshots +should be audited to ensure that files are only restored to trusted versions. + +When a repository compromise has been detected, the integrity of three types of +information must be validated: + +1. If the online keys of the repository have been compromised, they can be + revoked by having the *targets* role sign new metadata, delegated to a new + key. + +2. If the role metadata on the repository has been changed, this will impact + the metadata that is signed by online keys. Any role information created + since the compromise should be discarded. As a result, developers of new + projects will need to re-register their projects. + +3. 
If the packages themselves may have been tampered with, they can be
+   validated using the stored hash information for packages that existed in
+   trusted metadata before the compromise. Also, new distributions that are
+   signed by developers in the *claimed* role may be safely retained. However,
+   any distributions signed by developers in the *recently-claimed* or
+   *unclaimed* roles should be discarded.
+
+In order to safely restore snapshots in the event of a compromise, PyPI SHOULD
+maintain a small number of its own mirrors to copy PyPI snapshots according to
+some schedule. The mirroring protocol can be used immediately for this
+purpose. The mirrors must be secured and isolated such that they are
+responsible only for mirroring PyPI. The mirrors can be checked against one
+another to detect accidental or malicious failures.
+
+Another approach is to periodically generate the cryptographic hash of
+*snapshot* and tweet it. For example, upon receiving the tweet, a user comes
+forward with the actual metadata and the repository maintainers are then able
+to verify the metadata's cryptographic hash. Alternatively, PyPI may
+periodically archive its own versions of *snapshot* rather than rely on
+externally provided metadata. In this case, PyPI SHOULD take the
+cryptographic hash of every package on the repository and store this data on
+an offline device. If any package hash has changed, this indicates an attack
+has occurred.
+
+Attacks that serve different versions of metadata or that freeze a version of a
+package at a specific version can be handled by TUF with techniques such as
+implicit key revocation and metadata mismatch detection [2]_.
+
+
+Key Compromise Analysis
+=======================
+
+This PEP has covered the maximum security model, the TUF roles that should be
+added to support continuous delivery of distributions, how to generate and sign
+the metadata of each role, and how to support distributions that have been
+signed by developers. The remaining sections discuss how PyPI SHOULD audit
+repository metadata, and the methods PyPI can use to detect and recover from a
+PyPI compromise.
+
+Table 1 summarizes a few of the attacks possible when a threshold number of
+private cryptographic keys (belonging to any of the PyPI roles) are
+compromised. The leftmost column lists the roles (or a combination of roles)
+that have been compromised, and the columns to the right show whether the
+compromised roles leave clients susceptible to malicious updates, freeze
+attacks, or metadata inconsistency attacks.
+ ++-------------------+-------------------+-----------------------+-----------------------+ +| Role Compromise | Malicious Updates | Freeze Attack | Metadata Inconsistency| +| | | | Attacks | ++===================+===================+=======================+=======================+ +| timetamp | NO | YES | NO | +| | snapshot and | limited by earliest | snapshot needs to | +| | targets or any | root, targets, or bin | cooperate | +| | of the delegated | metadata expiry time | | +| | roles need to | | | +| | cooperate | | | ++-------------------+-------------------+-----------------------+-----------------------+ +| snapshot | NO | NO | NO | +| | timestamp and | timestamp needs to | timestamp needs to | +| | targets or any of | coorperate | cooperate | +| | the delegated | | | +| | roles need to | | | +| | cooperate | | | ++-------------------+-------------------+-----------------------+-----------------------+ +| timestamp | NO | YES | YES | +| *AND* | targets or any | limited by earliest | limited by earliest | +| snapshot | of the delegated | root, targets, or bin | root, targets, or bin | +| | roles need to | metadata expiry time | metadata expiry time | +| | cooperate | | | +| | | | | ++-------------------+-------------------+-----------------------+-----------------------+ +| targets | NO | NOT APPLICABLE | NOT APPLICABLE | +| *OR* | timestamp and | need timestamp and | need timestamp | +| **claimed** | snapshot need to | snapshot | and snapshot | +| *OR* | cooperate | | | +| recently-claimed | | | | +| *OR* | | | | +| unclaimed | | | | +| *OR* | | | | +| **project** | | | | ++-------------------+-------------------+-----------------------+-----------------------+ +| (timestamp | YES | YES | YES | +| *AND* | | limited by earliest | limited by earliest | +| snapshot) | | root, targets, or bin | root, targets, or bin | +| *AND* | | metadata expiry time | metadata expiry time | +| **project** | | | | +| | | | | ++-------------------+-------------------+-----------------------+-----------------------+ +| (timestamp | YES | YES | YES | +| *AND* | but only of | limited by earliest | limited by earliest | +| snapshot) | projects not | root, targets, | root, targets, | +| *AND* | delegated by | claimed, | claimed, | +| (recently-claimed | claimed | recently-claimed, | recently-claimed, | +| *OR* | | project, or unclaimed | project, or unclaimed | +| unclaimed) | | metadata expiry time | metadata expiry time | ++-------------------+-------------------+-----------------------+-----------------------+ +| (timestamp | | YES | YES | +| *AND* | | limited by earliest | limited by earliest | +| snapshot) | | root, targets, | root, targets, | +| *AND* | YES | claimed, | claimed, | +| (targets *OR* | | recently-claimed, | recently-claimed, | +| **claimed**) | | project, or unclaimed | project, or unclaimed | +| | | metadata expiry time | metadata expiry time | ++-------------------+-------------------+-----------------------+-----------------------+ +| root | YES | YES | YES | ++-------------------+-------------------+-----------------------+-----------------------+ + +Table 1: Attacks that are possible by compromising certain combinations of role +keys. In `September 2013`__, it was shown how the latest version (at the time) +of pip was susceptible to these attacks and how TUF could protect users against +them [8]_. Roles signed by offline keys are in **bold**. 
+ +__ https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html + +Note that compromising *targets* or any delegated role (except for project +targets metadata) does not immediately allow an attacker to serve malicious +updates. The attacker must also compromise the *timestamp* and *snapshot* +roles (which are both online and therefore more likely to be compromised). +This means that in order to launch any attack, one must not only be able to act +as a man-in-the-middle, but also compromise the *timestamp* key (or compromise +the *root* keys and sign a new *timestamp* key). To launch any attack other +than a freeze attack, one must also compromise the *snapshot* key. Finally, a +compromise of the PyPI infrastructure MAY introduce malicious updates to +*recently-claimed* projects because the keys for these roles are online. + + +In the Event of a Key Compromise +-------------------------------- + +A key compromise means that a threshold of keys belonging to developers or the +roles on PyPI, as well as the PyPI infrastructure, have been compromised and +used to sign new metadata on PyPI. + +If a threshold number of developer keys of a project have been compromised, +the project MUST take the following steps: + +1. The project metadata and targets MUST be restored to the last known good + consistent snapshot where the project was not known to be compromised. This + can be done by developers repackaging and resigning all targets with + the new keys. + +2. The project's metadata MUST have its version numbers incremented, expiry + times suitably extended, and signatures renewed. + +Whereas PyPI MUST take the following steps: + +1. Revoke the compromised developer keys from the *recently-claimed* or + *claimed* role. This is done by replacing the compromised developer keys + with newly issued developer keys. + +2. A new timestamped consistent snapshot MUST be issued. + +If a threshold number of *timestamp*, *snapshot*, *recently-claimed*, or +*unclaimed* keys have been compromised, then PyPI MUST take the following +steps: + +1. Revoke the *timestamp*, *snapshot*, and *targets* role keys from the + root role. This is done by replacing the compromised *timestamp*, + *snapshot*, and *targets* keys with newly issued keys. + +2. Revoke the *recently-claimed* and *unclaimed* keys from the *targets* role + by replacing their keys with newly issued keys. Sign the new targets role + metadata and discard the new keys (because, as we explained earlier, this + increases the security of targets metadata). + +3. Clear all targets or delegations in the *recently-claimed* role and delete + all associated delegated targets metadata. Recently registered projects + SHOULD register their developer keys again with PyPI. + +4. All targets of the *recently-claimed* and *unclaimed* roles SHOULD be + compared with the last known good consistent snapshot where none of the + timestamp, snapshot, recently-claimed, or unclaimed keys were known to have + been compromised. Added, updated, or deleted targets in the compromised + consistent snapshot that do not match the last known good consistent + snapshot SHOULD be restored to their previous versions. After ensuring the + integrity of all unclaimed targets, the unclaimed metadata MUST be + regenerated. + +5. The *recently-claimed* and *unclaimed* metadata MUST have their version + numbers incremented, expiry times suitably extended, and signatures + renewed. + +6. A new timestamped consistent snapshot MUST be issued. 
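Step 4 above amounts to comparing two manifests. A minimal sketch of that
comparison, assuming each consistent snapshot has been reduced to a plain
mapping of target paths to SHA-256 digests (abbreviated here), might look
like this::

    def audit_against_last_known_good(good, suspect):
        # `good` maps target paths to hashes taken from the last known good
        # consistent snapshot; `suspect` is the same mapping taken from the
        # compromised snapshot.
        to_restore = [path for path, digest in sorted(suspect.items())
                      if good.get(path) != digest]  # added or modified targets
        missing = [path for path in sorted(good) if path not in suspect]
        return to_restore, missing

    good = {"packages/source/e/example/example-1.0.tar.gz": "2c26b4..."}
    suspect = dict(good)
    suspect["packages/source/e/example/example-1.1.tar.gz"] = "fcde2b..."
    print(audit_against_last_known_good(good, suspect))

Targets reported by such a comparison MAY be restored to their previous
versions, after which the affected role metadata is regenerated as described
above.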
+
+This would preemptively protect all of these roles even though
+only one of them may have been compromised.
+
+If a threshold number of the *targets* or *claimed* keys have been compromised,
+then there is little that an attacker would be able to do without the
+*timestamp* and *snapshot* keys. In this case, PyPI MUST simply revoke the
+compromised *targets* or *claimed* keys by replacing them with new keys in
+the *root* and *targets* roles, respectively.
+
+If a threshold number of the *timestamp*, *snapshot*, and *claimed* keys have
+been compromised, then PyPI MUST take the following steps in addition to the
+steps taken when either the *timestamp* or *snapshot* keys are compromised:
+
+1. Revoke the *claimed* role keys from the *targets* role and replace them with
+   newly issued keys.
+
+2. All project targets of the *claimed* roles SHOULD be compared with the last
+   known good consistent snapshot where none of the *timestamp*, *snapshot*,
+   or *claimed* keys were known to have been compromised. Added, updated, or
+   deleted targets in the compromised consistent snapshot that do not match
+   the last known good consistent snapshot MAY be restored to their previous
+   versions. After ensuring the integrity of all claimed project targets, the
+   *claimed* metadata MUST be regenerated.
+
+3. The *claimed* metadata MUST have their version numbers incremented, expiry
+   times suitably extended, and signatures renewed.
+
+Following these steps would preemptively protect all of these roles even though
+only one of them may have been compromised.
+
+If a threshold number of *root* keys have been compromised, then PyPI MUST take
+the steps taken when the *targets* role has been compromised. All of the
+*root* keys must also be replaced.
+
+It is also RECOMMENDED that PyPI sufficiently document compromises with
+security bulletins. These security bulletins will be most informative when
+users of pip-with-TUF are unable to install or update a project because the
+keys for the *timestamp*, *snapshot*, or *root* roles are no longer valid.
+Users could then visit the PyPI web site to consult security bulletins that
+would help to explain why they are no longer able to install or update, and
+then take action accordingly. When a threshold number of *root* keys have not
+been revoked due to a compromise, then new *root* metadata may be safely
+updated because a threshold number of existing *root* keys will be used to sign
+for the integrity of the new *root* metadata. TUF clients will be able to
+verify the integrity of the new *root* metadata with a threshold number of
+previously known *root* keys. This will be the common case. In the worst
+case, where a threshold number of *root* keys have been revoked due to a
+compromise, an end-user may choose to update new *root* metadata with
+`out-of-band`__ mechanisms.
+
+__ https://en.wikipedia.org/wiki/Out-of-band#Authentication
+
+
+Appendix A: PyPI Build Farm and End-to-End Signing
+==================================================
+
+PyPI administrators intend to support a central build farm. The PyPI build
+farm will auto-generate a `Wheel`__, for each distribution that is uploaded by
+developers, on PyPI infrastructure and on supported platforms. Package
+managers will likely install projects by downloading these PyPI Wheels (which
+can be installed much faster than source distributions) rather than the source
+distributions signed by developers.
The implications of having a central build +farm with end-to-end signing SHOULD be investigated before the maximum security +model is implemented. + +__ http://wheel.readthedocs.org/en/latest/ + +An issue with a central build farm and end-to-end signing is that developers +are unlikely to sign Wheel distributions once they have been generated on PyPI +infrastructure. However, generating wheels from source distributions that are +signed by developers can still be beneficial, provided that building Wheels is +a deterministic process. If deterministic builds are infeasible, developers +may delegate trust of these wheels to a PyPI role that signs for wheels with +an online key. + + +References +========== + +.. [1] https://www.python.org/dev/peps/pep-0458/ +.. [2] https://isis.poly.edu/~jcappos/papers/samuel_tuf_ccs_2010.pdf +.. [3] https://github.com/theupdateframework/tuf/blob/develop/docs/tuf-spec.txt +.. [4] http://www.python.org/dev/peps/pep-0426/ +.. [5] https://github.com/theupdateframework/pip/wiki/Attacks-on-software-repositories +.. [6] https://mail.python.org/pipermail/distutils-sig/2013-September/022773.html +.. [7] https://isis.poly.edu/~jcappos/papers/cappos_mirror_ccs_08.pdf +.. [8] https://mail.python.org/pipermail/distutils-sig/2013-September/022755.html +.. [9] https://pypi.python.org/security +.. [10] https://mail.python.org/pipermail/distutils-sig/2013-August/022154.html +.. [11] https://en.wikipedia.org/wiki/RSA_%28algorithm%29 +.. [12] http://ed25519.cr.yp.to/ + + +Acknowledgements +================ + +This material is based upon work supported by the National Science Foundation +under Grants No. CNS-1345049 and CNS-0959138. Any opinions, findings, and +conclusions or recommendations expressed in this material are those of the +author(s) and do not necessarily reflect the views of the National Science +Foundation. + +We thank Nick Coghlan, Daniel Holth and the distutils-sig community in general +for helping us to think about how to usably and efficiently integrate TUF with +PyPI. + +Roger Dingledine, Sebastian Hahn, Nick Mathewson, Martin Peck and Justin +Samuel helped us to design TUF from its predecessor Thandy of the Tor project. + +We appreciate the efforts of Konstantin Andrianov, Geremy Condra, Zane Fisher, +Justin Samuel, Tian Tian, Santiago Torres, John Ward, and Yuyu Zheng to develop +TUF. + + +Copyright +========= + +This document has been placed in the public domain. 
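The recovery text above notes that, after PyPI replaces compromised keys, TUF
clients verify the new *root* metadata with a threshold number of previously
known *root* keys, and only the loss of that many *root* keys forces an
out-of-band update. The sketch below (Python; not part of the PEP text or of
the commit above) illustrates just that threshold check; the metadata layout
and the verify_signature callable are illustrative assumptions rather than the
TUF reference API:

    def root_update_is_trusted(new_root, trusted_root, verify_signature):
        """Accept new root metadata only if a threshold of the keys listed
        by the currently trusted root metadata has signed it."""
        role = trusted_root["roles"]["root"]       # role info we already trust
        allowed_keyids = set(role["keyids"])       # previously known root keys
        threshold = role["threshold"]              # e.g. 2 of a 3-key root role

        valid_keyids = set()
        for signature in new_root["signatures"]:
            keyid = signature["keyid"]
            if keyid not in allowed_keyids:
                continue                           # ignore keys we never trusted
            key = trusted_root["keys"][keyid]
            if verify_signature(key, new_root["signed"], signature["sig"]):
                valid_keyids.add(keyid)            # each key counts at most once

        return len(valid_keyids) >= threshold

An attacker holding fewer than a threshold of the previously trusted *root*
keys cannot make this check pass, which is why only the worst case described
above (a threshold of *root* keys revoked after a compromise) requires updating
*root* metadata out of band.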
-- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Thu Nov 20 10:33:44 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Thu, 20 Nov 2014 10:33:44 +0100 Subject: [Python-checkins] Daily reference leaks (23ab1197df0b): sum=3 Message-ID: results for 23ab1197df0b on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogUYAATt', '-x'] From python-checkins at python.org Thu Nov 20 11:12:19 2014 From: python-checkins at python.org (ned.deily) Date: Thu, 20 Nov 2014 10:12:19 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgMjI4Nzg6?= =?utf-8?q?_PEP_477_-_=22make_install=22_and_=22make_altinstall=22_integra?= =?utf-8?q?tion?= Message-ID: <20141120101212.43934.96838@psf.io> https://hg.python.org/cpython/rev/07f4b6ecd04a changeset: 93514:07f4b6ecd04a branch: 2.7 parent: 93506:6e26b5291c41 user: Ned Deily date: Thu Nov 20 02:11:03 2014 -0800 summary: Issue 22878: PEP 477 - "make install" and "make altinstall" integration The backport of ensurepip to 2.7.9 allows pip to optionally be installed or upgraded using the bundled pip provided by the new ensurepip module. The option can be specified persistently using the configure option: ./configure --with-ensurepip[=upgrade|install|no] It can also be overridden on either the "install" or "altinstall" targets: make [alt]install ENSUREPIP=[upgrade|install|no] For Python 2, the default option is "no" (do not install pip). files: Doc/using/unix.rst | 2 ++ Doc/whatsnew/2.7.rst | 5 +++++ Mac/Makefile.in | 29 +++++++++++++++++++++++++++-- Makefile.pre.in | 32 +++++++++++++++++++++++++++----- Misc/NEWS | 7 +++++++ configure | 30 ++++++++++++++++++++++++++++++ configure.ac | 15 +++++++++++++++ 7 files changed, 113 insertions(+), 7 deletions(-) diff --git a/Doc/using/unix.rst b/Doc/using/unix.rst --- a/Doc/using/unix.rst +++ b/Doc/using/unix.rst @@ -59,6 +59,8 @@ of Python are available and can be installed with e.g. ``pkgutil -i python27``. +.. _building-python-on-unix: + Building Python =============== diff --git a/Doc/whatsnew/2.7.rst b/Doc/whatsnew/2.7.rst --- a/Doc/whatsnew/2.7.rst +++ b/Doc/whatsnew/2.7.rst @@ -2605,6 +2605,11 @@ all platforms (where X.Y stands for the version of the Python installation), along with the ``pip`` Python package and its dependencies. +For CPython :ref:`source builds on POSIX systems `, +the ``make install`` and ``make altinstall`` commands do not bootstrap ``pip`` +by default. This behaviour can be controlled through configure options, and +overridden through Makefile options. + On Windows and Mac OS X, the CPython installers now default to installing ``pip`` along with CPython itself (users may opt out of installing it during the installation process). Window users will need to opt in to the diff --git a/Mac/Makefile.in b/Mac/Makefile.in --- a/Mac/Makefile.in +++ b/Mac/Makefile.in @@ -3,9 +3,11 @@ # commandline in that case. VERSION=@VERSION@ +ENSUREPIP=@ENSUREPIP@ builddir = .. 
srcdir=@srcdir@ prefix=@prefix@ +exec_prefix=@exec_prefix@ LIBDEST=$(prefix)/lib/python$(VERSION) RUNSHARED=@RUNSHARED@ BUILDEXE=@BUILDEXEEXT@ @@ -21,7 +23,7 @@ export MACOSX_DEPLOYMENT_TARGET # These are normally glimpsed from the previous set -bindir=$(prefix)/bin +BINDIR= @bindir@ PYTHONAPPSDIR=@FRAMEWORKINSTALLAPPSPREFIX@/$(PYTHONFRAMEWORK) $(VERSION) APPINSTALLDIR=$(prefix)/Resources/Python.app @@ -92,6 +94,18 @@ ln -fs "$(prefix)/bin/$${fn}" "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin/$${fn}" ;\ done endif + -if test "x$(ENSUREPIP)" != "xno" ; then \ + cd "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin" && \ + for fn in \ + easy_install \ + pip \ + pip2 \ + ; \ + do \ + rm -f $${fn} ;\ + $(LN) -s $(BINDIR)/$${fn} $${fn} ;\ + done ;\ + fi # @@ -112,7 +126,18 @@ ln -fs "$(prefix)/bin/$${fn}" "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin/$${fn}" ;\ done endif - ln -fs "$(prefix)/bin/2to3-$(VERSION)" "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin/2to3-$(VERSION)" ;\ + ln -fs "$(prefix)/bin/2to3-$(VERSION)" "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin/2to3-$(VERSION)" + -if test "x$(ENSUREPIP)" != "xno" ; then \ + cd "$(DESTDIR)$(FRAMEWORKUNIXTOOLSPREFIX)/bin" && \ + for fn in \ + easy_install-$(VERSION) \ + pip$(VERSION) \ + ; \ + do \ + rm -f $${fn} ;\ + $(LN) -s $(BINDIR)/$${fn} $${fn} ;\ + done ;\ + fi # By default most tools are installed without a version in their basename, to # make it easier to install (and use) several python versions side-by-side move diff --git a/Makefile.pre.in b/Makefile.pre.in --- a/Makefile.pre.in +++ b/Makefile.pre.in @@ -144,6 +144,9 @@ # Environment to run shared python without installed libraries RUNSHARED= @RUNSHARED@ +# ensurepip options +ENSUREPIP= @ENSUREPIP@ + # Modes for directories, executables and data files created by the # install process. Default to user-only-writable for all file types. 
DIRMODE= 755 @@ -829,12 +832,31 @@ $(TESTPYTHON) $(TESTPROG) $(MEMTESTOPTS) # Install everything -install: @FRAMEWORKINSTALLFIRST@ altinstall bininstall maninstall @FRAMEWORKINSTALLLAST@ +install: @FRAMEWORKINSTALLFIRST@ commoninstall bininstall maninstall @FRAMEWORKINSTALLLAST@ + if test "x$(ENSUREPIP)" != "xno" ; then \ + case $(ENSUREPIP) in \ + upgrade) ensurepip="--upgrade" ;; \ + install|*) ensurepip="" ;; \ + esac; \ + $(RUNSHARED) $(PYTHON_FOR_BUILD) -m ensurepip \ + $$ensurepip --root=$(DESTDIR)/ ; \ + fi # Install almost everything without disturbing previous versions -altinstall: @FRAMEWORKALTINSTALLFIRST@ altbininstall libinstall inclinstall \ - libainstall altmaninstall \ - sharedinstall oldsharedinstall @FRAMEWORKALTINSTALLLAST@ +altinstall: commoninstall + if test "x$(ENSUREPIP)" != "xno" ; then \ + case $(ENSUREPIP) in \ + upgrade) ensurepip="--altinstall --upgrade --no-default-pip" ;; \ + install|*) ensurepip="--altinstall --no-default-pip" ;; \ + esac; \ + $(RUNSHARED) $(PYTHON_FOR_BUILD) -m ensurepip \ + $$ensurepip --root=$(DESTDIR)/ ; \ + fi + +commoninstall: @FRAMEWORKALTINSTALLFIRST@ \ + altbininstall libinstall inclinstall libainstall \ + sharedinstall oldsharedinstall altmaninstall \ + @FRAMEWORKALTINSTALLLAST@ # Install shared libraries enabled by Setup DESTDIRS= $(exec_prefix) $(LIBDIR) $(BINLIBDEST) $(DESTSHARED) @@ -1371,7 +1393,7 @@ .PHONY: frameworkinstall frameworkinstallframework frameworkinstallstructure .PHONY: frameworkinstallmaclib frameworkinstallapps frameworkinstallunixtools .PHONY: frameworkaltinstallunixtools recheck autoconf clean clobber distclean -.PHONY: smelly funny patchcheck touch altmaninstall +.PHONY: smelly funny patchcheck touch altmaninstall commoninstall .PHONY: gdbhooks # IF YOU PUT ANYTHING HERE IT WILL GO AWAY diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -326,6 +326,13 @@ - Issue #22877: PEP 477 - OS X installer now installs pip. +- Issue #22878: PEP 477 - "make install" and "make altinstall" can now install + or upgrade pip, using the bundled pip provided by the backported ensurepip + module. A configure option, --with-ensurepip[=upgrade|install|no], is + available to set the option for subsequent installs; the default for Python 2 + in "no" (do not install or upgrade pip). The option can also be set with + "make [alt]install ENSUREPIP=[upgrade|install|no]". + Windows ------- diff --git a/configure b/configure --- a/configure +++ b/configure @@ -624,6 +624,7 @@ #endif" ac_subst_vars='LTLIBOBJS +ENSUREPIP SRCDIRS THREADHEADERS UNICODE_OBJS @@ -807,6 +808,7 @@ with_libc enable_big_digits enable_unicode +with_ensurepip ' ac_precious_vars='build_alias host_alias @@ -1486,6 +1488,9 @@ --with-fpectl enable SIGFPE catching --with-libm=STRING math library --with-libc=STRING C library + --with(out)-ensurepip=[=OPTION] + "install" or "upgrade" using bundled pip, default is + "no" Some influential environment variables: CC C compiler command @@ -14604,6 +14609,31 @@ { $as_echo "$as_me:${as_lineno-$LINENO}: result: done" >&5 $as_echo "done" >&6; } +# ensurepip option +{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for ensurepip" >&5 +$as_echo_n "checking for ensurepip... " >&6; } + +# Check whether --with-ensurepip was given. +if test "${with_ensurepip+set}" = set; then : + withval=$with_ensurepip; +else + with_ensurepip=no +fi + +case $with_ensurepip in #( + yes|upgrade) : + ENSUREPIP=upgrade ;; #( + install) : + ENSUREPIP=install ;; #( + no) : + ENSUREPIP=no ;; #( + *) : + as_fn_error $? 
"--with-ensurepip=upgrade|install|no" "$LINENO" 5 ;; +esac +{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $ENSUREPIP" >&5 +$as_echo "$ENSUREPIP" >&6; } + + # generate output files ac_config_files="$ac_config_files Makefile.pre Modules/Setup.config Misc/python.pc" diff --git a/configure.ac b/configure.ac --- a/configure.ac +++ b/configure.ac @@ -4552,6 +4552,21 @@ done AC_MSG_RESULT(done) +# ensurepip option +AC_MSG_CHECKING(for ensurepip) +AC_ARG_WITH(ensurepip, + [AS_HELP_STRING([--with(out)-ensurepip=@<:@=OPTION@:>@], + ["install" or "upgrade" using bundled pip, default is "no"])], + [], + [with_ensurepip=no]) +AS_CASE($with_ensurepip, + [yes|upgrade],[ENSUREPIP=upgrade], + [install],[ENSUREPIP=install], + [no],[ENSUREPIP=no], + [AC_MSG_ERROR([--with-ensurepip=upgrade|install|no])]) +AC_MSG_RESULT($ENSUREPIP) +AC_SUBST(ENSUREPIP) + # generate output files AC_CONFIG_FILES(Makefile.pre Modules/Setup.config Misc/python.pc) AC_CONFIG_FILES([Modules/ld_so_aix], [chmod +x Modules/ld_so_aix]) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 12:40:30 2014 From: python-checkins at python.org (nick.coghlan) Date: Thu, 20 Nov 2014 11:40:30 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322869=3A_Split_py?= =?utf-8?q?thonrun_into_two_modules?= Message-ID: <20141120114020.7140.72477@psf.io> https://hg.python.org/cpython/rev/b9775a92c1d0 changeset: 93515:b9775a92c1d0 parent: 93513:23ab1197df0b user: Nick Coghlan date: Thu Nov 20 21:39:37 2014 +1000 summary: Issue #22869: Split pythonrun into two modules - interpreter startup and shutdown code moved to a new pylifecycle.c module - Py_OptimizeFlag moved into the new module with the other global flags files: Include/Python.h | 1 + Include/object.h | 7 + Include/pydebug.h | 2 + Include/pyerrors.h | 1 + Include/pylifecycle.h | 124 ++ Include/pythonrun.h | 110 -- Lib/_pyio.py | 2 +- Makefile.pre.in | 2 + Misc/NEWS | 3 + Modules/atexitmodule.c | 2 +- Modules/signalmodule.c | 2 +- Objects/object.c | 16 + Python/compile.c | 2 - Python/pylifecycle.c | 1540 ++++++++++++++++++++++++++++ Python/pythonrun.c | 1472 +-------------------------- Python/sysmodule.c | 2 +- 16 files changed, 1701 insertions(+), 1587 deletions(-) diff --git a/Include/Python.h b/Include/Python.h --- a/Include/Python.h +++ b/Include/Python.h @@ -112,6 +112,7 @@ #include "pyarena.h" #include "modsupport.h" #include "pythonrun.h" +#include "pylifecycle.h" #include "ceval.h" #include "sysmodule.h" #include "intrcheck.h" diff --git a/Include/object.h b/Include/object.h --- a/Include/object.h +++ b/Include/object.h @@ -65,6 +65,7 @@ #error Py_LIMITED_API is incompatible with Py_DEBUG, Py_TRACE_REFS, and Py_REF_DEBUG #endif + #ifdef Py_TRACE_REFS /* Define pointers to support a doubly-linked list of all live heap objects. 
*/ #define _PyObject_HEAD_EXTRA \ @@ -710,11 +711,17 @@ _Py_NegativeRefcount(__FILE__, __LINE__, \ (PyObject *)(OP)); \ } +/* Py_REF_DEBUG also controls the display of refcounts and memory block + * allocations at the interactive prompt and at interpreter shutdown + */ +PyAPI_FUNC(void) _PyDebug_PrintTotalRefs(void); +#define _PY_DEBUG_PRINT_TOTAL_REFS() _PyDebug_PrintTotalRefs() #else #define _Py_INC_REFTOTAL #define _Py_DEC_REFTOTAL #define _Py_REF_DEBUG_COMMA #define _Py_CHECK_REFCNT(OP) /* a semicolon */; +#define _PY_DEBUG_PRINT_TOTAL_REFS() #endif /* Py_REF_DEBUG */ #ifdef COUNT_ALLOCS diff --git a/Include/pydebug.h b/Include/pydebug.h --- a/Include/pydebug.h +++ b/Include/pydebug.h @@ -5,6 +5,8 @@ extern "C" { #endif +/* These global variable are defined in pylifecycle.c */ +/* XXX (ncoghlan): move these declarations to pylifecycle.h? */ PyAPI_DATA(int) Py_DebugFlag; PyAPI_DATA(int) Py_VerboseFlag; PyAPI_DATA(int) Py_QuietFlag; diff --git a/Include/pyerrors.h b/Include/pyerrors.h --- a/Include/pyerrors.h +++ b/Include/pyerrors.h @@ -99,6 +99,7 @@ #define _Py_NO_RETURN #endif +/* Defined in Python/pylifecycle.c */ PyAPI_FUNC(void) Py_FatalError(const char *message) _Py_NO_RETURN; #if defined(Py_DEBUG) || defined(Py_LIMITED_API) diff --git a/Include/pylifecycle.h b/Include/pylifecycle.h new file mode 100644 --- /dev/null +++ b/Include/pylifecycle.h @@ -0,0 +1,124 @@ + +/* Interfaces to configure, query, create & destroy the Python runtime */ + +#ifndef Py_PYLIFECYCLE_H +#define Py_PYLIFECYCLE_H +#ifdef __cplusplus +extern "C" { +#endif + +PyAPI_FUNC(void) Py_SetProgramName(wchar_t *); +PyAPI_FUNC(wchar_t *) Py_GetProgramName(void); + +PyAPI_FUNC(void) Py_SetPythonHome(wchar_t *); +PyAPI_FUNC(wchar_t *) Py_GetPythonHome(void); + +#ifndef Py_LIMITED_API +/* Only used by applications that embed the interpreter and need to + * override the standard encoding determination mechanism + */ +PyAPI_FUNC(int) Py_SetStandardStreamEncoding(const char *encoding, + const char *errors); +#endif + +PyAPI_FUNC(void) Py_Initialize(void); +PyAPI_FUNC(void) Py_InitializeEx(int); +#ifndef Py_LIMITED_API +PyAPI_FUNC(void) _Py_InitializeEx_Private(int, int); +#endif +PyAPI_FUNC(void) Py_Finalize(void); +PyAPI_FUNC(int) Py_IsInitialized(void); +PyAPI_FUNC(PyThreadState *) Py_NewInterpreter(void); +PyAPI_FUNC(void) Py_EndInterpreter(PyThreadState *); + + +/* Py_PyAtExit is for the atexit module, Py_AtExit is for low-level + * exit functions. + */ +#ifndef Py_LIMITED_API +PyAPI_FUNC(void) _Py_PyAtExit(void (*func)(void)); +#endif +PyAPI_FUNC(int) Py_AtExit(void (*func)(void)); + +PyAPI_FUNC(void) Py_Exit(int); + +/* Restore signals that the interpreter has called SIG_IGN on to SIG_DFL. 
*/ +#ifndef Py_LIMITED_API +PyAPI_FUNC(void) _Py_RestoreSignals(void); + +PyAPI_FUNC(int) Py_FdIsInteractive(FILE *, const char *); +#endif + +/* Bootstrap __main__ (defined in Modules/main.c) */ +PyAPI_FUNC(int) Py_Main(int argc, wchar_t **argv); + +/* In getpath.c */ +PyAPI_FUNC(wchar_t *) Py_GetProgramFullPath(void); +PyAPI_FUNC(wchar_t *) Py_GetPrefix(void); +PyAPI_FUNC(wchar_t *) Py_GetExecPrefix(void); +PyAPI_FUNC(wchar_t *) Py_GetPath(void); +PyAPI_FUNC(void) Py_SetPath(const wchar_t *); +#ifdef MS_WINDOWS +int _Py_CheckPython3(); +#endif + +/* In their own files */ +PyAPI_FUNC(const char *) Py_GetVersion(void); +PyAPI_FUNC(const char *) Py_GetPlatform(void); +PyAPI_FUNC(const char *) Py_GetCopyright(void); +PyAPI_FUNC(const char *) Py_GetCompiler(void); +PyAPI_FUNC(const char *) Py_GetBuildInfo(void); +#ifndef Py_LIMITED_API +PyAPI_FUNC(const char *) _Py_hgidentifier(void); +PyAPI_FUNC(const char *) _Py_hgversion(void); +#endif + +/* Internal -- various one-time initializations */ +#ifndef Py_LIMITED_API +PyAPI_FUNC(PyObject *) _PyBuiltin_Init(void); +PyAPI_FUNC(PyObject *) _PySys_Init(void); +PyAPI_FUNC(void) _PyImport_Init(void); +PyAPI_FUNC(void) _PyExc_Init(PyObject * bltinmod); +PyAPI_FUNC(void) _PyImportHooks_Init(void); +PyAPI_FUNC(int) _PyFrame_Init(void); +PyAPI_FUNC(int) _PyFloat_Init(void); +PyAPI_FUNC(int) PyByteArray_Init(void); +PyAPI_FUNC(void) _PyRandom_Init(void); +#endif + +/* Various internal finalizers */ +#ifndef Py_LIMITED_API +PyAPI_FUNC(void) _PyExc_Fini(void); +PyAPI_FUNC(void) _PyImport_Fini(void); +PyAPI_FUNC(void) PyMethod_Fini(void); +PyAPI_FUNC(void) PyFrame_Fini(void); +PyAPI_FUNC(void) PyCFunction_Fini(void); +PyAPI_FUNC(void) PyDict_Fini(void); +PyAPI_FUNC(void) PyTuple_Fini(void); +PyAPI_FUNC(void) PyList_Fini(void); +PyAPI_FUNC(void) PySet_Fini(void); +PyAPI_FUNC(void) PyBytes_Fini(void); +PyAPI_FUNC(void) PyByteArray_Fini(void); +PyAPI_FUNC(void) PyFloat_Fini(void); +PyAPI_FUNC(void) PyOS_FiniInterrupts(void); +PyAPI_FUNC(void) _PyGC_DumpShutdownStats(void); +PyAPI_FUNC(void) _PyGC_Fini(void); +PyAPI_FUNC(void) PySlice_Fini(void); +PyAPI_FUNC(void) _PyType_Fini(void); +PyAPI_FUNC(void) _PyRandom_Fini(void); + +PyAPI_DATA(PyThreadState *) _Py_Finalizing; +#endif + +/* Signals */ +typedef void (*PyOS_sighandler_t)(int); +PyAPI_FUNC(PyOS_sighandler_t) PyOS_getsig(int); +PyAPI_FUNC(PyOS_sighandler_t) PyOS_setsig(int, PyOS_sighandler_t); + +/* Random */ +PyAPI_FUNC(int) _PyOS_URandom (void *buffer, Py_ssize_t size); + +#ifdef __cplusplus +} +#endif +#endif /* !Py_PYLIFECYCLE_H */ diff --git a/Include/pythonrun.h b/Include/pythonrun.h --- a/Include/pythonrun.h +++ b/Include/pythonrun.h @@ -22,30 +22,6 @@ } PyCompilerFlags; #endif -PyAPI_FUNC(void) Py_SetProgramName(wchar_t *); -PyAPI_FUNC(wchar_t *) Py_GetProgramName(void); - -PyAPI_FUNC(void) Py_SetPythonHome(wchar_t *); -PyAPI_FUNC(wchar_t *) Py_GetPythonHome(void); - -#ifndef Py_LIMITED_API -/* Only used by applications that embed the interpreter and need to - * override the standard encoding determination mechanism - */ -PyAPI_FUNC(int) Py_SetStandardStreamEncoding(const char *encoding, - const char *errors); -#endif - -PyAPI_FUNC(void) Py_Initialize(void); -PyAPI_FUNC(void) Py_InitializeEx(int); -#ifndef Py_LIMITED_API -PyAPI_FUNC(void) _Py_InitializeEx_Private(int, int); -#endif -PyAPI_FUNC(void) Py_Finalize(void); -PyAPI_FUNC(int) Py_IsInitialized(void); -PyAPI_FUNC(PyThreadState *) Py_NewInterpreter(void); -PyAPI_FUNC(void) Py_EndInterpreter(PyThreadState *); - #ifndef Py_LIMITED_API 
PyAPI_FUNC(int) PyRun_SimpleStringFlags(const char *, PyCompilerFlags *); PyAPI_FUNC(int) PyRun_AnyFileFlags(FILE *, const char *, PyCompilerFlags *); @@ -166,26 +142,6 @@ PyAPI_FUNC(void) PyErr_PrintEx(int); PyAPI_FUNC(void) PyErr_Display(PyObject *, PyObject *, PyObject *); -/* Py_PyAtExit is for the atexit module, Py_AtExit is for low-level - * exit functions. - */ -#ifndef Py_LIMITED_API -PyAPI_FUNC(void) _Py_PyAtExit(void (*func)(void)); -#endif -PyAPI_FUNC(int) Py_AtExit(void (*func)(void)); - -PyAPI_FUNC(void) Py_Exit(int); - -/* Restore signals that the interpreter has called SIG_IGN on to SIG_DFL. */ -#ifndef Py_LIMITED_API -PyAPI_FUNC(void) _Py_RestoreSignals(void); - -PyAPI_FUNC(int) Py_FdIsInteractive(FILE *, const char *); -#endif - -/* Bootstrap */ -PyAPI_FUNC(int) Py_Main(int argc, wchar_t **argv); - #ifndef Py_LIMITED_API /* Use macros for a bunch of old variants */ #define PyRun_String(str, s, g, l) PyRun_StringFlags(str, s, g, l, NULL) @@ -207,64 +163,6 @@ PyRun_FileExFlags(fp, p, s, g, l, 0, flags) #endif -/* In getpath.c */ -PyAPI_FUNC(wchar_t *) Py_GetProgramFullPath(void); -PyAPI_FUNC(wchar_t *) Py_GetPrefix(void); -PyAPI_FUNC(wchar_t *) Py_GetExecPrefix(void); -PyAPI_FUNC(wchar_t *) Py_GetPath(void); -PyAPI_FUNC(void) Py_SetPath(const wchar_t *); -#ifdef MS_WINDOWS -int _Py_CheckPython3(); -#endif - -/* In their own files */ -PyAPI_FUNC(const char *) Py_GetVersion(void); -PyAPI_FUNC(const char *) Py_GetPlatform(void); -PyAPI_FUNC(const char *) Py_GetCopyright(void); -PyAPI_FUNC(const char *) Py_GetCompiler(void); -PyAPI_FUNC(const char *) Py_GetBuildInfo(void); -#ifndef Py_LIMITED_API -PyAPI_FUNC(const char *) _Py_hgidentifier(void); -PyAPI_FUNC(const char *) _Py_hgversion(void); -#endif - -/* Internal -- various one-time initializations */ -#ifndef Py_LIMITED_API -PyAPI_FUNC(PyObject *) _PyBuiltin_Init(void); -PyAPI_FUNC(PyObject *) _PySys_Init(void); -PyAPI_FUNC(void) _PyImport_Init(void); -PyAPI_FUNC(void) _PyExc_Init(PyObject * bltinmod); -PyAPI_FUNC(void) _PyImportHooks_Init(void); -PyAPI_FUNC(int) _PyFrame_Init(void); -PyAPI_FUNC(int) _PyFloat_Init(void); -PyAPI_FUNC(int) PyByteArray_Init(void); -PyAPI_FUNC(void) _PyRandom_Init(void); -#endif - -/* Various internal finalizers */ -#ifndef Py_LIMITED_API -PyAPI_FUNC(void) _PyExc_Fini(void); -PyAPI_FUNC(void) _PyImport_Fini(void); -PyAPI_FUNC(void) PyMethod_Fini(void); -PyAPI_FUNC(void) PyFrame_Fini(void); -PyAPI_FUNC(void) PyCFunction_Fini(void); -PyAPI_FUNC(void) PyDict_Fini(void); -PyAPI_FUNC(void) PyTuple_Fini(void); -PyAPI_FUNC(void) PyList_Fini(void); -PyAPI_FUNC(void) PySet_Fini(void); -PyAPI_FUNC(void) PyBytes_Fini(void); -PyAPI_FUNC(void) PyByteArray_Fini(void); -PyAPI_FUNC(void) PyFloat_Fini(void); -PyAPI_FUNC(void) PyOS_FiniInterrupts(void); -PyAPI_FUNC(void) _PyGC_DumpShutdownStats(void); -PyAPI_FUNC(void) _PyGC_Fini(void); -PyAPI_FUNC(void) PySlice_Fini(void); -PyAPI_FUNC(void) _PyType_Fini(void); -PyAPI_FUNC(void) _PyRandom_Fini(void); - -PyAPI_DATA(PyThreadState *) _Py_Finalizing; -#endif - /* Stuff with no proper home (yet) */ #ifndef Py_LIMITED_API PyAPI_FUNC(char *) PyOS_Readline(FILE *, FILE *, const char *); @@ -290,14 +188,6 @@ PyAPI_FUNC(int) PyOS_CheckStack(void); #endif -/* Signals */ -typedef void (*PyOS_sighandler_t)(int); -PyAPI_FUNC(PyOS_sighandler_t) PyOS_getsig(int); -PyAPI_FUNC(PyOS_sighandler_t) PyOS_setsig(int, PyOS_sighandler_t); - -/* Random */ -PyAPI_FUNC(int) _PyOS_URandom (void *buffer, Py_ssize_t size); - #ifdef __cplusplus } #endif diff --git a/Lib/_pyio.py b/Lib/_pyio.py 
--- a/Lib/_pyio.py +++ b/Lib/_pyio.py @@ -257,7 +257,7 @@ Trick so that open won't become a bound method when stored as a class variable (as dbm.dumb does). - See initstdio() in Python/pythonrun.c. + See initstdio() in Python/pylifecycle.c. """ __doc__ = DocDescriptor() diff --git a/Makefile.pre.in b/Makefile.pre.in --- a/Makefile.pre.in +++ b/Makefile.pre.in @@ -389,6 +389,7 @@ Python/pyctype.o \ Python/pyfpe.o \ Python/pyhash.o \ + Python/pylifecycle.o \ Python/pymath.o \ Python/pystate.o \ Python/pythonrun.o \ @@ -909,6 +910,7 @@ $(srcdir)/Include/pyerrors.h \ $(srcdir)/Include/pyfpe.h \ $(srcdir)/Include/pyhash.h \ + $(srcdir)/Include/pylifecycle.h \ $(srcdir)/Include/pymath.h \ $(srcdir)/Include/pygetopt.h \ $(srcdir)/Include/pymacro.h \ diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,6 +10,9 @@ Core and Builtins ----------------- +- Issue #22869: Move the interpreter startup & shutdown code to a new + dedicated pylifecycle.c module + - Issue #22847: Improve method cache efficiency. - Issue #22335: Fix crash when trying to enlarge a bytearray to 0x7fffffff diff --git a/Modules/atexitmodule.c b/Modules/atexitmodule.c --- a/Modules/atexitmodule.c +++ b/Modules/atexitmodule.c @@ -60,7 +60,7 @@ modstate->ncallbacks = 0; } -/* Installed into pythonrun.c's atexit mechanism */ +/* Installed into pylifecycle.c's atexit mechanism */ static void atexit_callfuncs(void) diff --git a/Modules/signalmodule.c b/Modules/signalmodule.c --- a/Modules/signalmodule.c +++ b/Modules/signalmodule.c @@ -304,7 +304,7 @@ if (sig_num != SIGCHLD) #endif /* If the handler was not set up with sigaction, reinstall it. See - * Python/pythonrun.c for the implementation of PyOS_setsig which + * Python/pylifecycle.c for the implementation of PyOS_setsig which * makes this true. See also issue8354. */ PyOS_setsig(sig_num, signal_handler); #endif diff --git a/Objects/object.c b/Objects/object.c --- a/Objects/object.c +++ b/Objects/object.c @@ -33,6 +33,22 @@ total -= o->ob_refcnt; return total; } + +void +_PyDebug_PrintTotalRefs(void) { + PyObject *xoptions, *value; + _Py_IDENTIFIER(showrefcount); + + xoptions = PySys_GetXOptions(); + if (xoptions == NULL) + return; + value = _PyDict_GetItemId(xoptions, &PyId_showrefcount); + if (value == Py_True) + fprintf(stderr, + "[%" PY_FORMAT_SIZE_T "d refs, " + "%" PY_FORMAT_SIZE_T "d blocks]\n", + _Py_GetRefTotal(), _Py_GetAllocatedBlocks()); +} #endif /* Py_REF_DEBUG */ /* Object allocation routines used by NEWOBJ and NEWVAROBJ macros. 
diff --git a/Python/compile.c b/Python/compile.c --- a/Python/compile.c +++ b/Python/compile.c @@ -30,8 +30,6 @@ #include "symtable.h" #include "opcode.h" -int Py_OptimizeFlag = 0; - #define DEFAULT_BLOCK_SIZE 16 #define DEFAULT_BLOCKS 8 #define DEFAULT_CODE_SIZE 128 diff --git a/Python/pylifecycle.c b/Python/pylifecycle.c new file mode 100644 --- /dev/null +++ b/Python/pylifecycle.c @@ -0,0 +1,1540 @@ + +/* Python interpreter top-level routines, including init/exit */ + +#include "Python.h" + +#include "Python-ast.h" +#undef Yield /* undefine macro conflicting with winbase.h */ +#include "grammar.h" +#include "node.h" +#include "token.h" +#include "parsetok.h" +#include "errcode.h" +#include "code.h" +#include "symtable.h" +#include "ast.h" +#include "marshal.h" +#include "osdefs.h" +#include + +#ifdef HAVE_SIGNAL_H +#include +#endif + +#ifdef MS_WINDOWS +#include "malloc.h" /* for alloca */ +#endif + +#ifdef HAVE_LANGINFO_H +#include +#endif + +#ifdef MS_WINDOWS +#undef BYTE +#include "windows.h" +#endif + +_Py_IDENTIFIER(flush); +_Py_IDENTIFIER(name); +_Py_IDENTIFIER(stdin); +_Py_IDENTIFIER(stdout); +_Py_IDENTIFIER(stderr); + +#ifdef __cplusplus +extern "C" { +#endif + +extern wchar_t *Py_GetPath(void); + +extern grammar _PyParser_Grammar; /* From graminit.c */ + +/* Forward */ +static void initmain(PyInterpreterState *interp); +static int initfsencoding(PyInterpreterState *interp); +static void initsite(void); +static int initstdio(void); +static void initsigs(void); +static void call_py_exitfuncs(void); +static void wait_for_thread_shutdown(void); +static void call_ll_exitfuncs(void); +extern int _PyUnicode_Init(void); +extern int _PyStructSequence_Init(void); +extern void _PyUnicode_Fini(void); +extern int _PyLong_Init(void); +extern void PyLong_Fini(void); +extern int _PyFaulthandler_Init(void); +extern void _PyFaulthandler_Fini(void); +extern void _PyHash_Fini(void); +extern int _PyTraceMalloc_Init(void); +extern int _PyTraceMalloc_Fini(void); + +#ifdef WITH_THREAD +extern void _PyGILState_Init(PyInterpreterState *, PyThreadState *); +extern void _PyGILState_Fini(void); +#endif /* WITH_THREAD */ + +/* Global configuration variable declarations are in pydebug.h */ +/* XXX (ncoghlan): move those declarations to pylifecycle.h? */ +int Py_DebugFlag; /* Needed by parser.c */ +int Py_VerboseFlag; /* Needed by import.c */ +int Py_QuietFlag; /* Needed by sysmodule.c */ +int Py_InteractiveFlag; /* Needed by Py_FdIsInteractive() below */ +int Py_InspectFlag; /* Needed to determine whether to exit at SystemExit */ +int Py_OptimizeFlag = 0; /* Needed by compile.c */ +int Py_NoSiteFlag; /* Suppress 'import site' */ +int Py_BytesWarningFlag; /* Warn on str(bytes) and str(buffer) */ +int Py_UseClassExceptionsFlag = 1; /* Needed by bltinmodule.c: deprecated */ +int Py_FrozenFlag; /* Needed by getpath.c */ +int Py_IgnoreEnvironmentFlag; /* e.g. 
PYTHONPATH, PYTHONHOME */ +int Py_DontWriteBytecodeFlag; /* Suppress writing bytecode files (*.py[co]) */ +int Py_NoUserSiteDirectory = 0; /* for -s and site.py */ +int Py_UnbufferedStdioFlag = 0; /* Unbuffered binary std{in,out,err} */ +int Py_HashRandomizationFlag = 0; /* for -R and PYTHONHASHSEED */ +int Py_IsolatedFlag = 0; /* for -I, isolate from user's env */ + +PyThreadState *_Py_Finalizing = NULL; + +/* Hack to force loading of object files */ +int (*_PyOS_mystrnicmp_hack)(const char *, const char *, Py_ssize_t) = \ + PyOS_mystrnicmp; /* Python/pystrcmp.o */ + +/* PyModule_GetWarningsModule is no longer necessary as of 2.6 +since _warnings is builtin. This API should not be used. */ +PyObject * +PyModule_GetWarningsModule(void) +{ + return PyImport_ImportModule("warnings"); +} + +static int initialized = 0; + +/* API to access the initialized flag -- useful for esoteric use */ + +int +Py_IsInitialized(void) +{ + return initialized; +} + +/* Helper to allow an embedding application to override the normal + * mechanism that attempts to figure out an appropriate IO encoding + */ + +static char *_Py_StandardStreamEncoding = NULL; +static char *_Py_StandardStreamErrors = NULL; + +int +Py_SetStandardStreamEncoding(const char *encoding, const char *errors) +{ + if (Py_IsInitialized()) { + /* This is too late to have any effect */ + return -1; + } + /* Can't call PyErr_NoMemory() on errors, as Python hasn't been + * initialised yet. + * + * However, the raw memory allocators are initialised appropriately + * as C static variables, so _PyMem_RawStrdup is OK even though + * Py_Initialize hasn't been called yet. + */ + if (encoding) { + _Py_StandardStreamEncoding = _PyMem_RawStrdup(encoding); + if (!_Py_StandardStreamEncoding) { + return -2; + } + } + if (errors) { + _Py_StandardStreamErrors = _PyMem_RawStrdup(errors); + if (!_Py_StandardStreamErrors) { + if (_Py_StandardStreamEncoding) { + PyMem_RawFree(_Py_StandardStreamEncoding); + } + return -3; + } + } + return 0; +} + +/* Global initializations. Can be undone by Py_Finalize(). Don't + call this twice without an intervening Py_Finalize() call. When + initializations fail, a fatal error is issued and the function does + not return. On return, the first thread and interpreter state have + been created. + + Locking: you must hold the interpreter lock while calling this. + (If the lock has not yet been initialized, that's equivalent to + having the lock, but you cannot use multiple threads.) 
+ +*/ + +static int +add_flag(int flag, const char *envs) +{ + int env = atoi(envs); + if (flag < env) + flag = env; + if (flag < 1) + flag = 1; + return flag; +} + +static char* +get_codec_name(const char *encoding) +{ + char *name_utf8, *name_str; + PyObject *codec, *name = NULL; + + codec = _PyCodec_Lookup(encoding); + if (!codec) + goto error; + + name = _PyObject_GetAttrId(codec, &PyId_name); + Py_CLEAR(codec); + if (!name) + goto error; + + name_utf8 = _PyUnicode_AsString(name); + if (name_utf8 == NULL) + goto error; + name_str = _PyMem_RawStrdup(name_utf8); + Py_DECREF(name); + if (name_str == NULL) { + PyErr_NoMemory(); + return NULL; + } + return name_str; + +error: + Py_XDECREF(codec); + Py_XDECREF(name); + return NULL; +} + +static char* +get_locale_encoding(void) +{ +#ifdef MS_WINDOWS + char codepage[100]; + PyOS_snprintf(codepage, sizeof(codepage), "cp%d", GetACP()); + return get_codec_name(codepage); +#elif defined(HAVE_LANGINFO_H) && defined(CODESET) + char* codeset = nl_langinfo(CODESET); + if (!codeset || codeset[0] == '\0') { + PyErr_SetString(PyExc_ValueError, "CODESET is not set or empty"); + return NULL; + } + return get_codec_name(codeset); +#else + PyErr_SetNone(PyExc_NotImplementedError); + return NULL; +#endif +} + +static void +import_init(PyInterpreterState *interp, PyObject *sysmod) +{ + PyObject *importlib; + PyObject *impmod; + PyObject *sys_modules; + PyObject *value; + + /* Import _importlib through its frozen version, _frozen_importlib. */ + if (PyImport_ImportFrozenModule("_frozen_importlib") <= 0) { + Py_FatalError("Py_Initialize: can't import _frozen_importlib"); + } + else if (Py_VerboseFlag) { + PySys_FormatStderr("import _frozen_importlib # frozen\n"); + } + importlib = PyImport_AddModule("_frozen_importlib"); + if (importlib == NULL) { + Py_FatalError("Py_Initialize: couldn't get _frozen_importlib from " + "sys.modules"); + } + interp->importlib = importlib; + Py_INCREF(interp->importlib); + + /* Install _importlib as __import__ */ + impmod = PyInit_imp(); + if (impmod == NULL) { + Py_FatalError("Py_Initialize: can't import imp"); + } + else if (Py_VerboseFlag) { + PySys_FormatStderr("import imp # builtin\n"); + } + sys_modules = PyImport_GetModuleDict(); + if (Py_VerboseFlag) { + PySys_FormatStderr("import sys # builtin\n"); + } + if (PyDict_SetItemString(sys_modules, "_imp", impmod) < 0) { + Py_FatalError("Py_Initialize: can't save _imp to sys.modules"); + } + + value = PyObject_CallMethod(importlib, "_install", "OO", sysmod, impmod); + if (value == NULL) { + PyErr_Print(); + Py_FatalError("Py_Initialize: importlib install failed"); + } + Py_DECREF(value); + Py_DECREF(impmod); + + _PyImportZip_Init(); +} + + +void +_Py_InitializeEx_Private(int install_sigs, int install_importlib) +{ + PyInterpreterState *interp; + PyThreadState *tstate; + PyObject *bimod, *sysmod, *pstderr; + char *p; + extern void _Py_ReadyTypes(void); + + if (initialized) + return; + initialized = 1; + _Py_Finalizing = NULL; + +#if defined(HAVE_LANGINFO_H) && defined(HAVE_SETLOCALE) + /* Set up the LC_CTYPE locale, so we can obtain + the locale's charset without having to switch + locales. 
*/ + setlocale(LC_CTYPE, ""); +#endif + + if ((p = Py_GETENV("PYTHONDEBUG")) && *p != '\0') + Py_DebugFlag = add_flag(Py_DebugFlag, p); + if ((p = Py_GETENV("PYTHONVERBOSE")) && *p != '\0') + Py_VerboseFlag = add_flag(Py_VerboseFlag, p); + if ((p = Py_GETENV("PYTHONOPTIMIZE")) && *p != '\0') + Py_OptimizeFlag = add_flag(Py_OptimizeFlag, p); + if ((p = Py_GETENV("PYTHONDONTWRITEBYTECODE")) && *p != '\0') + Py_DontWriteBytecodeFlag = add_flag(Py_DontWriteBytecodeFlag, p); + /* The variable is only tested for existence here; _PyRandom_Init will + check its value further. */ + if ((p = Py_GETENV("PYTHONHASHSEED")) && *p != '\0') + Py_HashRandomizationFlag = add_flag(Py_HashRandomizationFlag, p); + + _PyRandom_Init(); + + interp = PyInterpreterState_New(); + if (interp == NULL) + Py_FatalError("Py_Initialize: can't make first interpreter"); + + tstate = PyThreadState_New(interp); + if (tstate == NULL) + Py_FatalError("Py_Initialize: can't make first thread"); + (void) PyThreadState_Swap(tstate); + +#ifdef WITH_THREAD + /* We can't call _PyEval_FiniThreads() in Py_Finalize because + destroying the GIL might fail when it is being referenced from + another running thread (see issue #9901). + Instead we destroy the previously created GIL here, which ensures + that we can call Py_Initialize / Py_Finalize multiple times. */ + _PyEval_FiniThreads(); + + /* Auto-thread-state API */ + _PyGILState_Init(interp, tstate); +#endif /* WITH_THREAD */ + + _Py_ReadyTypes(); + + if (!_PyFrame_Init()) + Py_FatalError("Py_Initialize: can't init frames"); + + if (!_PyLong_Init()) + Py_FatalError("Py_Initialize: can't init longs"); + + if (!PyByteArray_Init()) + Py_FatalError("Py_Initialize: can't init bytearray"); + + if (!_PyFloat_Init()) + Py_FatalError("Py_Initialize: can't init float"); + + interp->modules = PyDict_New(); + if (interp->modules == NULL) + Py_FatalError("Py_Initialize: can't make modules dictionary"); + + /* Init Unicode implementation; relies on the codec registry */ + if (_PyUnicode_Init() < 0) + Py_FatalError("Py_Initialize: can't initialize unicode"); + if (_PyStructSequence_Init() < 0) + Py_FatalError("Py_Initialize: can't initialize structseq"); + + bimod = _PyBuiltin_Init(); + if (bimod == NULL) + Py_FatalError("Py_Initialize: can't initialize builtins modules"); + _PyImport_FixupBuiltin(bimod, "builtins"); + interp->builtins = PyModule_GetDict(bimod); + if (interp->builtins == NULL) + Py_FatalError("Py_Initialize: can't initialize builtins dict"); + Py_INCREF(interp->builtins); + + /* initialize builtin exceptions */ + _PyExc_Init(bimod); + + sysmod = _PySys_Init(); + if (sysmod == NULL) + Py_FatalError("Py_Initialize: can't initialize sys"); + interp->sysdict = PyModule_GetDict(sysmod); + if (interp->sysdict == NULL) + Py_FatalError("Py_Initialize: can't initialize sys dict"); + Py_INCREF(interp->sysdict); + _PyImport_FixupBuiltin(sysmod, "sys"); + PySys_SetPath(Py_GetPath()); + PyDict_SetItemString(interp->sysdict, "modules", + interp->modules); + + /* Set up a preliminary stderr printer until we have enough + infrastructure for the io module in place. */ + pstderr = PyFile_NewStdPrinter(fileno(stderr)); + if (pstderr == NULL) + Py_FatalError("Py_Initialize: can't set preliminary stderr"); + _PySys_SetObjectId(&PyId_stderr, pstderr); + PySys_SetObject("__stderr__", pstderr); + Py_DECREF(pstderr); + + _PyImport_Init(); + + _PyImportHooks_Init(); + + /* Initialize _warnings. 
*/ + _PyWarnings_Init(); + + if (!install_importlib) + return; + + import_init(interp, sysmod); + + /* initialize the faulthandler module */ + if (_PyFaulthandler_Init()) + Py_FatalError("Py_Initialize: can't initialize faulthandler"); + + if (_PyTime_Init() < 0) + Py_FatalError("Py_Initialize: can't initialize time"); + + if (initfsencoding(interp) < 0) + Py_FatalError("Py_Initialize: unable to load the file system codec"); + + if (install_sigs) + initsigs(); /* Signal handling stuff, including initintr() */ + + if (_PyTraceMalloc_Init() < 0) + Py_FatalError("Py_Initialize: can't initialize tracemalloc"); + + initmain(interp); /* Module __main__ */ + if (initstdio() < 0) + Py_FatalError( + "Py_Initialize: can't initialize sys standard streams"); + + /* Initialize warnings. */ + if (PySys_HasWarnOptions()) { + PyObject *warnings_module = PyImport_ImportModule("warnings"); + if (warnings_module == NULL) { + fprintf(stderr, "'import warnings' failed; traceback:\n"); + PyErr_Print(); + } + Py_XDECREF(warnings_module); + } + + if (!Py_NoSiteFlag) + initsite(); /* Module site */ +} + +void +Py_InitializeEx(int install_sigs) +{ + _Py_InitializeEx_Private(install_sigs, 1); +} + +void +Py_Initialize(void) +{ + Py_InitializeEx(1); +} + + +#ifdef COUNT_ALLOCS +extern void dump_counts(FILE*); +#endif + +/* Flush stdout and stderr */ + +static int +file_is_closed(PyObject *fobj) +{ + int r; + PyObject *tmp = PyObject_GetAttrString(fobj, "closed"); + if (tmp == NULL) { + PyErr_Clear(); + return 0; + } + r = PyObject_IsTrue(tmp); + Py_DECREF(tmp); + if (r < 0) + PyErr_Clear(); + return r > 0; +} + +static void +flush_std_files(void) +{ + PyObject *fout = _PySys_GetObjectId(&PyId_stdout); + PyObject *ferr = _PySys_GetObjectId(&PyId_stderr); + PyObject *tmp; + + if (fout != NULL && fout != Py_None && !file_is_closed(fout)) { + tmp = _PyObject_CallMethodId(fout, &PyId_flush, ""); + if (tmp == NULL) + PyErr_WriteUnraisable(fout); + else + Py_DECREF(tmp); + } + + if (ferr != NULL && ferr != Py_None && !file_is_closed(ferr)) { + tmp = _PyObject_CallMethodId(ferr, &PyId_flush, ""); + if (tmp == NULL) + PyErr_Clear(); + else + Py_DECREF(tmp); + } +} + +/* Undo the effect of Py_Initialize(). + + Beware: if multiple interpreter and/or thread states exist, these + are not wiped out; only the current thread and interpreter state + are deleted. But since everything else is deleted, those other + interpreter and thread states should no longer be used. + + (XXX We should do better, e.g. wipe out all interpreters and + threads.) + + Locking: as above. + +*/ + +void +Py_Finalize(void) +{ + PyInterpreterState *interp; + PyThreadState *tstate; + + if (!initialized) + return; + + wait_for_thread_shutdown(); + + /* The interpreter is still entirely intact at this point, and the + * exit funcs may be relying on that. In particular, if some thread + * or exit func is still waiting to do an import, the import machinery + * expects Py_IsInitialized() to return true. So don't say the + * interpreter is uninitialized until after the exit funcs have run. + * Note that Threading.py uses an exit func to do a join on all the + * threads created thru it, so this also protects pending imports in + * the threads created via Threading. + */ + call_py_exitfuncs(); + + /* Get current thread state and interpreter pointer */ + tstate = PyThreadState_GET(); + interp = tstate->interp; + + /* Remaining threads (e.g. daemon threads) will automatically exit + after taking the GIL (in PyEval_RestoreThread()). 
*/ + _Py_Finalizing = tstate; + initialized = 0; + + /* Flush stdout+stderr */ + flush_std_files(); + + /* Disable signal handling */ + PyOS_FiniInterrupts(); + + /* Collect garbage. This may call finalizers; it's nice to call these + * before all modules are destroyed. + * XXX If a __del__ or weakref callback is triggered here, and tries to + * XXX import a module, bad things can happen, because Python no + * XXX longer believes it's initialized. + * XXX Fatal Python error: Interpreter not initialized (version mismatch?) + * XXX is easy to provoke that way. I've also seen, e.g., + * XXX Exception exceptions.ImportError: 'No module named sha' + * XXX in ignored + * XXX but I'm unclear on exactly how that one happens. In any case, + * XXX I haven't seen a real-life report of either of these. + */ + PyGC_Collect(); +#ifdef COUNT_ALLOCS + /* With COUNT_ALLOCS, it helps to run GC multiple times: + each collection might release some types from the type + list, so they become garbage. */ + while (PyGC_Collect() > 0) + /* nothing */; +#endif + /* Destroy all modules */ + PyImport_Cleanup(); + + /* Flush stdout+stderr (again, in case more was printed) */ + flush_std_files(); + + /* Collect final garbage. This disposes of cycles created by + * class definitions, for example. + * XXX This is disabled because it caused too many problems. If + * XXX a __del__ or weakref callback triggers here, Python code has + * XXX a hard time running, because even the sys module has been + * XXX cleared out (sys.stdout is gone, sys.excepthook is gone, etc). + * XXX One symptom is a sequence of information-free messages + * XXX coming from threads (if a __del__ or callback is invoked, + * XXX other threads can execute too, and any exception they encounter + * XXX triggers a comedy of errors as subsystem after subsystem + * XXX fails to find what it *expects* to find in sys to help report + * XXX the exception and consequent unexpected failures). I've also + * XXX seen segfaults then, after adding print statements to the + * XXX Python code getting called. + */ +#if 0 + PyGC_Collect(); +#endif + + /* Disable tracemalloc after all Python objects have been destroyed, + so it is possible to use tracemalloc in objects destructor. */ + _PyTraceMalloc_Fini(); + + /* Destroy the database used by _PyImport_{Fixup,Find}Extension */ + _PyImport_Fini(); + + /* Cleanup typeobject.c's internal caches. */ + _PyType_Fini(); + + /* unload faulthandler module */ + _PyFaulthandler_Fini(); + + /* Debugging stuff */ +#ifdef COUNT_ALLOCS + dump_counts(stdout); +#endif + /* dump hash stats */ + _PyHash_Fini(); + + _PY_DEBUG_PRINT_TOTAL_REFS(); + +#ifdef Py_TRACE_REFS + /* Display all objects still alive -- this can invoke arbitrary + * __repr__ overrides, so requires a mostly-intact interpreter. + * Alas, a lot of stuff may still be alive now that will be cleaned + * up later. + */ + if (Py_GETENV("PYTHONDUMPREFS")) + _Py_PrintReferences(stderr); +#endif /* Py_TRACE_REFS */ + + /* Clear interpreter state and all thread states. */ + PyInterpreterState_Clear(interp); + + /* Now we decref the exception classes. After this point nothing + can raise an exception. That's okay, because each Fini() method + below has been checked to make sure no exceptions are ever + raised. 
+ */ + + _PyExc_Fini(); + + /* Sundry finalizers */ + PyMethod_Fini(); + PyFrame_Fini(); + PyCFunction_Fini(); + PyTuple_Fini(); + PyList_Fini(); + PySet_Fini(); + PyBytes_Fini(); + PyByteArray_Fini(); + PyLong_Fini(); + PyFloat_Fini(); + PyDict_Fini(); + PySlice_Fini(); + _PyGC_Fini(); + _PyRandom_Fini(); + + /* Cleanup Unicode implementation */ + _PyUnicode_Fini(); + + /* reset file system default encoding */ + if (!Py_HasFileSystemDefaultEncoding && Py_FileSystemDefaultEncoding) { + PyMem_RawFree((char*)Py_FileSystemDefaultEncoding); + Py_FileSystemDefaultEncoding = NULL; + } + + /* XXX Still allocated: + - various static ad-hoc pointers to interned strings + - int and float free list blocks + - whatever various modules and libraries allocate + */ + + PyGrammar_RemoveAccelerators(&_PyParser_Grammar); + + /* Cleanup auto-thread-state */ +#ifdef WITH_THREAD + _PyGILState_Fini(); +#endif /* WITH_THREAD */ + + /* Delete current thread. After this, many C API calls become crashy. */ + PyThreadState_Swap(NULL); + PyInterpreterState_Delete(interp); + +#ifdef Py_TRACE_REFS + /* Display addresses (& refcnts) of all objects still alive. + * An address can be used to find the repr of the object, printed + * above by _Py_PrintReferences. + */ + if (Py_GETENV("PYTHONDUMPREFS")) + _Py_PrintReferenceAddresses(stderr); +#endif /* Py_TRACE_REFS */ +#ifdef PYMALLOC_DEBUG + if (Py_GETENV("PYTHONMALLOCSTATS")) + _PyObject_DebugMallocStats(stderr); +#endif + + call_ll_exitfuncs(); +} + +/* Create and initialize a new interpreter and thread, and return the + new thread. This requires that Py_Initialize() has been called + first. + + Unsuccessful initialization yields a NULL pointer. Note that *no* + exception information is available even in this case -- the + exception information is held in the thread, and there is no + thread. + + Locking: as above. + +*/ + +PyThreadState * +Py_NewInterpreter(void) +{ + PyInterpreterState *interp; + PyThreadState *tstate, *save_tstate; + PyObject *bimod, *sysmod; + + if (!initialized) + Py_FatalError("Py_NewInterpreter: call Py_Initialize first"); + + interp = PyInterpreterState_New(); + if (interp == NULL) + return NULL; + + tstate = PyThreadState_New(interp); + if (tstate == NULL) { + PyInterpreterState_Delete(interp); + return NULL; + } + + save_tstate = PyThreadState_Swap(tstate); + + /* XXX The following is lax in error checking */ + + interp->modules = PyDict_New(); + + bimod = _PyImport_FindBuiltin("builtins"); + if (bimod != NULL) { + interp->builtins = PyModule_GetDict(bimod); + if (interp->builtins == NULL) + goto handle_error; + Py_INCREF(interp->builtins); + } + + /* initialize builtin exceptions */ + _PyExc_Init(bimod); + + sysmod = _PyImport_FindBuiltin("sys"); + if (bimod != NULL && sysmod != NULL) { + PyObject *pstderr; + + interp->sysdict = PyModule_GetDict(sysmod); + if (interp->sysdict == NULL) + goto handle_error; + Py_INCREF(interp->sysdict); + PySys_SetPath(Py_GetPath()); + PyDict_SetItemString(interp->sysdict, "modules", + interp->modules); + /* Set up a preliminary stderr printer until we have enough + infrastructure for the io module in place. 
*/ + pstderr = PyFile_NewStdPrinter(fileno(stderr)); + if (pstderr == NULL) + Py_FatalError("Py_Initialize: can't set preliminary stderr"); + _PySys_SetObjectId(&PyId_stderr, pstderr); + PySys_SetObject("__stderr__", pstderr); + Py_DECREF(pstderr); + + _PyImportHooks_Init(); + + import_init(interp, sysmod); + + if (initfsencoding(interp) < 0) + goto handle_error; + + if (initstdio() < 0) + Py_FatalError( + "Py_Initialize: can't initialize sys standard streams"); + initmain(interp); + if (!Py_NoSiteFlag) + initsite(); + } + + if (!PyErr_Occurred()) + return tstate; + +handle_error: + /* Oops, it didn't work. Undo it all. */ + + PyErr_PrintEx(0); + PyThreadState_Clear(tstate); + PyThreadState_Swap(save_tstate); + PyThreadState_Delete(tstate); + PyInterpreterState_Delete(interp); + + return NULL; +} + +/* Delete an interpreter and its last thread. This requires that the + given thread state is current, that the thread has no remaining + frames, and that it is its interpreter's only remaining thread. + It is a fatal error to violate these constraints. + + (Py_Finalize() doesn't have these constraints -- it zaps + everything, regardless.) + + Locking: as above. + +*/ + +void +Py_EndInterpreter(PyThreadState *tstate) +{ + PyInterpreterState *interp = tstate->interp; + + if (tstate != PyThreadState_GET()) + Py_FatalError("Py_EndInterpreter: thread is not current"); + if (tstate->frame != NULL) + Py_FatalError("Py_EndInterpreter: thread still has a frame"); + + wait_for_thread_shutdown(); + + if (tstate != interp->tstate_head || tstate->next != NULL) + Py_FatalError("Py_EndInterpreter: not the last thread"); + + PyImport_Cleanup(); + PyInterpreterState_Clear(interp); + PyThreadState_Swap(NULL); + PyInterpreterState_Delete(interp); +} + +#ifdef MS_WINDOWS +static wchar_t *progname = L"python"; +#else +static wchar_t *progname = L"python3"; +#endif + +void +Py_SetProgramName(wchar_t *pn) +{ + if (pn && *pn) + progname = pn; +} + +wchar_t * +Py_GetProgramName(void) +{ + return progname; +} + +static wchar_t *default_home = NULL; +static wchar_t env_home[MAXPATHLEN+1]; + +void +Py_SetPythonHome(wchar_t *home) +{ + default_home = home; +} + +wchar_t * +Py_GetPythonHome(void) +{ + wchar_t *home = default_home; + if (home == NULL && !Py_IgnoreEnvironmentFlag) { + char* chome = Py_GETENV("PYTHONHOME"); + if (chome) { + size_t size = Py_ARRAY_LENGTH(env_home); + size_t r = mbstowcs(env_home, chome, size); + if (r != (size_t)-1 && r < size) + home = env_home; + } + + } + return home; +} + +/* Create __main__ module */ + +static void +initmain(PyInterpreterState *interp) +{ + PyObject *m, *d, *loader; + m = PyImport_AddModule("__main__"); + if (m == NULL) + Py_FatalError("can't create __main__ module"); + d = PyModule_GetDict(m); + if (PyDict_GetItemString(d, "__builtins__") == NULL) { + PyObject *bimod = PyImport_ImportModule("builtins"); + if (bimod == NULL) { + Py_FatalError("Failed to retrieve builtins module"); + } + if (PyDict_SetItemString(d, "__builtins__", bimod) < 0) { + Py_FatalError("Failed to initialize __main__.__builtins__"); + } + Py_DECREF(bimod); + } + /* Main is a little special - imp.is_builtin("__main__") will return + * False, but BuiltinImporter is still the most appropriate initial + * setting for its __loader__ attribute. A more suitable value will + * be set if __main__ gets further initialized later in the startup + * process. 
+ */ + loader = PyDict_GetItemString(d, "__loader__"); + if (loader == NULL || loader == Py_None) { + PyObject *loader = PyObject_GetAttrString(interp->importlib, + "BuiltinImporter"); + if (loader == NULL) { + Py_FatalError("Failed to retrieve BuiltinImporter"); + } + if (PyDict_SetItemString(d, "__loader__", loader) < 0) { + Py_FatalError("Failed to initialize __main__.__loader__"); + } + Py_DECREF(loader); + } +} + +static int +initfsencoding(PyInterpreterState *interp) +{ + PyObject *codec; + + if (Py_FileSystemDefaultEncoding == NULL) + { + Py_FileSystemDefaultEncoding = get_locale_encoding(); + if (Py_FileSystemDefaultEncoding == NULL) + Py_FatalError("Py_Initialize: Unable to get the locale encoding"); + + Py_HasFileSystemDefaultEncoding = 0; + interp->fscodec_initialized = 1; + return 0; + } + + /* the encoding is mbcs, utf-8 or ascii */ + codec = _PyCodec_Lookup(Py_FileSystemDefaultEncoding); + if (!codec) { + /* Such error can only occurs in critical situations: no more + * memory, import a module of the standard library failed, + * etc. */ + return -1; + } + Py_DECREF(codec); + interp->fscodec_initialized = 1; + return 0; +} + +/* Import the site module (not into __main__ though) */ + +static void +initsite(void) +{ + PyObject *m; + m = PyImport_ImportModule("site"); + if (m == NULL) { + fprintf(stderr, "Failed to import the site module\n"); + PyErr_Print(); + Py_Finalize(); + exit(1); + } + else { + Py_DECREF(m); + } +} + +static PyObject* +create_stdio(PyObject* io, + int fd, int write_mode, char* name, + char* encoding, char* errors) +{ + PyObject *buf = NULL, *stream = NULL, *text = NULL, *raw = NULL, *res; + const char* mode; + const char* newline; + PyObject *line_buffering; + int buffering, isatty; + _Py_IDENTIFIER(open); + _Py_IDENTIFIER(isatty); + _Py_IDENTIFIER(TextIOWrapper); + _Py_IDENTIFIER(mode); + + /* stdin is always opened in buffered mode, first because it shouldn't + make a difference in common use cases, second because TextIOWrapper + depends on the presence of a read1() method which only exists on + buffered streams. + */ + if (Py_UnbufferedStdioFlag && write_mode) + buffering = 0; + else + buffering = -1; + if (write_mode) + mode = "wb"; + else + mode = "rb"; + buf = _PyObject_CallMethodId(io, &PyId_open, "isiOOOi", + fd, mode, buffering, + Py_None, Py_None, Py_None, 0); + if (buf == NULL) + goto error; + + if (buffering) { + _Py_IDENTIFIER(raw); + raw = _PyObject_GetAttrId(buf, &PyId_raw); + if (raw == NULL) + goto error; + } + else { + raw = buf; + Py_INCREF(raw); + } + + text = PyUnicode_FromString(name); + if (text == NULL || _PyObject_SetAttrId(raw, &PyId_name, text) < 0) + goto error; + res = _PyObject_CallMethodId(raw, &PyId_isatty, ""); + if (res == NULL) + goto error; + isatty = PyObject_IsTrue(res); + Py_DECREF(res); + if (isatty == -1) + goto error; + if (isatty || Py_UnbufferedStdioFlag) + line_buffering = Py_True; + else + line_buffering = Py_False; + + Py_CLEAR(raw); + Py_CLEAR(text); + +#ifdef MS_WINDOWS + /* sys.stdin: enable universal newline mode, translate "\r\n" and "\r" + newlines to "\n". + sys.stdout and sys.stderr: translate "\n" to "\r\n". */ + newline = NULL; +#else + /* sys.stdin: split lines at "\n". + sys.stdout and sys.stderr: don't translate newlines (use "\n"). 
*/ + newline = "\n"; +#endif + + stream = _PyObject_CallMethodId(io, &PyId_TextIOWrapper, "OsssO", + buf, encoding, errors, + newline, line_buffering); + Py_CLEAR(buf); + if (stream == NULL) + goto error; + + if (write_mode) + mode = "w"; + else + mode = "r"; + text = PyUnicode_FromString(mode); + if (!text || _PyObject_SetAttrId(stream, &PyId_mode, text) < 0) + goto error; + Py_CLEAR(text); + return stream; + +error: + Py_XDECREF(buf); + Py_XDECREF(stream); + Py_XDECREF(text); + Py_XDECREF(raw); + return NULL; +} + +static int +is_valid_fd(int fd) +{ + int dummy_fd; + if (fd < 0 || !_PyVerify_fd(fd)) + return 0; + dummy_fd = dup(fd); + if (dummy_fd < 0) + return 0; + close(dummy_fd); + return 1; +} + +/* Initialize sys.stdin, stdout, stderr and builtins.open */ +static int +initstdio(void) +{ + PyObject *iomod = NULL, *wrapper; + PyObject *bimod = NULL; + PyObject *m; + PyObject *std = NULL; + int status = 0, fd; + PyObject * encoding_attr; + char *pythonioencoding = NULL, *encoding, *errors; + + /* Hack to avoid a nasty recursion issue when Python is invoked + in verbose mode: pre-import the Latin-1 and UTF-8 codecs */ + if ((m = PyImport_ImportModule("encodings.utf_8")) == NULL) { + goto error; + } + Py_DECREF(m); + + if (!(m = PyImport_ImportModule("encodings.latin_1"))) { + goto error; + } + Py_DECREF(m); + + if (!(bimod = PyImport_ImportModule("builtins"))) { + goto error; + } + + if (!(iomod = PyImport_ImportModule("io"))) { + goto error; + } + if (!(wrapper = PyObject_GetAttrString(iomod, "OpenWrapper"))) { + goto error; + } + + /* Set builtins.open */ + if (PyObject_SetAttrString(bimod, "open", wrapper) == -1) { + Py_DECREF(wrapper); + goto error; + } + Py_DECREF(wrapper); + + encoding = _Py_StandardStreamEncoding; + errors = _Py_StandardStreamErrors; + if (!encoding || !errors) { + if (!errors) { + /* When the LC_CTYPE locale is the POSIX locale ("C locale"), + stdin and stdout use the surrogateescape error handler by + default, instead of the strict error handler. */ + char *loc = setlocale(LC_CTYPE, NULL); + if (loc != NULL && strcmp(loc, "C") == 0) + errors = "surrogateescape"; + } + + pythonioencoding = Py_GETENV("PYTHONIOENCODING"); + if (pythonioencoding) { + char *err; + pythonioencoding = _PyMem_Strdup(pythonioencoding); + if (pythonioencoding == NULL) { + PyErr_NoMemory(); + goto error; + } + err = strchr(pythonioencoding, ':'); + if (err) { + *err = '\0'; + err++; + if (*err && !_Py_StandardStreamErrors) { + errors = err; + } + } + if (*pythonioencoding && !encoding) { + encoding = pythonioencoding; + } + } + } + + /* Set sys.stdin */ + fd = fileno(stdin); + /* Under some conditions stdin, stdout and stderr may not be connected + * and fileno() may point to an invalid file descriptor. For example + * GUI apps don't have valid standard streams by default. 
+ */ + if (!is_valid_fd(fd)) { + std = Py_None; + Py_INCREF(std); + } + else { + std = create_stdio(iomod, fd, 0, "", encoding, errors); + if (std == NULL) + goto error; + } /* if (fd < 0) */ + PySys_SetObject("__stdin__", std); + _PySys_SetObjectId(&PyId_stdin, std); + Py_DECREF(std); + + /* Set sys.stdout */ + fd = fileno(stdout); + if (!is_valid_fd(fd)) { + std = Py_None; + Py_INCREF(std); + } + else { + std = create_stdio(iomod, fd, 1, "", encoding, errors); + if (std == NULL) + goto error; + } /* if (fd < 0) */ + PySys_SetObject("__stdout__", std); + _PySys_SetObjectId(&PyId_stdout, std); + Py_DECREF(std); + +#if 1 /* Disable this if you have trouble debugging bootstrap stuff */ + /* Set sys.stderr, replaces the preliminary stderr */ + fd = fileno(stderr); + if (!is_valid_fd(fd)) { + std = Py_None; + Py_INCREF(std); + } + else { + std = create_stdio(iomod, fd, 1, "", encoding, "backslashreplace"); + if (std == NULL) + goto error; + } /* if (fd < 0) */ + + /* Same as hack above, pre-import stderr's codec to avoid recursion + when import.c tries to write to stderr in verbose mode. */ + encoding_attr = PyObject_GetAttrString(std, "encoding"); + if (encoding_attr != NULL) { + const char * std_encoding; + std_encoding = _PyUnicode_AsString(encoding_attr); + if (std_encoding != NULL) { + PyObject *codec_info = _PyCodec_Lookup(std_encoding); + Py_XDECREF(codec_info); + } + Py_DECREF(encoding_attr); + } + PyErr_Clear(); /* Not a fatal error if codec isn't available */ + + if (PySys_SetObject("__stderr__", std) < 0) { + Py_DECREF(std); + goto error; + } + if (_PySys_SetObjectId(&PyId_stderr, std) < 0) { + Py_DECREF(std); + goto error; + } + Py_DECREF(std); +#endif + + if (0) { + error: + status = -1; + } + + /* We won't need them anymore. */ + if (_Py_StandardStreamEncoding) { + PyMem_RawFree(_Py_StandardStreamEncoding); + _Py_StandardStreamEncoding = NULL; + } + if (_Py_StandardStreamErrors) { + PyMem_RawFree(_Py_StandardStreamErrors); + _Py_StandardStreamErrors = NULL; + } + PyMem_Free(pythonioencoding); + Py_XDECREF(bimod); + Py_XDECREF(iomod); + return status; +} + + +/* Print fatal error message and abort */ + +void +Py_FatalError(const char *msg) +{ + const int fd = fileno(stderr); + PyThreadState *tstate; + + fprintf(stderr, "Fatal Python error: %s\n", msg); + fflush(stderr); /* it helps in Windows debug build */ + if (PyErr_Occurred()) { + PyErr_PrintEx(0); + } + else { + tstate = _Py_atomic_load_relaxed(&_PyThreadState_Current); + if (tstate != NULL) { + fputc('\n', stderr); + fflush(stderr); + _Py_DumpTracebackThreads(fd, tstate->interp, tstate); + } + _PyFaulthandler_Fini(); + } + +#ifdef MS_WINDOWS + { + size_t len = strlen(msg); + WCHAR* buffer; + size_t i; + + /* Convert the message to wchar_t. This uses a simple one-to-one + conversion, assuming that the this error message actually uses ASCII + only. If this ceases to be true, we will have to convert. */ + buffer = alloca( (len+1) * (sizeof *buffer)); + for( i=0; i<=len; ++i) + buffer[i] = msg[i]; + OutputDebugStringW(L"Fatal Python error: "); + OutputDebugStringW(buffer); + OutputDebugStringW(L"\n"); + } +#ifdef _DEBUG + DebugBreak(); +#endif +#endif /* MS_WINDOWS */ + abort(); +} + +/* Clean up and exit */ + +#ifdef WITH_THREAD +#include "pythread.h" +#endif + +static void (*pyexitfunc)(void) = NULL; +/* For the atexit module. 
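
A user-visible consequence of the hard-coded "backslashreplace" handler used for sys.stderr above is that error reporting itself should never die with a UnicodeEncodeError. A small check; the exact output depends on the stream encoding:

    import sys

    print(sys.stderr.errors)                          # 'backslashreplace'
    print("lone surrogate: \udcff", file=sys.stderr)  # escaped instead of raising
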
*/ +void _Py_PyAtExit(void (*func)(void)) +{ + pyexitfunc = func; +} + +static void +call_py_exitfuncs(void) +{ + if (pyexitfunc == NULL) + return; + + (*pyexitfunc)(); + PyErr_Clear(); +} + +/* Wait until threading._shutdown completes, provided + the threading module was imported in the first place. + The shutdown routine will wait until all non-daemon + "threading" threads have completed. */ +static void +wait_for_thread_shutdown(void) +{ +#ifdef WITH_THREAD + _Py_IDENTIFIER(_shutdown); + PyObject *result; + PyThreadState *tstate = PyThreadState_GET(); + PyObject *threading = PyMapping_GetItemString(tstate->interp->modules, + "threading"); + if (threading == NULL) { + /* threading not imported */ + PyErr_Clear(); + return; + } + result = _PyObject_CallMethodId(threading, &PyId__shutdown, ""); + if (result == NULL) { + PyErr_WriteUnraisable(threading); + } + else { + Py_DECREF(result); + } + Py_DECREF(threading); +#endif +} + +#define NEXITFUNCS 32 +static void (*exitfuncs[NEXITFUNCS])(void); +static int nexitfuncs = 0; + +int Py_AtExit(void (*func)(void)) +{ + if (nexitfuncs >= NEXITFUNCS) + return -1; + exitfuncs[nexitfuncs++] = func; + return 0; +} + +static void +call_ll_exitfuncs(void) +{ + while (nexitfuncs > 0) + (*exitfuncs[--nexitfuncs])(); + + fflush(stdout); + fflush(stderr); +} + +void +Py_Exit(int sts) +{ + Py_Finalize(); + + exit(sts); +} + +static void +initsigs(void) +{ +#ifdef SIGPIPE + PyOS_setsig(SIGPIPE, SIG_IGN); +#endif +#ifdef SIGXFZ + PyOS_setsig(SIGXFZ, SIG_IGN); +#endif +#ifdef SIGXFSZ + PyOS_setsig(SIGXFSZ, SIG_IGN); +#endif + PyOS_InitInterrupts(); /* May imply initsignal() */ + if (PyErr_Occurred()) { + Py_FatalError("Py_Initialize: can't import signal"); + } +} + + +/* Restore signals that the interpreter has called SIG_IGN on to SIG_DFL. + * + * All of the code in this function must only use async-signal-safe functions, + * listed at `man 7 signal` or + * http://www.opengroup.org/onlinepubs/009695399/functions/xsh_chap02_04.html. + */ +void +_Py_RestoreSignals(void) +{ +#ifdef SIGPIPE + PyOS_setsig(SIGPIPE, SIG_DFL); +#endif +#ifdef SIGXFZ + PyOS_setsig(SIGXFZ, SIG_DFL); +#endif +#ifdef SIGXFSZ + PyOS_setsig(SIGXFSZ, SIG_DFL); +#endif +} + + +/* + * The file descriptor fd is considered ``interactive'' if either + * a) isatty(fd) is TRUE, or + * b) the -i flag was given, and the filename associated with + * the descriptor is NULL or "" or "???". + */ +int +Py_FdIsInteractive(FILE *fp, const char *filename) +{ + if (isatty((int)fileno(fp))) + return 1; + if (!Py_InteractiveFlag) + return 0; + return (filename == NULL) || + (strcmp(filename, "") == 0) || + (strcmp(filename, "???") == 0); +} + + +#if defined(USE_STACKCHECK) +#if defined(WIN32) && defined(_MSC_VER) + +/* Stack checking for Microsoft C */ + +#include +#include + +/* + * Return non-zero when we run out of memory on the stack; zero otherwise. + */ +int +PyOS_CheckStack(void) +{ + __try { + /* alloca throws a stack overflow exception if there's + not enough space left on the stack */ + alloca(PYOS_STACK_MARGIN * sizeof(void*)); + return 0; + } __except (GetExceptionCode() == STATUS_STACK_OVERFLOW ? + EXCEPTION_EXECUTE_HANDLER : + EXCEPTION_CONTINUE_SEARCH) { + int errcode = _resetstkoflw(); + if (errcode == 0) + { + Py_FatalError("Could not reset the stack!"); + } + } + return 1; +} + +#endif /* WIN32 && _MSC_VER */ + +/* Alternate implementations can be added here... */ + +#endif /* USE_STACKCHECK */ + + +/* Wrappers around sigaction() or signal(). 
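
The effect of initsigs() can be observed directly from Python on POSIX systems: SIGPIPE starts out ignored, which is why a closed pipe surfaces as BrokenPipeError instead of killing the process with a signal. A quick check, POSIX only:

    import signal

    print(signal.getsignal(signal.SIGPIPE) is signal.SIG_IGN)   # True at startup
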
*/ + +PyOS_sighandler_t +PyOS_getsig(int sig) +{ +#ifdef HAVE_SIGACTION + struct sigaction context; + if (sigaction(sig, NULL, &context) == -1) + return SIG_ERR; + return context.sa_handler; +#else + PyOS_sighandler_t handler; +/* Special signal handling for the secure CRT in Visual Studio 2005 */ +#if defined(_MSC_VER) && _MSC_VER >= 1400 + switch (sig) { + /* Only these signals are valid */ + case SIGINT: + case SIGILL: + case SIGFPE: + case SIGSEGV: + case SIGTERM: + case SIGBREAK: + case SIGABRT: + break; + /* Don't call signal() with other values or it will assert */ + default: + return SIG_ERR; + } +#endif /* _MSC_VER && _MSC_VER >= 1400 */ + handler = signal(sig, SIG_IGN); + if (handler != SIG_ERR) + signal(sig, handler); + return handler; +#endif +} + +/* + * All of the code in this function must only use async-signal-safe functions, + * listed at `man 7 signal` or + * http://www.opengroup.org/onlinepubs/009695399/functions/xsh_chap02_04.html. + */ +PyOS_sighandler_t +PyOS_setsig(int sig, PyOS_sighandler_t handler) +{ +#ifdef HAVE_SIGACTION + /* Some code in Modules/signalmodule.c depends on sigaction() being + * used here if HAVE_SIGACTION is defined. Fix that if this code + * changes to invalidate that assumption. + */ + struct sigaction context, ocontext; + context.sa_handler = handler; + sigemptyset(&context.sa_mask); + context.sa_flags = 0; + if (sigaction(sig, &context, &ocontext) == -1) + return SIG_ERR; + return ocontext.sa_handler; +#else + PyOS_sighandler_t oldhandler; + oldhandler = signal(sig, handler); +#ifdef HAVE_SIGINTERRUPT + siginterrupt(sig, 1); +#endif + return oldhandler; +#endif +} + +#ifdef __cplusplus +} +#endif diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -40,7 +40,6 @@ _Py_IDENTIFIER(last_traceback); _Py_IDENTIFIER(last_type); _Py_IDENTIFIER(last_value); -_Py_IDENTIFIER(name); _Py_IDENTIFIER(ps1); _Py_IDENTIFIER(ps2); _Py_IDENTIFIER(stdin); @@ -48,43 +47,13 @@ _Py_IDENTIFIER(stderr); _Py_static_string(PyId_string, ""); -#ifdef Py_REF_DEBUG -static -void _print_total_refs(void) { - PyObject *xoptions, *value; - _Py_IDENTIFIER(showrefcount); - - xoptions = PySys_GetXOptions(); - if (xoptions == NULL) - return; - value = _PyDict_GetItemId(xoptions, &PyId_showrefcount); - if (value == Py_True) - fprintf(stderr, - "[%" PY_FORMAT_SIZE_T "d refs, " - "%" PY_FORMAT_SIZE_T "d blocks]\n", - _Py_GetRefTotal(), _Py_GetAllocatedBlocks()); -} -#endif - -#ifndef Py_REF_DEBUG -#define PRINT_TOTAL_REFS() -#else /* Py_REF_DEBUG */ -#define PRINT_TOTAL_REFS() _print_total_refs() -#endif - #ifdef __cplusplus extern "C" { #endif -extern wchar_t *Py_GetPath(void); - extern grammar _PyParser_Grammar; /* From graminit.c */ /* Forward */ -static void initmain(PyInterpreterState *interp); -static int initfsencoding(PyInterpreterState *interp); -static void initsite(void); -static int initstdio(void); static void flush_io(void); static PyObject *run_mod(mod_ty, PyObject *, PyObject *, PyObject *, PyCompilerFlags *, PyArena *); @@ -92,1192 +61,6 @@ PyCompilerFlags *); static void err_input(perrdetail *); static void err_free(perrdetail *); -static void initsigs(void); -static void call_py_exitfuncs(void); -static void wait_for_thread_shutdown(void); -static void call_ll_exitfuncs(void); -extern int _PyUnicode_Init(void); -extern int _PyStructSequence_Init(void); -extern void _PyUnicode_Fini(void); -extern int _PyLong_Init(void); -extern void PyLong_Fini(void); -extern int _PyFaulthandler_Init(void); -extern void 
_PyFaulthandler_Fini(void); -extern void _PyHash_Fini(void); -extern int _PyTraceMalloc_Init(void); -extern int _PyTraceMalloc_Fini(void); - -#ifdef WITH_THREAD -extern void _PyGILState_Init(PyInterpreterState *, PyThreadState *); -extern void _PyGILState_Fini(void); -#endif /* WITH_THREAD */ - -int Py_DebugFlag; /* Needed by parser.c */ -int Py_VerboseFlag; /* Needed by import.c */ -int Py_QuietFlag; /* Needed by sysmodule.c */ -int Py_InteractiveFlag; /* Needed by Py_FdIsInteractive() below */ -int Py_InspectFlag; /* Needed to determine whether to exit at SystemExit */ -int Py_NoSiteFlag; /* Suppress 'import site' */ -int Py_BytesWarningFlag; /* Warn on str(bytes) and str(buffer) */ -int Py_DontWriteBytecodeFlag; /* Suppress writing bytecode files (*.py[co]) */ -int Py_UseClassExceptionsFlag = 1; /* Needed by bltinmodule.c: deprecated */ -int Py_FrozenFlag; /* Needed by getpath.c */ -int Py_IgnoreEnvironmentFlag; /* e.g. PYTHONPATH, PYTHONHOME */ -int Py_NoUserSiteDirectory = 0; /* for -s and site.py */ -int Py_UnbufferedStdioFlag = 0; /* Unbuffered binary std{in,out,err} */ -int Py_HashRandomizationFlag = 0; /* for -R and PYTHONHASHSEED */ -int Py_IsolatedFlag = 0; /* for -I, isolate from user's env */ - -PyThreadState *_Py_Finalizing = NULL; - -/* Hack to force loading of object files */ -int (*_PyOS_mystrnicmp_hack)(const char *, const char *, Py_ssize_t) = \ - PyOS_mystrnicmp; /* Python/pystrcmp.o */ - -/* PyModule_GetWarningsModule is no longer necessary as of 2.6 -since _warnings is builtin. This API should not be used. */ -PyObject * -PyModule_GetWarningsModule(void) -{ - return PyImport_ImportModule("warnings"); -} - -static int initialized = 0; - -/* API to access the initialized flag -- useful for esoteric use */ - -int -Py_IsInitialized(void) -{ - return initialized; -} - -/* Helper to allow an embedding application to override the normal - * mechanism that attempts to figure out an appropriate IO encoding - */ - -static char *_Py_StandardStreamEncoding = NULL; -static char *_Py_StandardStreamErrors = NULL; - -int -Py_SetStandardStreamEncoding(const char *encoding, const char *errors) -{ - if (Py_IsInitialized()) { - /* This is too late to have any effect */ - return -1; - } - /* Can't call PyErr_NoMemory() on errors, as Python hasn't been - * initialised yet. - * - * However, the raw memory allocators are initialised appropriately - * as C static variables, so _PyMem_RawStrdup is OK even though - * Py_Initialize hasn't been called yet. - */ - if (encoding) { - _Py_StandardStreamEncoding = _PyMem_RawStrdup(encoding); - if (!_Py_StandardStreamEncoding) { - return -2; - } - } - if (errors) { - _Py_StandardStreamErrors = _PyMem_RawStrdup(errors); - if (!_Py_StandardStreamErrors) { - if (_Py_StandardStreamEncoding) { - PyMem_RawFree(_Py_StandardStreamEncoding); - } - return -3; - } - } - return 0; -} - -/* Global initializations. Can be undone by Py_Finalize(). Don't - call this twice without an intervening Py_Finalize() call. When - initializations fail, a fatal error is issued and the function does - not return. On return, the first thread and interpreter state have - been created. - - Locking: you must hold the interpreter lock while calling this. - (If the lock has not yet been initialized, that's equivalent to - having the lock, but you cannot use multiple threads.) 
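
The C globals moved here (Py_VerboseFlag, Py_NoSiteFlag, Py_DontWriteBytecodeFlag, Py_IsolatedFlag and friends) are what the read-only sys.flags struct sequence reports at the Python level, for example:

    import sys

    print(sys.flags.verbose, sys.flags.no_site, sys.flags.dont_write_bytecode)
    print(sys.flags.isolated)    # mirrors Py_IsolatedFlag (-I)
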
- -*/ - -static int -add_flag(int flag, const char *envs) -{ - int env = atoi(envs); - if (flag < env) - flag = env; - if (flag < 1) - flag = 1; - return flag; -} - -static char* -get_codec_name(const char *encoding) -{ - char *name_utf8, *name_str; - PyObject *codec, *name = NULL; - - codec = _PyCodec_Lookup(encoding); - if (!codec) - goto error; - - name = _PyObject_GetAttrId(codec, &PyId_name); - Py_CLEAR(codec); - if (!name) - goto error; - - name_utf8 = _PyUnicode_AsString(name); - if (name_utf8 == NULL) - goto error; - name_str = _PyMem_RawStrdup(name_utf8); - Py_DECREF(name); - if (name_str == NULL) { - PyErr_NoMemory(); - return NULL; - } - return name_str; - -error: - Py_XDECREF(codec); - Py_XDECREF(name); - return NULL; -} - -static char* -get_locale_encoding(void) -{ -#ifdef MS_WINDOWS - char codepage[100]; - PyOS_snprintf(codepage, sizeof(codepage), "cp%d", GetACP()); - return get_codec_name(codepage); -#elif defined(HAVE_LANGINFO_H) && defined(CODESET) - char* codeset = nl_langinfo(CODESET); - if (!codeset || codeset[0] == '\0') { - PyErr_SetString(PyExc_ValueError, "CODESET is not set or empty"); - return NULL; - } - return get_codec_name(codeset); -#else - PyErr_SetNone(PyExc_NotImplementedError); - return NULL; -#endif -} - -static void -import_init(PyInterpreterState *interp, PyObject *sysmod) -{ - PyObject *importlib; - PyObject *impmod; - PyObject *sys_modules; - PyObject *value; - - /* Import _importlib through its frozen version, _frozen_importlib. */ - if (PyImport_ImportFrozenModule("_frozen_importlib") <= 0) { - Py_FatalError("Py_Initialize: can't import _frozen_importlib"); - } - else if (Py_VerboseFlag) { - PySys_FormatStderr("import _frozen_importlib # frozen\n"); - } - importlib = PyImport_AddModule("_frozen_importlib"); - if (importlib == NULL) { - Py_FatalError("Py_Initialize: couldn't get _frozen_importlib from " - "sys.modules"); - } - interp->importlib = importlib; - Py_INCREF(interp->importlib); - - /* Install _importlib as __import__ */ - impmod = PyInit_imp(); - if (impmod == NULL) { - Py_FatalError("Py_Initialize: can't import imp"); - } - else if (Py_VerboseFlag) { - PySys_FormatStderr("import imp # builtin\n"); - } - sys_modules = PyImport_GetModuleDict(); - if (Py_VerboseFlag) { - PySys_FormatStderr("import sys # builtin\n"); - } - if (PyDict_SetItemString(sys_modules, "_imp", impmod) < 0) { - Py_FatalError("Py_Initialize: can't save _imp to sys.modules"); - } - - value = PyObject_CallMethod(importlib, "_install", "OO", sysmod, impmod); - if (value == NULL) { - PyErr_Print(); - Py_FatalError("Py_Initialize: importlib install failed"); - } - Py_DECREF(value); - Py_DECREF(impmod); - - _PyImportZip_Init(); -} - - -void -_Py_InitializeEx_Private(int install_sigs, int install_importlib) -{ - PyInterpreterState *interp; - PyThreadState *tstate; - PyObject *bimod, *sysmod, *pstderr; - char *p; - extern void _Py_ReadyTypes(void); - - if (initialized) - return; - initialized = 1; - _Py_Finalizing = NULL; - -#if defined(HAVE_LANGINFO_H) && defined(HAVE_SETLOCALE) - /* Set up the LC_CTYPE locale, so we can obtain - the locale's charset without having to switch - locales. 
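
A rough Python-level counterpart of the get_locale_encoding()/get_codec_name() pair above, assuming a POSIX platform where nl_langinfo(CODESET) is available:

    import codecs, locale

    raw_name = locale.nl_langinfo(locale.CODESET)   # e.g. 'UTF-8', locale dependent
    print(codecs.lookup(raw_name).name)             # normalised codec name, e.g. 'utf-8'
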
*/ - setlocale(LC_CTYPE, ""); -#endif - - if ((p = Py_GETENV("PYTHONDEBUG")) && *p != '\0') - Py_DebugFlag = add_flag(Py_DebugFlag, p); - if ((p = Py_GETENV("PYTHONVERBOSE")) && *p != '\0') - Py_VerboseFlag = add_flag(Py_VerboseFlag, p); - if ((p = Py_GETENV("PYTHONOPTIMIZE")) && *p != '\0') - Py_OptimizeFlag = add_flag(Py_OptimizeFlag, p); - if ((p = Py_GETENV("PYTHONDONTWRITEBYTECODE")) && *p != '\0') - Py_DontWriteBytecodeFlag = add_flag(Py_DontWriteBytecodeFlag, p); - /* The variable is only tested for existence here; _PyRandom_Init will - check its value further. */ - if ((p = Py_GETENV("PYTHONHASHSEED")) && *p != '\0') - Py_HashRandomizationFlag = add_flag(Py_HashRandomizationFlag, p); - - _PyRandom_Init(); - - interp = PyInterpreterState_New(); - if (interp == NULL) - Py_FatalError("Py_Initialize: can't make first interpreter"); - - tstate = PyThreadState_New(interp); - if (tstate == NULL) - Py_FatalError("Py_Initialize: can't make first thread"); - (void) PyThreadState_Swap(tstate); - -#ifdef WITH_THREAD - /* We can't call _PyEval_FiniThreads() in Py_Finalize because - destroying the GIL might fail when it is being referenced from - another running thread (see issue #9901). - Instead we destroy the previously created GIL here, which ensures - that we can call Py_Initialize / Py_Finalize multiple times. */ - _PyEval_FiniThreads(); - - /* Auto-thread-state API */ - _PyGILState_Init(interp, tstate); -#endif /* WITH_THREAD */ - - _Py_ReadyTypes(); - - if (!_PyFrame_Init()) - Py_FatalError("Py_Initialize: can't init frames"); - - if (!_PyLong_Init()) - Py_FatalError("Py_Initialize: can't init longs"); - - if (!PyByteArray_Init()) - Py_FatalError("Py_Initialize: can't init bytearray"); - - if (!_PyFloat_Init()) - Py_FatalError("Py_Initialize: can't init float"); - - interp->modules = PyDict_New(); - if (interp->modules == NULL) - Py_FatalError("Py_Initialize: can't make modules dictionary"); - - /* Init Unicode implementation; relies on the codec registry */ - if (_PyUnicode_Init() < 0) - Py_FatalError("Py_Initialize: can't initialize unicode"); - if (_PyStructSequence_Init() < 0) - Py_FatalError("Py_Initialize: can't initialize structseq"); - - bimod = _PyBuiltin_Init(); - if (bimod == NULL) - Py_FatalError("Py_Initialize: can't initialize builtins modules"); - _PyImport_FixupBuiltin(bimod, "builtins"); - interp->builtins = PyModule_GetDict(bimod); - if (interp->builtins == NULL) - Py_FatalError("Py_Initialize: can't initialize builtins dict"); - Py_INCREF(interp->builtins); - - /* initialize builtin exceptions */ - _PyExc_Init(bimod); - - sysmod = _PySys_Init(); - if (sysmod == NULL) - Py_FatalError("Py_Initialize: can't initialize sys"); - interp->sysdict = PyModule_GetDict(sysmod); - if (interp->sysdict == NULL) - Py_FatalError("Py_Initialize: can't initialize sys dict"); - Py_INCREF(interp->sysdict); - _PyImport_FixupBuiltin(sysmod, "sys"); - PySys_SetPath(Py_GetPath()); - PyDict_SetItemString(interp->sysdict, "modules", - interp->modules); - - /* Set up a preliminary stderr printer until we have enough - infrastructure for the io module in place. */ - pstderr = PyFile_NewStdPrinter(fileno(stderr)); - if (pstderr == NULL) - Py_FatalError("Py_Initialize: can't set preliminary stderr"); - _PySys_SetObjectId(&PyId_stderr, pstderr); - PySys_SetObject("__stderr__", pstderr); - Py_DECREF(pstderr); - - _PyImport_Init(); - - _PyImportHooks_Init(); - - /* Initialize _warnings. 
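
add_flag() keeps the larger of the command-line count and the integer value of the environment variable, so PYTHONVERBOSE=2 behaves like -vv. A hypothetical check from a child process (the verbose import tracing goes to stderr and is discarded here):

    import os, subprocess, sys

    env = dict(os.environ, PYTHONVERBOSE="2")
    out = subprocess.check_output(
        [sys.executable, "-c", "import sys; print(sys.flags.verbose)"],
        env=env, stderr=subprocess.DEVNULL)
    print(out)   # expected: b'2\n'
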
*/ - _PyWarnings_Init(); - - if (!install_importlib) - return; - - import_init(interp, sysmod); - - /* initialize the faulthandler module */ - if (_PyFaulthandler_Init()) - Py_FatalError("Py_Initialize: can't initialize faulthandler"); - - if (_PyTime_Init() < 0) - Py_FatalError("Py_Initialize: can't initialize time"); - - if (initfsencoding(interp) < 0) - Py_FatalError("Py_Initialize: unable to load the file system codec"); - - if (install_sigs) - initsigs(); /* Signal handling stuff, including initintr() */ - - if (_PyTraceMalloc_Init() < 0) - Py_FatalError("Py_Initialize: can't initialize tracemalloc"); - - initmain(interp); /* Module __main__ */ - if (initstdio() < 0) - Py_FatalError( - "Py_Initialize: can't initialize sys standard streams"); - - /* Initialize warnings. */ - if (PySys_HasWarnOptions()) { - PyObject *warnings_module = PyImport_ImportModule("warnings"); - if (warnings_module == NULL) { - fprintf(stderr, "'import warnings' failed; traceback:\n"); - PyErr_Print(); - } - Py_XDECREF(warnings_module); - } - - if (!Py_NoSiteFlag) - initsite(); /* Module site */ -} - -void -Py_InitializeEx(int install_sigs) -{ - _Py_InitializeEx_Private(install_sigs, 1); -} - -void -Py_Initialize(void) -{ - Py_InitializeEx(1); -} - - -#ifdef COUNT_ALLOCS -extern void dump_counts(FILE*); -#endif - -/* Flush stdout and stderr */ - -static int -file_is_closed(PyObject *fobj) -{ - int r; - PyObject *tmp = PyObject_GetAttrString(fobj, "closed"); - if (tmp == NULL) { - PyErr_Clear(); - return 0; - } - r = PyObject_IsTrue(tmp); - Py_DECREF(tmp); - if (r < 0) - PyErr_Clear(); - return r > 0; -} - -static void -flush_std_files(void) -{ - PyObject *fout = _PySys_GetObjectId(&PyId_stdout); - PyObject *ferr = _PySys_GetObjectId(&PyId_stderr); - PyObject *tmp; - - if (fout != NULL && fout != Py_None && !file_is_closed(fout)) { - tmp = _PyObject_CallMethodId(fout, &PyId_flush, ""); - if (tmp == NULL) - PyErr_WriteUnraisable(fout); - else - Py_DECREF(tmp); - } - - if (ferr != NULL && ferr != Py_None && !file_is_closed(ferr)) { - tmp = _PyObject_CallMethodId(ferr, &PyId_flush, ""); - if (tmp == NULL) - PyErr_Clear(); - else - Py_DECREF(tmp); - } -} - -/* Undo the effect of Py_Initialize(). - - Beware: if multiple interpreter and/or thread states exist, these - are not wiped out; only the current thread and interpreter state - are deleted. But since everything else is deleted, those other - interpreter and thread states should no longer be used. - - (XXX We should do better, e.g. wipe out all interpreters and - threads.) - - Locking: as above. - -*/ - -void -Py_Finalize(void) -{ - PyInterpreterState *interp; - PyThreadState *tstate; - - if (!initialized) - return; - - wait_for_thread_shutdown(); - - /* The interpreter is still entirely intact at this point, and the - * exit funcs may be relying on that. In particular, if some thread - * or exit func is still waiting to do an import, the import machinery - * expects Py_IsInitialized() to return true. So don't say the - * interpreter is uninitialized until after the exit funcs have run. - * Note that Threading.py uses an exit func to do a join on all the - * threads created thru it, so this also protects pending imports in - * the threads created via Threading. - */ - call_py_exitfuncs(); - - /* Get current thread state and interpreter pointer */ - tstate = PyThreadState_GET(); - interp = tstate->interp; - - /* Remaining threads (e.g. daemon threads) will automatically exit - after taking the GIL (in PyEval_RestoreThread()). 
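
_PyFaulthandler_Init() only prepares the module; the fault handler itself is armed on demand, or through PYTHONFAULTHANDLER / -X faulthandler. From Python:

    import faulthandler

    print(faulthandler.is_enabled())   # False unless enabled via the environment
    faulthandler.enable()
    print(faulthandler.is_enabled())   # True
    faulthandler.dump_traceback()      # dump the tracebacks of all threads to stderr
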
*/ - _Py_Finalizing = tstate; - initialized = 0; - - /* Flush stdout+stderr */ - flush_std_files(); - - /* Disable signal handling */ - PyOS_FiniInterrupts(); - - /* Collect garbage. This may call finalizers; it's nice to call these - * before all modules are destroyed. - * XXX If a __del__ or weakref callback is triggered here, and tries to - * XXX import a module, bad things can happen, because Python no - * XXX longer believes it's initialized. - * XXX Fatal Python error: Interpreter not initialized (version mismatch?) - * XXX is easy to provoke that way. I've also seen, e.g., - * XXX Exception exceptions.ImportError: 'No module named sha' - * XXX in ignored - * XXX but I'm unclear on exactly how that one happens. In any case, - * XXX I haven't seen a real-life report of either of these. - */ - PyGC_Collect(); -#ifdef COUNT_ALLOCS - /* With COUNT_ALLOCS, it helps to run GC multiple times: - each collection might release some types from the type - list, so they become garbage. */ - while (PyGC_Collect() > 0) - /* nothing */; -#endif - /* Destroy all modules */ - PyImport_Cleanup(); - - /* Flush stdout+stderr (again, in case more was printed) */ - flush_std_files(); - - /* Collect final garbage. This disposes of cycles created by - * class definitions, for example. - * XXX This is disabled because it caused too many problems. If - * XXX a __del__ or weakref callback triggers here, Python code has - * XXX a hard time running, because even the sys module has been - * XXX cleared out (sys.stdout is gone, sys.excepthook is gone, etc). - * XXX One symptom is a sequence of information-free messages - * XXX coming from threads (if a __del__ or callback is invoked, - * XXX other threads can execute too, and any exception they encounter - * XXX triggers a comedy of errors as subsystem after subsystem - * XXX fails to find what it *expects* to find in sys to help report - * XXX the exception and consequent unexpected failures). I've also - * XXX seen segfaults then, after adding print statements to the - * XXX Python code getting called. - */ -#if 0 - PyGC_Collect(); -#endif - - /* Disable tracemalloc after all Python objects have been destroyed, - so it is possible to use tracemalloc in objects destructor. */ - _PyTraceMalloc_Fini(); - - /* Destroy the database used by _PyImport_{Fixup,Find}Extension */ - _PyImport_Fini(); - - /* Cleanup typeobject.c's internal caches. */ - _PyType_Fini(); - - /* unload faulthandler module */ - _PyFaulthandler_Fini(); - - /* Debugging stuff */ -#ifdef COUNT_ALLOCS - dump_counts(stdout); -#endif - /* dump hash stats */ - _PyHash_Fini(); - - PRINT_TOTAL_REFS(); - -#ifdef Py_TRACE_REFS - /* Display all objects still alive -- this can invoke arbitrary - * __repr__ overrides, so requires a mostly-intact interpreter. - * Alas, a lot of stuff may still be alive now that will be cleaned - * up later. - */ - if (Py_GETENV("PYTHONDUMPREFS")) - _Py_PrintReferences(stderr); -#endif /* Py_TRACE_REFS */ - - /* Clear interpreter state and all thread states. */ - PyInterpreterState_Clear(interp); - - /* Now we decref the exception classes. After this point nothing - can raise an exception. That's okay, because each Fini() method - below has been checked to make sure no exceptions are ever - raised. 
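
Because Py_Finalize() starts with wait_for_thread_shutdown(), i.e. threading._shutdown(), an ordinary non-daemon thread is always joined before module teardown begins. A small sketch:

    import threading, time

    def worker():
        time.sleep(0.2)
        print("worker finished before interpreter teardown")

    threading.Thread(target=worker).start()
    print("main falls off the end first")
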
- */ - - _PyExc_Fini(); - - /* Sundry finalizers */ - PyMethod_Fini(); - PyFrame_Fini(); - PyCFunction_Fini(); - PyTuple_Fini(); - PyList_Fini(); - PySet_Fini(); - PyBytes_Fini(); - PyByteArray_Fini(); - PyLong_Fini(); - PyFloat_Fini(); - PyDict_Fini(); - PySlice_Fini(); - _PyGC_Fini(); - _PyRandom_Fini(); - - /* Cleanup Unicode implementation */ - _PyUnicode_Fini(); - - /* reset file system default encoding */ - if (!Py_HasFileSystemDefaultEncoding && Py_FileSystemDefaultEncoding) { - PyMem_RawFree((char*)Py_FileSystemDefaultEncoding); - Py_FileSystemDefaultEncoding = NULL; - } - - /* XXX Still allocated: - - various static ad-hoc pointers to interned strings - - int and float free list blocks - - whatever various modules and libraries allocate - */ - - PyGrammar_RemoveAccelerators(&_PyParser_Grammar); - - /* Cleanup auto-thread-state */ -#ifdef WITH_THREAD - _PyGILState_Fini(); -#endif /* WITH_THREAD */ - - /* Delete current thread. After this, many C API calls become crashy. */ - PyThreadState_Swap(NULL); - PyInterpreterState_Delete(interp); - -#ifdef Py_TRACE_REFS - /* Display addresses (& refcnts) of all objects still alive. - * An address can be used to find the repr of the object, printed - * above by _Py_PrintReferences. - */ - if (Py_GETENV("PYTHONDUMPREFS")) - _Py_PrintReferenceAddresses(stderr); -#endif /* Py_TRACE_REFS */ -#ifdef PYMALLOC_DEBUG - if (Py_GETENV("PYTHONMALLOCSTATS")) - _PyObject_DebugMallocStats(stderr); -#endif - - call_ll_exitfuncs(); -} - -/* Create and initialize a new interpreter and thread, and return the - new thread. This requires that Py_Initialize() has been called - first. - - Unsuccessful initialization yields a NULL pointer. Note that *no* - exception information is available even in this case -- the - exception information is held in the thread, and there is no - thread. - - Locking: as above. - -*/ - -PyThreadState * -Py_NewInterpreter(void) -{ - PyInterpreterState *interp; - PyThreadState *tstate, *save_tstate; - PyObject *bimod, *sysmod; - - if (!initialized) - Py_FatalError("Py_NewInterpreter: call Py_Initialize first"); - - interp = PyInterpreterState_New(); - if (interp == NULL) - return NULL; - - tstate = PyThreadState_New(interp); - if (tstate == NULL) { - PyInterpreterState_Delete(interp); - return NULL; - } - - save_tstate = PyThreadState_Swap(tstate); - - /* XXX The following is lax in error checking */ - - interp->modules = PyDict_New(); - - bimod = _PyImport_FindBuiltin("builtins"); - if (bimod != NULL) { - interp->builtins = PyModule_GetDict(bimod); - if (interp->builtins == NULL) - goto handle_error; - Py_INCREF(interp->builtins); - } - - /* initialize builtin exceptions */ - _PyExc_Init(bimod); - - sysmod = _PyImport_FindBuiltin("sys"); - if (bimod != NULL && sysmod != NULL) { - PyObject *pstderr; - - interp->sysdict = PyModule_GetDict(sysmod); - if (interp->sysdict == NULL) - goto handle_error; - Py_INCREF(interp->sysdict); - PySys_SetPath(Py_GetPath()); - PyDict_SetItemString(interp->sysdict, "modules", - interp->modules); - /* Set up a preliminary stderr printer until we have enough - infrastructure for the io module in place. 
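
The file system default encoding released near the end of Py_Finalize() above is the one initfsencoding() installed at startup; it is what sys.getfilesystemencoding() and os.fsencode()/os.fsdecode() use. An example, assuming a UTF-8 locale:

    import os, sys

    print(sys.getfilesystemencoding())   # e.g. 'utf-8', locale dependent
    print(os.fsencode("café"))           # b'caf\xc3\xa9' under a UTF-8 locale
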
*/ - pstderr = PyFile_NewStdPrinter(fileno(stderr)); - if (pstderr == NULL) - Py_FatalError("Py_Initialize: can't set preliminary stderr"); - _PySys_SetObjectId(&PyId_stderr, pstderr); - PySys_SetObject("__stderr__", pstderr); - Py_DECREF(pstderr); - - _PyImportHooks_Init(); - - import_init(interp, sysmod); - - if (initfsencoding(interp) < 0) - goto handle_error; - - if (initstdio() < 0) - Py_FatalError( - "Py_Initialize: can't initialize sys standard streams"); - initmain(interp); - if (!Py_NoSiteFlag) - initsite(); - } - - if (!PyErr_Occurred()) - return tstate; - -handle_error: - /* Oops, it didn't work. Undo it all. */ - - PyErr_PrintEx(0); - PyThreadState_Clear(tstate); - PyThreadState_Swap(save_tstate); - PyThreadState_Delete(tstate); - PyInterpreterState_Delete(interp); - - return NULL; -} - -/* Delete an interpreter and its last thread. This requires that the - given thread state is current, that the thread has no remaining - frames, and that it is its interpreter's only remaining thread. - It is a fatal error to violate these constraints. - - (Py_Finalize() doesn't have these constraints -- it zaps - everything, regardless.) - - Locking: as above. - -*/ - -void -Py_EndInterpreter(PyThreadState *tstate) -{ - PyInterpreterState *interp = tstate->interp; - - if (tstate != PyThreadState_GET()) - Py_FatalError("Py_EndInterpreter: thread is not current"); - if (tstate->frame != NULL) - Py_FatalError("Py_EndInterpreter: thread still has a frame"); - - wait_for_thread_shutdown(); - - if (tstate != interp->tstate_head || tstate->next != NULL) - Py_FatalError("Py_EndInterpreter: not the last thread"); - - PyImport_Cleanup(); - PyInterpreterState_Clear(interp); - PyThreadState_Swap(NULL); - PyInterpreterState_Delete(interp); -} - -#ifdef MS_WINDOWS -static wchar_t *progname = L"python"; -#else -static wchar_t *progname = L"python3"; -#endif - -void -Py_SetProgramName(wchar_t *pn) -{ - if (pn && *pn) - progname = pn; -} - -wchar_t * -Py_GetProgramName(void) -{ - return progname; -} - -static wchar_t *default_home = NULL; -static wchar_t env_home[MAXPATHLEN+1]; - -void -Py_SetPythonHome(wchar_t *home) -{ - default_home = home; -} - -wchar_t * -Py_GetPythonHome(void) -{ - wchar_t *home = default_home; - if (home == NULL && !Py_IgnoreEnvironmentFlag) { - char* chome = Py_GETENV("PYTHONHOME"); - if (chome) { - size_t size = Py_ARRAY_LENGTH(env_home); - size_t r = mbstowcs(env_home, chome, size); - if (r != (size_t)-1 && r < size) - home = env_home; - } - - } - return home; -} - -/* Create __main__ module */ - -static void -initmain(PyInterpreterState *interp) -{ - PyObject *m, *d, *loader; - m = PyImport_AddModule("__main__"); - if (m == NULL) - Py_FatalError("can't create __main__ module"); - d = PyModule_GetDict(m); - if (PyDict_GetItemString(d, "__builtins__") == NULL) { - PyObject *bimod = PyImport_ImportModule("builtins"); - if (bimod == NULL) { - Py_FatalError("Failed to retrieve builtins module"); - } - if (PyDict_SetItemString(d, "__builtins__", bimod) < 0) { - Py_FatalError("Failed to initialize __main__.__builtins__"); - } - Py_DECREF(bimod); - } - /* Main is a little special - imp.is_builtin("__main__") will return - * False, but BuiltinImporter is still the most appropriate initial - * setting for its __loader__ attribute. A more suitable value will - * be set if __main__ gets further initialized later in the startup - * process. 
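
What initmain() sets up is visible from a plain interactive session or a -c command line, before any script-specific loader replaces the provisional one:

    import sys

    main = sys.modules["__main__"]
    print(main.__loader__)               # BuiltinImporter until something better is set
    print("__builtins__" in vars(main))  # True
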
- */ - loader = PyDict_GetItemString(d, "__loader__"); - if (loader == NULL || loader == Py_None) { - PyObject *loader = PyObject_GetAttrString(interp->importlib, - "BuiltinImporter"); - if (loader == NULL) { - Py_FatalError("Failed to retrieve BuiltinImporter"); - } - if (PyDict_SetItemString(d, "__loader__", loader) < 0) { - Py_FatalError("Failed to initialize __main__.__loader__"); - } - Py_DECREF(loader); - } -} - -static int -initfsencoding(PyInterpreterState *interp) -{ - PyObject *codec; - - if (Py_FileSystemDefaultEncoding == NULL) - { - Py_FileSystemDefaultEncoding = get_locale_encoding(); - if (Py_FileSystemDefaultEncoding == NULL) - Py_FatalError("Py_Initialize: Unable to get the locale encoding"); - - Py_HasFileSystemDefaultEncoding = 0; - interp->fscodec_initialized = 1; - return 0; - } - - /* the encoding is mbcs, utf-8 or ascii */ - codec = _PyCodec_Lookup(Py_FileSystemDefaultEncoding); - if (!codec) { - /* Such error can only occurs in critical situations: no more - * memory, import a module of the standard library failed, - * etc. */ - return -1; - } - Py_DECREF(codec); - interp->fscodec_initialized = 1; - return 0; -} - -/* Import the site module (not into __main__ though) */ - -static void -initsite(void) -{ - PyObject *m; - m = PyImport_ImportModule("site"); - if (m == NULL) { - fprintf(stderr, "Failed to import the site module\n"); - PyErr_Print(); - Py_Finalize(); - exit(1); - } - else { - Py_DECREF(m); - } -} - -static PyObject* -create_stdio(PyObject* io, - int fd, int write_mode, char* name, - char* encoding, char* errors) -{ - PyObject *buf = NULL, *stream = NULL, *text = NULL, *raw = NULL, *res; - const char* mode; - const char* newline; - PyObject *line_buffering; - int buffering, isatty; - _Py_IDENTIFIER(open); - _Py_IDENTIFIER(isatty); - _Py_IDENTIFIER(TextIOWrapper); - _Py_IDENTIFIER(mode); - - /* stdin is always opened in buffered mode, first because it shouldn't - make a difference in common use cases, second because TextIOWrapper - depends on the presence of a read1() method which only exists on - buffered streams. - */ - if (Py_UnbufferedStdioFlag && write_mode) - buffering = 0; - else - buffering = -1; - if (write_mode) - mode = "wb"; - else - mode = "rb"; - buf = _PyObject_CallMethodId(io, &PyId_open, "isiOOOi", - fd, mode, buffering, - Py_None, Py_None, Py_None, 0); - if (buf == NULL) - goto error; - - if (buffering) { - _Py_IDENTIFIER(raw); - raw = _PyObject_GetAttrId(buf, &PyId_raw); - if (raw == NULL) - goto error; - } - else { - raw = buf; - Py_INCREF(raw); - } - - text = PyUnicode_FromString(name); - if (text == NULL || _PyObject_SetAttrId(raw, &PyId_name, text) < 0) - goto error; - res = _PyObject_CallMethodId(raw, &PyId_isatty, ""); - if (res == NULL) - goto error; - isatty = PyObject_IsTrue(res); - Py_DECREF(res); - if (isatty == -1) - goto error; - if (isatty || Py_UnbufferedStdioFlag) - line_buffering = Py_True; - else - line_buffering = Py_False; - - Py_CLEAR(raw); - Py_CLEAR(text); - -#ifdef MS_WINDOWS - /* sys.stdin: enable universal newline mode, translate "\r\n" and "\r" - newlines to "\n". - sys.stdout and sys.stderr: translate "\n" to "\r\n". */ - newline = NULL; -#else - /* sys.stdin: split lines at "\n". - sys.stdout and sys.stderr: don't translate newlines (use "\n"). 
*/ - newline = "\n"; -#endif - - stream = _PyObject_CallMethodId(io, &PyId_TextIOWrapper, "OsssO", - buf, encoding, errors, - newline, line_buffering); - Py_CLEAR(buf); - if (stream == NULL) - goto error; - - if (write_mode) - mode = "w"; - else - mode = "r"; - text = PyUnicode_FromString(mode); - if (!text || _PyObject_SetAttrId(stream, &PyId_mode, text) < 0) - goto error; - Py_CLEAR(text); - return stream; - -error: - Py_XDECREF(buf); - Py_XDECREF(stream); - Py_XDECREF(text); - Py_XDECREF(raw); - return NULL; -} - -static int -is_valid_fd(int fd) -{ - int dummy_fd; - if (fd < 0 || !_PyVerify_fd(fd)) - return 0; - dummy_fd = dup(fd); - if (dummy_fd < 0) - return 0; - close(dummy_fd); - return 1; -} - -/* Initialize sys.stdin, stdout, stderr and builtins.open */ -static int -initstdio(void) -{ - PyObject *iomod = NULL, *wrapper; - PyObject *bimod = NULL; - PyObject *m; - PyObject *std = NULL; - int status = 0, fd; - PyObject * encoding_attr; - char *pythonioencoding = NULL, *encoding, *errors; - - /* Hack to avoid a nasty recursion issue when Python is invoked - in verbose mode: pre-import the Latin-1 and UTF-8 codecs */ - if ((m = PyImport_ImportModule("encodings.utf_8")) == NULL) { - goto error; - } - Py_DECREF(m); - - if (!(m = PyImport_ImportModule("encodings.latin_1"))) { - goto error; - } - Py_DECREF(m); - - if (!(bimod = PyImport_ImportModule("builtins"))) { - goto error; - } - - if (!(iomod = PyImport_ImportModule("io"))) { - goto error; - } - if (!(wrapper = PyObject_GetAttrString(iomod, "OpenWrapper"))) { - goto error; - } - - /* Set builtins.open */ - if (PyObject_SetAttrString(bimod, "open", wrapper) == -1) { - Py_DECREF(wrapper); - goto error; - } - Py_DECREF(wrapper); - - encoding = _Py_StandardStreamEncoding; - errors = _Py_StandardStreamErrors; - if (!encoding || !errors) { - if (!errors) { - /* When the LC_CTYPE locale is the POSIX locale ("C locale"), - stdin and stdout use the surrogateescape error handler by - default, instead of the strict error handler. */ - char *loc = setlocale(LC_CTYPE, NULL); - if (loc != NULL && strcmp(loc, "C") == 0) - errors = "surrogateescape"; - } - - pythonioencoding = Py_GETENV("PYTHONIOENCODING"); - if (pythonioencoding) { - char *err; - pythonioencoding = _PyMem_Strdup(pythonioencoding); - if (pythonioencoding == NULL) { - PyErr_NoMemory(); - goto error; - } - err = strchr(pythonioencoding, ':'); - if (err) { - *err = '\0'; - err++; - if (*err && !_Py_StandardStreamErrors) { - errors = err; - } - } - if (*pythonioencoding && !encoding) { - encoding = pythonioencoding; - } - } - } - - /* Set sys.stdin */ - fd = fileno(stdin); - /* Under some conditions stdin, stdout and stderr may not be connected - * and fileno() may point to an invalid file descriptor. For example - * GUI apps don't have valid standard streams by default. 
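
When a standard descriptor is absent (GUI applications, daemonised processes), the code above leaves the corresponding sys attribute set to None, so defensive code has to check for it, for example:

    import sys

    for name in ("stdin", "stdout", "stderr"):
        stream = getattr(sys, name)
        print(name, "->", "None" if stream is None else type(stream).__name__)
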
- */ - if (!is_valid_fd(fd)) { - std = Py_None; - Py_INCREF(std); - } - else { - std = create_stdio(iomod, fd, 0, "", encoding, errors); - if (std == NULL) - goto error; - } /* if (fd < 0) */ - PySys_SetObject("__stdin__", std); - _PySys_SetObjectId(&PyId_stdin, std); - Py_DECREF(std); - - /* Set sys.stdout */ - fd = fileno(stdout); - if (!is_valid_fd(fd)) { - std = Py_None; - Py_INCREF(std); - } - else { - std = create_stdio(iomod, fd, 1, "", encoding, errors); - if (std == NULL) - goto error; - } /* if (fd < 0) */ - PySys_SetObject("__stdout__", std); - _PySys_SetObjectId(&PyId_stdout, std); - Py_DECREF(std); - -#if 1 /* Disable this if you have trouble debugging bootstrap stuff */ - /* Set sys.stderr, replaces the preliminary stderr */ - fd = fileno(stderr); - if (!is_valid_fd(fd)) { - std = Py_None; - Py_INCREF(std); - } - else { - std = create_stdio(iomod, fd, 1, "", encoding, "backslashreplace"); - if (std == NULL) - goto error; - } /* if (fd < 0) */ - - /* Same as hack above, pre-import stderr's codec to avoid recursion - when import.c tries to write to stderr in verbose mode. */ - encoding_attr = PyObject_GetAttrString(std, "encoding"); - if (encoding_attr != NULL) { - const char * std_encoding; - std_encoding = _PyUnicode_AsString(encoding_attr); - if (std_encoding != NULL) { - PyObject *codec_info = _PyCodec_Lookup(std_encoding); - Py_XDECREF(codec_info); - } - Py_DECREF(encoding_attr); - } - PyErr_Clear(); /* Not a fatal error if codec isn't available */ - - if (PySys_SetObject("__stderr__", std) < 0) { - Py_DECREF(std); - goto error; - } - if (_PySys_SetObjectId(&PyId_stderr, std) < 0) { - Py_DECREF(std); - goto error; - } - Py_DECREF(std); -#endif - - if (0) { - error: - status = -1; - } - - /* We won't need them anymore. */ - if (_Py_StandardStreamEncoding) { - PyMem_RawFree(_Py_StandardStreamEncoding); - _Py_StandardStreamEncoding = NULL; - } - if (_Py_StandardStreamErrors) { - PyMem_RawFree(_Py_StandardStreamErrors); - _Py_StandardStreamErrors = NULL; - } - PyMem_Free(pythonioencoding); - Py_XDECREF(bimod); - Py_XDECREF(iomod); - return status; -} /* Parse input from a file and execute it */ @@ -1327,7 +110,7 @@ err = -1; for (;;) { ret = PyRun_InteractiveOneObject(fp, filename, flags); - PRINT_TOTAL_REFS(); + _PY_DEBUG_PRINT_TOTAL_REFS(); if (ret == E_EOF) { err = 0; break; @@ -2592,192 +1375,6 @@ } } -/* Print fatal error message and abort */ - -void -Py_FatalError(const char *msg) -{ - const int fd = fileno(stderr); - PyThreadState *tstate; - - fprintf(stderr, "Fatal Python error: %s\n", msg); - fflush(stderr); /* it helps in Windows debug build */ - if (PyErr_Occurred()) { - PyErr_PrintEx(0); - } - else { - tstate = _Py_atomic_load_relaxed(&_PyThreadState_Current); - if (tstate != NULL) { - fputc('\n', stderr); - fflush(stderr); - _Py_DumpTracebackThreads(fd, tstate->interp, tstate); - } - _PyFaulthandler_Fini(); - } - -#ifdef MS_WINDOWS - { - size_t len = strlen(msg); - WCHAR* buffer; - size_t i; - - /* Convert the message to wchar_t. This uses a simple one-to-one - conversion, assuming that the this error message actually uses ASCII - only. If this ceases to be true, we will have to convert. 
*/ - buffer = alloca( (len+1) * (sizeof *buffer)); - for( i=0; i<=len; ++i) - buffer[i] = msg[i]; - OutputDebugStringW(L"Fatal Python error: "); - OutputDebugStringW(buffer); - OutputDebugStringW(L"\n"); - } -#ifdef _DEBUG - DebugBreak(); -#endif -#endif /* MS_WINDOWS */ - abort(); -} - -/* Clean up and exit */ - -#ifdef WITH_THREAD -#include "pythread.h" -#endif - -static void (*pyexitfunc)(void) = NULL; -/* For the atexit module. */ -void _Py_PyAtExit(void (*func)(void)) -{ - pyexitfunc = func; -} - -static void -call_py_exitfuncs(void) -{ - if (pyexitfunc == NULL) - return; - - (*pyexitfunc)(); - PyErr_Clear(); -} - -/* Wait until threading._shutdown completes, provided - the threading module was imported in the first place. - The shutdown routine will wait until all non-daemon - "threading" threads have completed. */ -static void -wait_for_thread_shutdown(void) -{ -#ifdef WITH_THREAD - _Py_IDENTIFIER(_shutdown); - PyObject *result; - PyThreadState *tstate = PyThreadState_GET(); - PyObject *threading = PyMapping_GetItemString(tstate->interp->modules, - "threading"); - if (threading == NULL) { - /* threading not imported */ - PyErr_Clear(); - return; - } - result = _PyObject_CallMethodId(threading, &PyId__shutdown, ""); - if (result == NULL) { - PyErr_WriteUnraisable(threading); - } - else { - Py_DECREF(result); - } - Py_DECREF(threading); -#endif -} - -#define NEXITFUNCS 32 -static void (*exitfuncs[NEXITFUNCS])(void); -static int nexitfuncs = 0; - -int Py_AtExit(void (*func)(void)) -{ - if (nexitfuncs >= NEXITFUNCS) - return -1; - exitfuncs[nexitfuncs++] = func; - return 0; -} - -static void -call_ll_exitfuncs(void) -{ - while (nexitfuncs > 0) - (*exitfuncs[--nexitfuncs])(); - - fflush(stdout); - fflush(stderr); -} - -void -Py_Exit(int sts) -{ - Py_Finalize(); - - exit(sts); -} - -static void -initsigs(void) -{ -#ifdef SIGPIPE - PyOS_setsig(SIGPIPE, SIG_IGN); -#endif -#ifdef SIGXFZ - PyOS_setsig(SIGXFZ, SIG_IGN); -#endif -#ifdef SIGXFSZ - PyOS_setsig(SIGXFSZ, SIG_IGN); -#endif - PyOS_InitInterrupts(); /* May imply initsignal() */ - if (PyErr_Occurred()) { - Py_FatalError("Py_Initialize: can't import signal"); - } -} - - -/* Restore signals that the interpreter has called SIG_IGN on to SIG_DFL. - * - * All of the code in this function must only use async-signal-safe functions, - * listed at `man 7 signal` or - * http://www.opengroup.org/onlinepubs/009695399/functions/xsh_chap02_04.html. - */ -void -_Py_RestoreSignals(void) -{ -#ifdef SIGPIPE - PyOS_setsig(SIGPIPE, SIG_DFL); -#endif -#ifdef SIGXFZ - PyOS_setsig(SIGXFZ, SIG_DFL); -#endif -#ifdef SIGXFSZ - PyOS_setsig(SIGXFSZ, SIG_DFL); -#endif -} - - -/* - * The file descriptor fd is considered ``interactive'' if either - * a) isatty(fd) is TRUE, or - * b) the -i flag was given, and the filename associated with - * the descriptor is NULL or "" or "???". - */ -int -Py_FdIsInteractive(FILE *fp, const char *filename) -{ - if (isatty((int)fileno(fp))) - return 1; - if (!Py_InteractiveFlag) - return 0; - return (filename == NULL) || - (strcmp(filename, "") == 0) || - (strcmp(filename, "???") == 0); -} - #if defined(USE_STACKCHECK) #if defined(WIN32) && defined(_MSC_VER) @@ -2816,73 +1413,6 @@ #endif /* USE_STACKCHECK */ - -/* Wrappers around sigaction() or signal(). 
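
A Python-level paraphrase of Py_FdIsInteractive() above; the helper name is made up for illustration:

    import sys

    def fd_is_interactive(fp, filename):
        if fp.isatty():
            return True
        if not sys.flags.interactive:        # mirrors Py_InteractiveFlag (-i)
            return False
        return filename in (None, "", "???")

    print(fd_is_interactive(sys.stdin, None))
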
*/ - -PyOS_sighandler_t -PyOS_getsig(int sig) -{ -#ifdef HAVE_SIGACTION - struct sigaction context; - if (sigaction(sig, NULL, &context) == -1) - return SIG_ERR; - return context.sa_handler; -#else - PyOS_sighandler_t handler; -/* Special signal handling for the secure CRT in Visual Studio 2005 */ -#if defined(_MSC_VER) && _MSC_VER >= 1400 - switch (sig) { - /* Only these signals are valid */ - case SIGINT: - case SIGILL: - case SIGFPE: - case SIGSEGV: - case SIGTERM: - case SIGBREAK: - case SIGABRT: - break; - /* Don't call signal() with other values or it will assert */ - default: - return SIG_ERR; - } -#endif /* _MSC_VER && _MSC_VER >= 1400 */ - handler = signal(sig, SIG_IGN); - if (handler != SIG_ERR) - signal(sig, handler); - return handler; -#endif -} - -/* - * All of the code in this function must only use async-signal-safe functions, - * listed at `man 7 signal` or - * http://www.opengroup.org/onlinepubs/009695399/functions/xsh_chap02_04.html. - */ -PyOS_sighandler_t -PyOS_setsig(int sig, PyOS_sighandler_t handler) -{ -#ifdef HAVE_SIGACTION - /* Some code in Modules/signalmodule.c depends on sigaction() being - * used here if HAVE_SIGACTION is defined. Fix that if this code - * changes to invalidate that assumption. - */ - struct sigaction context, ocontext; - context.sa_handler = handler; - sigemptyset(&context.sa_mask); - context.sa_flags = 0; - if (sigaction(sig, &context, &ocontext) == -1) - return SIG_ERR; - return ocontext.sa_handler; -#else - PyOS_sighandler_t oldhandler; - oldhandler = signal(sig, handler); -#ifdef HAVE_SIGINTERRUPT - siginterrupt(sig, 1); -#endif - return oldhandler; -#endif -} - /* Deprecated C API functions still provided for binary compatiblity */ #undef PyParser_SimpleParseFile diff --git a/Python/sysmodule.c b/Python/sysmodule.c --- a/Python/sysmodule.c +++ b/Python/sysmodule.c @@ -1681,7 +1681,7 @@ } #endif - /* stdin/stdout/stderr are now set by pythonrun.c */ + /* stdin/stdout/stderr are set in pylifecycle.c */ SET_SYS_FROM_STRING_BORROW("__displayhook__", PyDict_GetItemString(sysdict, "displayhook")); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 14:20:43 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 13:20:43 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbywgdGVz?= =?utf-8?q?t=5Fevents=3A_Ignore_the_=22SSL_handshake_failed=22_log_in_debu?= =?utf-8?q?g_mode?= Message-ID: <20141120132040.130911.64441@psf.io> https://hg.python.org/cpython/rev/ab7b942dfaa8 changeset: 93517:ab7b942dfaa8 branch: 3.4 user: Victor Stinner date: Thu Nov 20 14:19:23 2014 +0100 summary: asyncio, test_events: Ignore the "SSL handshake failed" log in debug mode files: Lib/test/test_asyncio/test_events.py | 4 +++- 1 files changed, 3 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -634,7 +634,9 @@ # validation will fail with self.assertRaises(ssl.SSLError) as cm: conn_fut = create_connection(ssl=True) - self._basetest_create_ssl_connection(conn_fut, check_sockname) + # Ignore the "SSL handshake failed" log in debug mode + with test_utils.disable_logger(): + self._basetest_create_ssl_connection(conn_fut, check_sockname) self.assertEqual(cm.exception.reason, 'CERTIFICATE_VERIFY_FAILED') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 14:20:43 2014 From: python-checkins 
at python.org (victor.stinner) Date: Thu, 20 Nov 2014 13:20:43 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbzogRml4?= =?utf-8?q?_formatting_of_the_=22Future_exception_was_never_retrieved=22_i?= =?utf-8?q?n?= Message-ID: <20141120132040.43946.89261@psf.io> https://hg.python.org/cpython/rev/307cf392914e changeset: 93516:307cf392914e branch: 3.4 parent: 93512:fb06c8ccfd41 user: Victor Stinner date: Thu Nov 20 14:16:31 2014 +0100 summary: asyncio: Fix formatting of the "Future exception was never retrieved" in release mode files: Lib/asyncio/futures.py | 7 +- Lib/test/test_asyncio/test_events.py | 34 ++++--- Lib/test/test_asyncio/test_futures.py | 65 +++++++++----- 3 files changed, 64 insertions(+), 42 deletions(-) diff --git a/Lib/asyncio/futures.py b/Lib/asyncio/futures.py --- a/Lib/asyncio/futures.py +++ b/Lib/asyncio/futures.py @@ -104,10 +104,11 @@ def __del__(self): if self.tb: - msg = 'Future/Task exception was never retrieved' + msg = 'Future/Task exception was never retrieved\n' if self.source_traceback: - msg += '\nFuture/Task created at (most recent call last):\n' - msg += ''.join(traceback.format_list(self.source_traceback)) + src = ''.join(traceback.format_list(self.source_traceback)) + msg += 'Future/Task created at (most recent call last):\n' + msg += '%s\n' % src.rstrip() msg += ''.join(self.tb).rstrip() self.loop.call_exception_handler({'message': msg}) diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -606,27 +606,29 @@ self.assertGreater(pr.nbytes, 0) tr.close() - if ssl: - def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, - cafile=None, capath=None, cadata=None): - """ - A ssl.create_default_context() replacement that doesn't enable - cert validation. - """ - self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) - return test_utils.dummy_ssl_context() - def _test_create_ssl_connection(self, httpd, create_connection, check_sockname=True): conn_fut = create_connection(ssl=test_utils.dummy_ssl_context()) self._basetest_create_ssl_connection(conn_fut, check_sockname) - # With ssl=True, ssl.create_default_context() should be called - with mock.patch('ssl.create_default_context', - side_effect=self._dummy_ssl_create_context) as m: - conn_fut = create_connection(ssl=True) - self._basetest_create_ssl_connection(conn_fut, check_sockname) - self.assertEqual(m.call_count, 1) + # ssl.Purpose was introduced in Python 3.4 + if hasattr(ssl, 'Purpose'): + def _dummy_ssl_create_context(purpose=ssl.Purpose.SERVER_AUTH, *, + cafile=None, capath=None, + cadata=None): + """ + A ssl.create_default_context() replacement that doesn't enable + cert validation. 
+ """ + self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) + return test_utils.dummy_ssl_context() + + # With ssl=True, ssl.create_default_context() should be called + with mock.patch('ssl.create_default_context', + side_effect=_dummy_ssl_create_context) as m: + conn_fut = create_connection(ssl=True) + self._basetest_create_ssl_connection(conn_fut, check_sockname) + self.assertEqual(m.call_count, 1) # With the real ssl.create_default_context(), certificate # validation will fail diff --git a/Lib/test/test_asyncio/test_futures.py b/Lib/test/test_asyncio/test_futures.py --- a/Lib/test/test_asyncio/test_futures.py +++ b/Lib/test/test_asyncio/test_futures.py @@ -307,8 +307,8 @@ 'test_future_source_traceback')) @mock.patch('asyncio.base_events.logger') - def test_future_exception_never_retrieved(self, m_log): - self.loop.set_debug(True) + def check_future_exception_never_retrieved(self, debug, m_log): + self.loop.set_debug(debug) def memory_error(): try: @@ -318,40 +318,59 @@ exc = memory_error() future = asyncio.Future(loop=self.loop) - source_traceback = future._source_traceback + if debug: + source_traceback = future._source_traceback future.set_exception(exc) future = None test_utils.run_briefly(self.loop) support.gc_collect() if sys.version_info >= (3, 4): - frame = source_traceback[-1] - regex = (r'^Future exception was never retrieved\n' - r'future: \n' - r'source_traceback: Object created at \(most recent call last\):\n' - r' File' - r'.*\n' - r' File "{filename}", line {lineno}, in test_future_exception_never_retrieved\n' - r' future = asyncio\.Future\(loop=self\.loop\)$' - ).format(filename=re.escape(frame[0]), lineno=frame[1]) + if debug: + frame = source_traceback[-1] + regex = (r'^Future exception was never retrieved\n' + r'future: \n' + r'source_traceback: Object created at \(most recent call last\):\n' + r' File' + r'.*\n' + r' File "{filename}", line {lineno}, in check_future_exception_never_retrieved\n' + r' future = asyncio\.Future\(loop=self\.loop\)$' + ).format(filename=re.escape(frame[0]), lineno=frame[1]) + else: + regex = (r'^Future exception was never retrieved\n' + r'future: $' + ) exc_info = (type(exc), exc, exc.__traceback__) m_log.error.assert_called_once_with(mock.ANY, exc_info=exc_info) else: - frame = source_traceback[-1] - regex = (r'^Future/Task exception was never retrieved\n' - r'Future/Task created at \(most recent call last\):\n' - r' File' - r'.*\n' - r' File "{filename}", line {lineno}, in test_future_exception_never_retrieved\n' - r' future = asyncio\.Future\(loop=self\.loop\)\n' - r'Traceback \(most recent call last\):\n' - r'.*\n' - r'MemoryError$' - ).format(filename=re.escape(frame[0]), lineno=frame[1]) + if debug: + frame = source_traceback[-1] + regex = (r'^Future/Task exception was never retrieved\n' + r'Future/Task created at \(most recent call last\):\n' + r' File' + r'.*\n' + r' File "{filename}", line {lineno}, in check_future_exception_never_retrieved\n' + r' future = asyncio\.Future\(loop=self\.loop\)\n' + r'Traceback \(most recent call last\):\n' + r'.*\n' + r'MemoryError$' + ).format(filename=re.escape(frame[0]), lineno=frame[1]) + else: + regex = (r'^Future/Task exception was never retrieved\n' + r'Traceback \(most recent call last\):\n' + r'.*\n' + r'MemoryError$' + ) m_log.error.assert_called_once_with(mock.ANY, exc_info=False) message = m_log.error.call_args[0][0] self.assertRegex(message, re.compile(regex, re.DOTALL)) + def test_future_exception_never_retrieved(self): + self.check_future_exception_never_retrieved(False) + + def 
test_future_exception_never_retrieved_debug(self): + self.check_future_exception_never_retrieved(True) + def test_set_result_unless_cancelled(self): fut = asyncio.Future(loop=self.loop) fut.cancel() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 14:20:43 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 13:20:43 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogTWVyZ2Ugd2l0aCAzLjQgKGFzeW5jaW8p?= Message-ID: <20141120132040.7142.51283@psf.io> https://hg.python.org/cpython/rev/3d3928940da3 changeset: 93518:3d3928940da3 parent: 93515:b9775a92c1d0 parent: 93517:ab7b942dfaa8 user: Victor Stinner date: Thu Nov 20 14:19:49 2014 +0100 summary: Merge with 3.4 (asyncio) files: Lib/asyncio/futures.py | 7 +- Lib/test/test_asyncio/test_events.py | 38 ++++--- Lib/test/test_asyncio/test_futures.py | 65 +++++++++----- 3 files changed, 67 insertions(+), 43 deletions(-) diff --git a/Lib/asyncio/futures.py b/Lib/asyncio/futures.py --- a/Lib/asyncio/futures.py +++ b/Lib/asyncio/futures.py @@ -104,10 +104,11 @@ def __del__(self): if self.tb: - msg = 'Future/Task exception was never retrieved' + msg = 'Future/Task exception was never retrieved\n' if self.source_traceback: - msg += '\nFuture/Task created at (most recent call last):\n' - msg += ''.join(traceback.format_list(self.source_traceback)) + src = ''.join(traceback.format_list(self.source_traceback)) + msg += 'Future/Task created at (most recent call last):\n' + msg += '%s\n' % src.rstrip() msg += ''.join(self.tb).rstrip() self.loop.call_exception_handler({'message': msg}) diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -606,33 +606,37 @@ self.assertGreater(pr.nbytes, 0) tr.close() - if ssl: - def _dummy_ssl_create_context(self, purpose=ssl.Purpose.SERVER_AUTH, *, - cafile=None, capath=None, cadata=None): - """ - A ssl.create_default_context() replacement that doesn't enable - cert validation. - """ - self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) - return test_utils.dummy_ssl_context() - def _test_create_ssl_connection(self, httpd, create_connection, check_sockname=True): conn_fut = create_connection(ssl=test_utils.dummy_ssl_context()) self._basetest_create_ssl_connection(conn_fut, check_sockname) - # With ssl=True, ssl.create_default_context() should be called - with mock.patch('ssl.create_default_context', - side_effect=self._dummy_ssl_create_context) as m: - conn_fut = create_connection(ssl=True) - self._basetest_create_ssl_connection(conn_fut, check_sockname) - self.assertEqual(m.call_count, 1) + # ssl.Purpose was introduced in Python 3.4 + if hasattr(ssl, 'Purpose'): + def _dummy_ssl_create_context(purpose=ssl.Purpose.SERVER_AUTH, *, + cafile=None, capath=None, + cadata=None): + """ + A ssl.create_default_context() replacement that doesn't enable + cert validation. 
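
A message like the one formatted above is emitted when a future that holds an exception is garbage-collected without anyone calling result() or exception(). A minimal sketch, relying on CPython reference counting for prompt collection:

    import asyncio

    loop = asyncio.get_event_loop()
    fut = asyncio.Future(loop=loop)
    fut.set_exception(RuntimeError("boom"))
    del fut        # "... exception was never retrieved" goes to the logger
    loop.run_until_complete(asyncio.sleep(0))
    loop.close()
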
+ """ + self.assertEqual(purpose, ssl.Purpose.SERVER_AUTH) + return test_utils.dummy_ssl_context() + + # With ssl=True, ssl.create_default_context() should be called + with mock.patch('ssl.create_default_context', + side_effect=_dummy_ssl_create_context) as m: + conn_fut = create_connection(ssl=True) + self._basetest_create_ssl_connection(conn_fut, check_sockname) + self.assertEqual(m.call_count, 1) # With the real ssl.create_default_context(), certificate # validation will fail with self.assertRaises(ssl.SSLError) as cm: conn_fut = create_connection(ssl=True) - self._basetest_create_ssl_connection(conn_fut, check_sockname) + # Ignore the "SSL handshake failed" log in debug mode + with test_utils.disable_logger(): + self._basetest_create_ssl_connection(conn_fut, check_sockname) self.assertEqual(cm.exception.reason, 'CERTIFICATE_VERIFY_FAILED') diff --git a/Lib/test/test_asyncio/test_futures.py b/Lib/test/test_asyncio/test_futures.py --- a/Lib/test/test_asyncio/test_futures.py +++ b/Lib/test/test_asyncio/test_futures.py @@ -307,8 +307,8 @@ 'test_future_source_traceback')) @mock.patch('asyncio.base_events.logger') - def test_future_exception_never_retrieved(self, m_log): - self.loop.set_debug(True) + def check_future_exception_never_retrieved(self, debug, m_log): + self.loop.set_debug(debug) def memory_error(): try: @@ -318,40 +318,59 @@ exc = memory_error() future = asyncio.Future(loop=self.loop) - source_traceback = future._source_traceback + if debug: + source_traceback = future._source_traceback future.set_exception(exc) future = None test_utils.run_briefly(self.loop) support.gc_collect() if sys.version_info >= (3, 4): - frame = source_traceback[-1] - regex = (r'^Future exception was never retrieved\n' - r'future: \n' - r'source_traceback: Object created at \(most recent call last\):\n' - r' File' - r'.*\n' - r' File "{filename}", line {lineno}, in test_future_exception_never_retrieved\n' - r' future = asyncio\.Future\(loop=self\.loop\)$' - ).format(filename=re.escape(frame[0]), lineno=frame[1]) + if debug: + frame = source_traceback[-1] + regex = (r'^Future exception was never retrieved\n' + r'future: \n' + r'source_traceback: Object created at \(most recent call last\):\n' + r' File' + r'.*\n' + r' File "{filename}", line {lineno}, in check_future_exception_never_retrieved\n' + r' future = asyncio\.Future\(loop=self\.loop\)$' + ).format(filename=re.escape(frame[0]), lineno=frame[1]) + else: + regex = (r'^Future exception was never retrieved\n' + r'future: $' + ) exc_info = (type(exc), exc, exc.__traceback__) m_log.error.assert_called_once_with(mock.ANY, exc_info=exc_info) else: - frame = source_traceback[-1] - regex = (r'^Future/Task exception was never retrieved\n' - r'Future/Task created at \(most recent call last\):\n' - r' File' - r'.*\n' - r' File "{filename}", line {lineno}, in test_future_exception_never_retrieved\n' - r' future = asyncio\.Future\(loop=self\.loop\)\n' - r'Traceback \(most recent call last\):\n' - r'.*\n' - r'MemoryError$' - ).format(filename=re.escape(frame[0]), lineno=frame[1]) + if debug: + frame = source_traceback[-1] + regex = (r'^Future/Task exception was never retrieved\n' + r'Future/Task created at \(most recent call last\):\n' + r' File' + r'.*\n' + r' File "{filename}", line {lineno}, in check_future_exception_never_retrieved\n' + r' future = asyncio\.Future\(loop=self\.loop\)\n' + r'Traceback \(most recent call last\):\n' + r'.*\n' + r'MemoryError$' + ).format(filename=re.escape(frame[0]), lineno=frame[1]) + else: + regex = (r'^Future/Task exception 
was never retrieved\n' + r'Traceback \(most recent call last\):\n' + r'.*\n' + r'MemoryError$' + ) m_log.error.assert_called_once_with(mock.ANY, exc_info=False) message = m_log.error.call_args[0][0] self.assertRegex(message, re.compile(regex, re.DOTALL)) + def test_future_exception_never_retrieved(self): + self.check_future_exception_never_retrieved(False) + + def test_future_exception_never_retrieved_debug(self): + self.check_future_exception_never_retrieved(True) + def test_set_result_unless_cancelled(self): fut = asyncio.Future(loop=self.loop) fut.cancel() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 15:05:19 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 14:05:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_3=2E4_=28asyncio=29?= Message-ID: <20141120140507.130913.3418@psf.io> https://hg.python.org/cpython/rev/5dbe3c3d014b changeset: 93520:5dbe3c3d014b parent: 93518:3d3928940da3 parent: 93519:1b5d23a4a5fd user: Victor Stinner date: Thu Nov 20 15:04:31 2014 +0100 summary: Merge 3.4 (asyncio) files: Lib/asyncio/base_events.py | 11 ++- Lib/asyncio/unix_events.py | 5 +- Lib/test/test_asyncio/test_base_events.py | 26 ++++++---- Lib/test/test_asyncio/test_unix_events.py | 14 ++++- 4 files changed, 35 insertions(+), 21 deletions(-) diff --git a/Lib/asyncio/base_events.py b/Lib/asyncio/base_events.py --- a/Lib/asyncio/base_events.py +++ b/Lib/asyncio/base_events.py @@ -357,7 +357,8 @@ Absolute time corresponds to the event loop's time() method. """ - if coroutines.iscoroutinefunction(callback): + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): raise TypeError("coroutines cannot be used with call_at()") if self._debug: self._assert_is_current_event_loop() @@ -384,7 +385,8 @@ return handle def _call_soon(self, callback, args, check_loop): - if coroutines.iscoroutinefunction(callback): + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): raise TypeError("coroutines cannot be used with call_soon()") if self._debug and check_loop: self._assert_is_current_event_loop() @@ -421,8 +423,9 @@ return handle def run_in_executor(self, executor, callback, *args): - if coroutines.iscoroutinefunction(callback): - raise TypeError("Coroutines cannot be used with run_in_executor()") + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): + raise TypeError("coroutines cannot be used with run_in_executor()") if isinstance(callback, events.Handle): assert not args assert not isinstance(callback, events.TimerHandle) diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -67,8 +67,9 @@ Raise ValueError if the signal number is invalid or uncatchable. Raise RuntimeError if there is a problem setting up the handler. 
""" - if coroutines.iscoroutinefunction(callback): - raise TypeError("coroutines cannot be used with call_soon()") + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): + raise TypeError("coroutines cannot be used with add_signal_handler()") self._check_signal(sig) try: # set_wakeup_fd() raises ValueError if this is not the diff --git a/Lib/test/test_asyncio/test_base_events.py b/Lib/test/test_asyncio/test_base_events.py --- a/Lib/test/test_asyncio/test_base_events.py +++ b/Lib/test/test_asyncio/test_base_events.py @@ -1107,19 +1107,23 @@ def test_call_coroutine(self): @asyncio.coroutine - def coroutine_function(): + def simple_coroutine(): pass - with self.assertRaises(TypeError): - self.loop.call_soon(coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_soon_threadsafe(coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_later(60, coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_at(self.loop.time() + 60, coroutine_function) - with self.assertRaises(TypeError): - self.loop.run_in_executor(None, coroutine_function) + coro_func = simple_coroutine + coro_obj = coro_func() + self.addCleanup(coro_obj.close) + for func in (coro_func, coro_obj): + with self.assertRaises(TypeError): + self.loop.call_soon(func) + with self.assertRaises(TypeError): + self.loop.call_soon_threadsafe(func) + with self.assertRaises(TypeError): + self.loop.call_later(60, func) + with self.assertRaises(TypeError): + self.loop.call_at(self.loop.time() + 60, func) + with self.assertRaises(TypeError): + self.loop.run_in_executor(None, func) @mock.patch('asyncio.base_events.logger') def test_log_slow_callbacks(self, m_logger): diff --git a/Lib/test/test_asyncio/test_unix_events.py b/Lib/test/test_asyncio/test_unix_events.py --- a/Lib/test/test_asyncio/test_unix_events.py +++ b/Lib/test/test_asyncio/test_unix_events.py @@ -65,15 +65,21 @@ @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler_coroutine_error(self, m_signal): + m_signal.NSIG = signal.NSIG @asyncio.coroutine def simple_coroutine(): yield from [] - self.assertRaises( - TypeError, - self.loop.add_signal_handler, - signal.SIGINT, simple_coroutine) + # callback must not be a coroutine function + coro_func = simple_coroutine + coro_obj = coro_func() + self.addCleanup(coro_obj.close) + for func in (coro_func, coro_obj): + self.assertRaisesRegex( + TypeError, 'coroutines cannot be used with add_signal_handler', + self.loop.add_signal_handler, + signal.SIGINT, func) @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler(self, m_signal): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 15:05:19 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 14:05:19 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbzogQ29y?= =?utf-8?q?outine_objects_are_now_rejected_with_a_TypeError_by_the_followi?= =?utf-8?q?ng?= Message-ID: <20141120140507.68812.20648@psf.io> https://hg.python.org/cpython/rev/1b5d23a4a5fd changeset: 93519:1b5d23a4a5fd branch: 3.4 parent: 93517:ab7b942dfaa8 user: Victor Stinner date: Thu Nov 20 15:03:52 2014 +0100 summary: asyncio: Coroutine objects are now rejected with a TypeError by the following functions: * add_signal_handler() * call_at() * call_later() * call_soon() * call_soon_threadsafe() * run_in_executor() Fix also the error message of add_signal_handler() (fix the name of the function). 
files: Lib/asyncio/base_events.py | 11 ++- Lib/asyncio/unix_events.py | 5 +- Lib/test/test_asyncio/test_base_events.py | 26 ++++++---- Lib/test/test_asyncio/test_unix_events.py | 14 ++++- 4 files changed, 35 insertions(+), 21 deletions(-) diff --git a/Lib/asyncio/base_events.py b/Lib/asyncio/base_events.py --- a/Lib/asyncio/base_events.py +++ b/Lib/asyncio/base_events.py @@ -357,7 +357,8 @@ Absolute time corresponds to the event loop's time() method. """ - if coroutines.iscoroutinefunction(callback): + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): raise TypeError("coroutines cannot be used with call_at()") if self._debug: self._assert_is_current_event_loop() @@ -384,7 +385,8 @@ return handle def _call_soon(self, callback, args, check_loop): - if coroutines.iscoroutinefunction(callback): + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): raise TypeError("coroutines cannot be used with call_soon()") if self._debug and check_loop: self._assert_is_current_event_loop() @@ -421,8 +423,9 @@ return handle def run_in_executor(self, executor, callback, *args): - if coroutines.iscoroutinefunction(callback): - raise TypeError("Coroutines cannot be used with run_in_executor()") + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): + raise TypeError("coroutines cannot be used with run_in_executor()") if isinstance(callback, events.Handle): assert not args assert not isinstance(callback, events.TimerHandle) diff --git a/Lib/asyncio/unix_events.py b/Lib/asyncio/unix_events.py --- a/Lib/asyncio/unix_events.py +++ b/Lib/asyncio/unix_events.py @@ -67,8 +67,9 @@ Raise ValueError if the signal number is invalid or uncatchable. Raise RuntimeError if there is a problem setting up the handler. 
""" - if coroutines.iscoroutinefunction(callback): - raise TypeError("coroutines cannot be used with call_soon()") + if (coroutines.iscoroutine(callback) + or coroutines.iscoroutinefunction(callback)): + raise TypeError("coroutines cannot be used with add_signal_handler()") self._check_signal(sig) try: # set_wakeup_fd() raises ValueError if this is not the diff --git a/Lib/test/test_asyncio/test_base_events.py b/Lib/test/test_asyncio/test_base_events.py --- a/Lib/test/test_asyncio/test_base_events.py +++ b/Lib/test/test_asyncio/test_base_events.py @@ -1107,19 +1107,23 @@ def test_call_coroutine(self): @asyncio.coroutine - def coroutine_function(): + def simple_coroutine(): pass - with self.assertRaises(TypeError): - self.loop.call_soon(coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_soon_threadsafe(coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_later(60, coroutine_function) - with self.assertRaises(TypeError): - self.loop.call_at(self.loop.time() + 60, coroutine_function) - with self.assertRaises(TypeError): - self.loop.run_in_executor(None, coroutine_function) + coro_func = simple_coroutine + coro_obj = coro_func() + self.addCleanup(coro_obj.close) + for func in (coro_func, coro_obj): + with self.assertRaises(TypeError): + self.loop.call_soon(func) + with self.assertRaises(TypeError): + self.loop.call_soon_threadsafe(func) + with self.assertRaises(TypeError): + self.loop.call_later(60, func) + with self.assertRaises(TypeError): + self.loop.call_at(self.loop.time() + 60, func) + with self.assertRaises(TypeError): + self.loop.run_in_executor(None, func) @mock.patch('asyncio.base_events.logger') def test_log_slow_callbacks(self, m_logger): diff --git a/Lib/test/test_asyncio/test_unix_events.py b/Lib/test/test_asyncio/test_unix_events.py --- a/Lib/test/test_asyncio/test_unix_events.py +++ b/Lib/test/test_asyncio/test_unix_events.py @@ -65,15 +65,21 @@ @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler_coroutine_error(self, m_signal): + m_signal.NSIG = signal.NSIG @asyncio.coroutine def simple_coroutine(): yield from [] - self.assertRaises( - TypeError, - self.loop.add_signal_handler, - signal.SIGINT, simple_coroutine) + # callback must not be a coroutine function + coro_func = simple_coroutine + coro_obj = coro_func() + self.addCleanup(coro_obj.close) + for func in (coro_func, coro_obj): + self.assertRaisesRegex( + TypeError, 'coroutines cannot be used with add_signal_handler', + self.loop.add_signal_handler, + signal.SIGINT, func) @mock.patch('asyncio.unix_events.signal') def test_add_signal_handler(self, m_signal): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 15:38:47 2014 From: python-checkins at python.org (donald.stufft) Date: Thu, 20 Nov 2014 14:38:47 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyODI3?= =?utf-8?q?=3A_Backport_the_new_Distributing_and_Instaling_Docs_from_3=2E4?= Message-ID: <20141120143838.7146.46168@psf.io> https://hg.python.org/cpython/rev/8bc29f5ebeff changeset: 93521:8bc29f5ebeff branch: 2.7 parent: 93514:07f4b6ecd04a user: Donald Stufft date: Thu Nov 20 09:38:31 2014 -0500 summary: Issue #22827: Backport the new Distributing and Instaling Docs from 3.4 files: Doc/conf.py | 4 +- Doc/contents.rst | 12 +- Doc/distributing/index.rst | 170 +++++++++++++++++++ Doc/glossary.rst | 6 + Doc/installing/index.rst | 215 +++++++++++++++++++++++++ 5 files changed, 403 insertions(+), 4 deletions(-) diff --git a/Doc/conf.py 
b/Doc/conf.py --- a/Doc/conf.py +++ b/Doc/conf.py @@ -94,11 +94,11 @@ latex_documents = [ ('c-api/index', 'c-api.tex', 'The Python/C API', _stdauthor, 'manual'), - ('distutils/index', 'distutils.tex', + ('distributing/index', 'distributing.tex', 'Distributing Python Modules', _stdauthor, 'manual'), ('extending/index', 'extending.tex', 'Extending and Embedding Python', _stdauthor, 'manual'), - ('install/index', 'install.tex', + ('installing/index', 'installing.tex', 'Installing Python Modules', _stdauthor, 'manual'), ('library/index', 'library.tex', 'The Python Library Reference', _stdauthor, 'manual'), diff --git a/Doc/contents.rst b/Doc/contents.rst --- a/Doc/contents.rst +++ b/Doc/contents.rst @@ -11,8 +11,8 @@ library/index.rst extending/index.rst c-api/index.rst - distutils/index.rst - install/index.rst + distributing/index.rst + installing/index.rst howto/index.rst faq/index.rst glossary.rst @@ -21,3 +21,11 @@ bugs.rst copyright.rst license.rst + +.. to include legacy packaging docs in build + +.. toctree:: + :hidden: + + distutils/index.rst + install/index.rst diff --git a/Doc/distributing/index.rst b/Doc/distributing/index.rst new file mode 100644 --- /dev/null +++ b/Doc/distributing/index.rst @@ -0,0 +1,170 @@ +.. _distributing-index: + +############################### + Distributing Python Modules +############################### + +:Email: distutils-sig at python.org + + +As a popular open source development project, Python has an active +supporting community of contributors and users that also make their software +available for other Python developers to use under open source license terms. + +This allows Python users to share and collaborate effectively, benefiting +from the solutions others have already created to common (and sometimes +even rare!) problems, as well as potentially contributing their own +solutions to the common pool. + +This guide covers the distribution part of the process. For a guide to +installing other Python projects, refer to the +:ref:`installation guide `. + +.. note:: + + For corporate and other institutional users, be aware that many + organisations have their own policies around using and contributing to + open source software. Please take such policies into account when making + use of the distribution and installation tools provided with Python. + + +Key terms +========= + +* the `Python Packaging Index `__ is a public + repository of open source licensed packages made available for use by + other Python users +* the `Python Packaging Authority + `__ are the group of + developers and documentation authors responsible for the maintenance and + evolution of the standard packaging tools and the associated metadata and + file format standards. They maintain a variety of tools, documentation + and issue trackers on both `GitHub `__ and + `BitBucket `__. +* :mod:`distutils` is the original build and distribution system first added + to the Python standard library in 1998. While direct use of :mod:`distutils` + is being phased out, it still laid the foundation for the current packaging + and distribution infrastructure, and it not only remains part of the + standard library, but its name lives on in other ways (such as the name + of the mailing list used to coordinate Python packaging standards + development). +* `setuptools`_ is a (largely) drop-in replacement for :mod:`distutils` first + published in 2004. Its most notable addition over the unmodified + :mod:`distutils` tools was the ability to declare dependencies on other + packages. 
It is currently recommended as a more regularly updated + alternative to :mod:`distutils` that offers consistent support for more + recent packaging standards across a wide range of Python versions. +* `wheel`_ (in this context) is a project that adds the ``bdist_wheel`` + command to :mod:`distutils`/`setuptools`_. This produces a cross platform + binary packaging format (called "wheels" or "wheel files" and defined in + :pep:`427`) that allows Python libraries, even those including binary + extensions, to be installed on a system without needing to be built + locally. + +.. _setuptools: https://setuptools.pypa.io/en/latest/setuptools.html +.. _wheel: http://wheel.readthedocs.org + +Open source licensing and collaboration +======================================= + +In most parts of the world, software is automatically covered by copyright. +This means that other developers require explicit permission to copy, use, +modify and redistribute the software. + +Open source licensing is a way of explicitly granting such permission in a +relatively consistent way, allowing developers to share and collaborate +efficiently by making common solutions to various problems freely available. +This leaves many developers free to spend more time focusing on the problems +that are relatively unique to their specific situation. + +The distribution tools provided with Python are designed to make it +reasonably straightforward for developers to make their own contributions +back to that common pool of software if they choose to do so. + +The same distribution tools can also be used to distribute software within +an organisation, regardless of whether that software is published as open +source software or not. + + +Installing the tools +==================== + +The standard library does not include build tools that support modern +Python packaging standards, as the core development team has found that it +is important to have standard tools that work consistently, even on older +versions of Python. + +The currently recommended build and distribution tools can be installed +by invoking the ``pip`` module at the command line:: + + python -m pip install setuptools wheel twine + +.. note:: + + For POSIX users (including Mac OS X and Linux users), these instructions + assume the use of a :term:`virtual environment`. + + For Windows users, these instructions assume that the option to + adjust the system PATH environment variable was selected when installing + Python. + +The Python Packaging User Guide includes more details on the `currently +recommended tools`_. + +.. _currently recommended tools: https://packaging.python.org/en/latest/current.html#packaging-tool-recommendations + +Reading the guide +================= + +The Python Packaging User Guide covers the various key steps and elements +involved in creating a project: + +* `Project structure`_ +* `Building and packaging the project`_ +* `Uploading the project to the Python Packaging Index`_ + +.. _Project structure: \ + https://packaging.python.org/en/latest/distributing.html#creating-your-own-project +.. _Building and packaging the project: \ + https://packaging.python.org/en/latest/distributing.html#packaging-your-project +.. _Uploading the project to the Python Packaging Index: \ + https://packaging.python.org/en/latest/distributing.html#uploading-your-project-to-pypi + + +How do I...? +============ + +These are quick answers or links for some common tasks. + +... choose a name for my project? 
+--------------------------------- + +This isn't an easy topic, but here are a few tips: + +* check the Python Packaging Index to see if the name is already in use +* check popular hosting sites like GitHub, BitBucket, etc to see if there + is already a project with that name +* check what comes up in a web search for the name you're considering +* avoid particularly common words, especially ones with multiple meanings, + as they can make it difficult for users to find your software when + searching for it + + +... create and distribute binary extensions? +-------------------------------------------- + +This is actually quite a complex topic, with a variety of alternatives +available depending on exactly what you're aiming to achieve. See the +Python Packaging User Guide for more information and recommendations. + +.. seealso:: + + `Python Packaging User Guide: Binary Extensions + `__ + +.. other topics: + + Once the Development & Deployment part of PPUG is fleshed out, some of + those sections should be linked from new questions here (most notably, + we should have a question about avoiding depending on PyPI that links to + https://packaging.python.org/en/latest/deployment.html#pypi-mirrors-and-caches) diff --git a/Doc/glossary.rst b/Doc/glossary.rst --- a/Doc/glossary.rst +++ b/Doc/glossary.rst @@ -720,6 +720,12 @@ the dictionary view to become a full list use ``list(dictview)``. See :ref:`dict-views`. + virtual environment + A cooperatively isolated runtime environment that allows Python users + and applications to install and upgrade Python distribution packages + without interfering with the behaviour of other Python applications + running on the same system. + virtual machine A computer defined entirely in software. Python's virtual machine executes the :term:`bytecode` emitted by the bytecode compiler. diff --git a/Doc/installing/index.rst b/Doc/installing/index.rst new file mode 100644 --- /dev/null +++ b/Doc/installing/index.rst @@ -0,0 +1,215 @@ +.. highlightlang:: none + +.. _installing-index: + +***************************** + Installing Python Modules +***************************** + +:Email: distutils-sig at python.org + +As a popular open source development project, Python has an active +supporting community of contributors and users that also make their software +available for other Python developers to use under open source license terms. + +This allows Python users to share and collaborate effectively, benefiting +from the solutions others have already created to common (and sometimes +even rare!) problems, as well as potentially contributing their own +solutions to the common pool. + +This guide covers the installation part of the process. For a guide to +creating and sharing your own Python projects, refer to the +:ref:`distribution guide `. + +.. note:: + + For corporate and other institutional users, be aware that many + organisations have their own policies around using and contributing to + open source software. Please take such policies into account when making + use of the distribution and installation tools provided with Python. + + +Key terms +========= + +* ``pip`` is the preferred installer program. Starting with Python 2.7.9, it + is included by default with the Python binary installers. 
+* a virtual environment is a semi-isolated Python environment that allows + packages to be installed for use by a particular application, rather than + being installed system wide +* ``virtualenv`` is a third party tools for creating virtual environments, it + is defaults to installing ``pip`` into all created virtual environments. +* the `Python Packaging Index `__ is a public + repository of open source licensed packages made available for use by + other Python users +* the `Python Packaging Authority + `__ are the group of + developers and documentation authors responsible for the maintenance and + evolution of the standard packaging tools and the associated metadata and + file format standards. They maintain a variety of tools, documentation + and issue trackers on both `GitHub `__ and + `BitBucket `__. +* ``distutils`` is the original build and distribution system first added to + the Python standard library in 1998. While direct use of ``distutils`` is + being phased out, it still laid the foundation for the current packaging + and distribution infrastructure, and it not only remains part of the + standard library, but its name lives on in other ways (such as the name + of the mailing list used to coordinate Python packaging standards + development). + + +Basic usage +=========== + +The standard packaging tools are all designed to be used from the command +line. + +The following command will install the latest version of a module and its +dependencies from the Python Packaging Index:: + + python -m pip install SomePackage + +.. note:: + + For POSIX users (including Mac OS X and Linux users), the examples in + this guide assume the use of a :term:`virtual environment`. You may install + ``virtualenv`` to provide such environments using either pip + (``pip install virtualenv``) or through your system package manager + (commonly called ``virtualenv`` or ``python-virtualenv``). + + For Windows users, the examples in this guide assume that the option to + adjust the system PATH environment variable was selected when installing + Python. + +It's also possible to specify an exact or minimum version directly on the +command line:: + + python -m pip install SomePackage==1.0.4 # specific version + python -m pip install 'SomePackage>=1.0.4' # minimum version + +Normally, if a suitable module is already installed, attempting to install +it again will have no effect. Upgrading existing modules must be requested +explicitly:: + + python -m pip install --upgrade SomePackage + +More information and resources regarding ``pip`` and its capabilities can be +found in the `Python Packaging User Guide `__. + +.. seealso:: + + `Python Packaging User Guide: Installing Python Distribution Packages + `__ + + +How do I ...? +============= + +These are quick answers or links for some common tasks. + +... install ``pip`` in versions of Python prior to Python 2.7.9? +---------------------------------------------------------------- + +Python only started bundling ``pip`` with Python 2.7.9. For earlier versions, +``pip`` needs to be "bootstrapped" as described in the Python Packaging +User Guide. + +.. seealso:: + + `Python Packaging User Guide: Setup for Installing Distribution Packages + `__ + + +.. installing-per-user-installation: + +... install packages just for the current user? +----------------------------------------------- + +Passing the ``--user`` option to ``python -m pip install`` will install a +package just for the current user, rather than for all users of the system. + + +... 
install scientific Python packages? +--------------------------------------- + +A number of scientific Python packages have complex binary dependencies, and +aren't currently easy to install using ``pip`` directly. At this point in +time, it will often be easier for users to install these packages by +`other means +`__ +rather than attempting to install them with ``pip``. + +.. seealso:: + + `Python Packaging User Guide: Installing Scientific Packages + `__ + + +... work with multiple versions of Python installed in parallel? +---------------------------------------------------------------- + +On Linux, Mac OS X and other POSIX systems, use the versioned Python commands +in combination with the ``-m`` switch to run the appropriate copy of +``pip``:: + + python2 -m pip install SomePackage # default Python 2 + python2.7 -m pip install SomePackage # specifically Python 2.7 + python3 -m pip install SomePackage # default Python 3 + python3.4 -m pip install SomePackage # specifically Python 3.4 + +(appropriately versioned ``pip`` commands may also be available) + +On Windows, use the ``py`` Python launcher in combination with the ``-m`` +switch:: + + py -2 -m pip install SomePackage # default Python 2 + py -2.7 -m pip install SomePackage # specifically Python 2.7 + py -3 -m pip install SomePackage # default Python 3 + py -3.4 -m pip install SomePackage # specifically Python 3.4 + +.. other questions: + + Once the Development & Deployment part of PPUG is fleshed out, some of + those sections should be linked from new questions here (most notably, + we should have a question about avoiding depending on PyPI that links to + https://packaging.python.org/en/latest/deployment.html#pypi-mirrors-and-caches) + + +Common installation issues +========================== + +Installing into the system Python on Linux +------------------------------------------ + +On Linux systems, a Python installation will typically be included as part +of the distribution. Installing into this Python installation requires +root access to the system, and may interfere with the operation of the +system package manager and other components of the system if a component +is unexpectedly upgraded using ``pip``. + +On such systems, it is often better to use a virtual environment or a +per-user installation when installing packages with ``pip``. + + +Installing binary extensions +---------------------------- + +Python has typically relied heavily on source based distribution, with end +users being expected to compile extension modules from source as part of +the installation process. + +With the introduction of support for the binary ``wheel`` format, and the +ability to publish wheels for at least Windows and Mac OS X through the +Python Packaging Index, this problem is expected to diminish over time, +as users are more regularly able to install pre-built extensions rather +than needing to build them themselves. + +Some of the solutions for installing `scientific software +`__ +that is not yet available as pre-built ``wheel`` files may also help with +obtaining other binary extensions without needing to build them locally. + +.. 
seealso:: + + `Python Packaging User Guide: Binary Extensions + `__ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 20 19:56:12 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 20 Nov 2014 18:56:12 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_a_clarifying_paragraph_to?= =?utf-8?q?_PEP_0479=2C_and_another_post-history_date=2E?= Message-ID: <20141120185553.43952.76776@psf.io> https://hg.python.org/peps/rev/b218685f6a4d changeset: 5603:b218685f6a4d user: Guido van Rossum date: Thu Nov 20 10:55:48 2014 -0800 summary: Add a clarifying paragraph to PEP 0479, and another post-history date. files: pep-0479.txt | 16 +++++++++++++++- 1 files changed, 15 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -8,7 +8,7 @@ Content-Type: text/x-rst Created: 15-Nov-2014 Python-Version: 3.5 -Post-History: 15-Nov-2014 +Post-History: 15-Nov-2014, 19-Nov-2014 Abstract @@ -179,6 +179,20 @@ in favor of changing list comprehensions to match generator expressions (!), the other was in favor of this PEP's main proposal. +The existing model has been compared to the perfectly-acceptable +issues inherent to every other case where an exception has special +meaning. For instance, an unexpected ``KeyError`` inside a +``__getitem__`` method will be interpreted as failure, rather than +permitted to bubble up. However, there is a difference. Dunder +methods use ``return`` to indicate normality, and ``raise`` to signal +abnormality; generators ``yield`` to indicate data, and ``return`` to +signal the abnormal state. This makes explicitly raising +``StopIteration`` entirely redundant, and potentially surprising. If +other dunder methods had dedicated keywords to distinguish between +their return paths, they too could turn unexpected exceptions into +``RuntimeError``; the fact that they cannot should not preclude +generators from doing so. + References ========== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Thu Nov 20 20:08:22 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 20 Nov 2014 19:08:22 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_479=3A_Use_a_shorter_=5F?= =?utf-8?q?=5Ffuture=5F=5F_name_=28generator=5Freturn=29=2E?= Message-ID: <20141120190809.119870.15675@psf.io> https://hg.python.org/peps/rev/944968d549a8 changeset: 5604:944968d549a8 user: Guido van Rossum date: Thu Nov 20 11:01:20 2014 -0800 summary: PEP 479: Use a shorter __future__ name (generator_return). files: pep-0479.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -90,7 +90,7 @@ mechanism to introduce this in Python 3.5, finally making it standard in Python 3.6 or 3.7. 
The proposed syntax is:: - from __future__ import replace_stopiteration_in_generators + from __future__ import generator_return Any generator function constructed under the influence of this directive will have the REPLACE_STOPITERATION flag set on its code -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Thu Nov 20 20:15:10 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 20 Nov 2014 19:15:10 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Remove_=22implicitly-raised?= =?utf-8?q?=22_from_abstract=2C_it_is_just_confusing=2E?= Message-ID: <20141120191504.43938.70565@psf.io> https://hg.python.org/peps/rev/3cafc73b266a changeset: 5605:3cafc73b266a user: Guido van Rossum date: Thu Nov 20 11:14:58 2014 -0800 summary: Remove "implicitly-raised" from abstract, it is just confusing. files: pep-0479.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -19,7 +19,7 @@ comprehensions and generator expressions, reducing surprises such as the one that started this discussion [1]_. This is also the main backwards incompatibility of the proposal -- any generator that -depends on an implicitly-raised ``StopIteration`` to terminate it will +depends on raising ``StopIteration`` to terminate it will have to be rewritten to either catch that exception or use a for-loop. -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Thu Nov 20 20:31:27 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 20 Nov 2014 19:31:27 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_479=3A_Add_link_to_issue_?= =?utf-8?q?22906=2E?= Message-ID: <20141120193051.68814.51436@psf.io> https://hg.python.org/peps/rev/dd19add74b21 changeset: 5606:dd19add74b21 user: Guido van Rossum date: Thu Nov 20 11:30:39 2014 -0800 summary: PEP 479: Add link to issue 22906. files: pep-0479.txt | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -224,6 +224,9 @@ .. [9] Thread on comp.lang.python started by Steven D'Aprano (https://mail.python.org/pipermail/python-list/2014-November/680757.html) +.. [10] Tracker issue with Proof-of-Concept patch + (http://bugs.python.org/issue22906) + Copyright ========= -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Fri Nov 21 00:25:07 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 23:25:07 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbzogQmFz?= =?utf-8?q?eSelectorEventLoop=2Eclose=28=29_now_closes_the_self-pipe_befor?= =?utf-8?q?e_calling?= Message-ID: <20141120232504.130919.88374@psf.io> https://hg.python.org/cpython/rev/a08c3703f844 changeset: 93522:a08c3703f844 branch: 3.4 parent: 93519:1b5d23a4a5fd user: Victor Stinner date: Fri Nov 21 00:23:27 2014 +0100 summary: asyncio: BaseSelectorEventLoop.close() now closes the self-pipe before calling the parent close() method. If the event loop is already closed, the self-pipe is not unregistered from the selector. 
files: Lib/asyncio/selector_events.py | 4 +++- 1 files changed, 3 insertions(+), 1 deletions(-) diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -68,10 +68,12 @@ address, waiter, extra) def close(self): + if self._running: + raise RuntimeError("Cannot close a running event loop") if self.is_closed(): return + self._close_self_pipe() super().close() - self._close_self_pipe() if self._selector is not None: self._selector.close() self._selector = None -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 00:25:07 2014 From: python-checkins at python.org (victor.stinner) Date: Thu, 20 Nov 2014 23:25:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_asyncio=3A_BaseSelectorEventLoop=2Eclo?= =?utf-8?q?se=28=29_now_closes_the_self-pipe?= Message-ID: <20141120232504.68820.97036@psf.io> https://hg.python.org/cpython/rev/7ce62e80d3cd changeset: 93523:7ce62e80d3cd parent: 93520:5dbe3c3d014b parent: 93522:a08c3703f844 user: Victor Stinner date: Fri Nov 21 00:23:59 2014 +0100 summary: (Merge 3.4) asyncio: BaseSelectorEventLoop.close() now closes the self-pipe before calling the parent close() method. If the event loop is already closed, the self-pipe is not unregistered from the selector. files: Lib/asyncio/selector_events.py | 4 +++- 1 files changed, 3 insertions(+), 1 deletions(-) diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -68,10 +68,12 @@ address, waiter, extra) def close(self): + if self._running: + raise RuntimeError("Cannot close a running event loop") if self.is_closed(): return + self._close_self_pipe() super().close() - self._close_self_pipe() if self._selector is not None: self._selector.close() self._selector = None -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 00:44:10 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 20 Nov 2014 23:44:10 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_479=3A_switch_to_=22from_?= =?utf-8?q?=5F=5Ffuture=5F=5F_import_generator=5Fstop=22=2E?= Message-ID: <20141120234408.7148.54117@psf.io> https://hg.python.org/peps/rev/5eb88d52c5a3 changeset: 5607:5eb88d52c5a3 user: Guido van Rossum date: Thu Nov 20 15:43:56 2014 -0800 summary: PEP 479: switch to "from __future__ import generator_stop". files: pep-0479.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -90,7 +90,7 @@ mechanism to introduce this in Python 3.5, finally making it standard in Python 3.6 or 3.7. 
The proposed syntax is:: - from __future__ import generator_return + from __future__ import generator_stop Any generator function constructed under the influence of this directive will have the REPLACE_STOPITERATION flag set on its code -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Fri Nov 21 01:24:00 2014 From: python-checkins at python.org (antoine.pitrou) Date: Fri, 21 Nov 2014 00:24:00 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322796=3A_HTTP_coo?= =?utf-8?q?kie_parsing_is_now_stricter=2C_in_order_to_protect_against?= Message-ID: <20141121002353.7136.51457@psf.io> https://hg.python.org/cpython/rev/a065ab1c67a8 changeset: 93524:a065ab1c67a8 user: Antoine Pitrou date: Fri Nov 21 01:20:57 2014 +0100 summary: Issue #22796: HTTP cookie parsing is now stricter, in order to protect against potential injection attacks. files: Lib/http/cookies.py | 56 ++++++++++++++++------ Lib/test/test_http_cookies.py | 12 +--- Misc/NEWS | 3 + 3 files changed, 48 insertions(+), 23 deletions(-) diff --git a/Lib/http/cookies.py b/Lib/http/cookies.py --- a/Lib/http/cookies.py +++ b/Lib/http/cookies.py @@ -533,10 +533,17 @@ return def __parse_string(self, str, patt=_CookiePattern): - i = 0 # Our starting point - n = len(str) # Length of string - M = None # current morsel + i = 0 # Our starting point + n = len(str) # Length of string + parsed_items = [] # Parsed (type, key, value) triples + morsel_seen = False # A key=value pair was previously encountered + TYPE_ATTRIBUTE = 1 + TYPE_KEYVALUE = 2 + + # We first parse the whole cookie string and reject it if it's + # syntactically invalid (this helps avoid some classes of injection + # attacks). while 0 <= i < n: # Start looking for a cookie match = patt.match(str, i) @@ -547,22 +554,41 @@ key, value = match.group("key"), match.group("val") i = match.end(0) - # Parse the key, value in case it's metainfo if key[0] == "$": - # We ignore attributes which pertain to the cookie - # mechanism as a whole. See RFC 2109. - # (Does anyone care?) - if M: - M[key[1:]] = value + if not morsel_seen: + # We ignore attributes which pertain to the cookie + # mechanism as a whole, such as "$Version". + # See RFC 2965. (Does anyone care?) + continue + parsed_items.append((TYPE_ATTRIBUTE, key[1:], value)) elif key.lower() in Morsel._reserved: - if M: - if value is None: - if key.lower() in Morsel._flags: - M[key] = True + if not morsel_seen: + # Invalid cookie string + return + if value is None: + if key.lower() in Morsel._flags: + parsed_items.append((TYPE_ATTRIBUTE, key, True)) else: - M[key] = _unquote(value) + # Invalid cookie string + return + else: + parsed_items.append((TYPE_ATTRIBUTE, key, _unquote(value))) elif value is not None: - rval, cval = self.value_decode(value) + parsed_items.append((TYPE_KEYVALUE, key, self.value_decode(value))) + morsel_seen = True + else: + # Invalid cookie string + return + + # The cookie string is valid, apply it. + M = None # current morsel + for tp, key, value in parsed_items: + if tp == TYPE_ATTRIBUTE: + assert M is not None + M[key] = value + else: + assert tp == TYPE_KEYVALUE + rval, cval = value self.__set(key, rval, cval) M = self[key] diff --git a/Lib/test/test_http_cookies.py b/Lib/test/test_http_cookies.py --- a/Lib/test/test_http_cookies.py +++ b/Lib/test/test_http_cookies.py @@ -141,13 +141,6 @@ self.assertEqual(C['eggs']['httponly'], 'foo') self.assertEqual(C['eggs']['secure'], 'bar') - def test_bad_attrs(self): - # issue 16611: make sure we don't break backward compatibility. 
- C = cookies.SimpleCookie() - C.load('cookie=with; invalid; version; second=cookie;') - self.assertEqual(C.output(), - 'Set-Cookie: cookie=with\r\nSet-Cookie: second=cookie') - def test_extra_spaces(self): C = cookies.SimpleCookie() C.load('eggs = scrambled ; secure ; path = bar ; foo=foo ') @@ -182,7 +175,10 @@ def test_invalid_cookies(self): # Accepting these could be a security issue C = cookies.SimpleCookie() - for s in (']foo=x', '[foo=x', 'blah]foo=x', 'blah[foo=x'): + for s in (']foo=x', '[foo=x', 'blah]foo=x', 'blah[foo=x', + 'Set-Cookie: foo=bar', 'Set-Cookie: foo', + 'foo=bar; baz', 'baz; foo=bar', + 'secure;foo=bar', 'Version=1;foo=bar'): C.load(s) self.assertEqual(dict(C), {}) self.assertEqual(C.output(), '') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -188,6 +188,9 @@ Library ------- +- Issue #22796: HTTP cookie parsing is now stricter, in order to protect + against potential injection attacks. + - Issue #22370: Windows detection in pathlib is now more robust. - Issue #22841: Reject coroutines in asyncio add_signal_handler(). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 01:46:49 2014 From: python-checkins at python.org (steve.dower) Date: Fri, 21 Nov 2014 00:46:49 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322869=3A_Add_pyli?= =?utf-8?q?fecycle=2Ec/=2Eh_files_to_pythoncore_project=2E?= Message-ID: <20141121004642.43958.4038@psf.io> https://hg.python.org/cpython/rev/31fd106bb68a changeset: 93525:31fd106bb68a user: Steve Dower date: Thu Nov 20 16:45:36 2014 -0800 summary: Issue #22869: Add pylifecycle.c/.h files to pythoncore project. files: PCbuild/pythoncore.vcxproj | 2 ++ PCbuild/pythoncore.vcxproj.filters | 6 ++++++ 2 files changed, 8 insertions(+), 0 deletions(-) diff --git a/PCbuild/pythoncore.vcxproj b/PCbuild/pythoncore.vcxproj --- a/PCbuild/pythoncore.vcxproj +++ b/PCbuild/pythoncore.vcxproj @@ -502,6 +502,7 @@ + @@ -734,6 +735,7 @@ + diff --git a/PCbuild/pythoncore.vcxproj.filters b/PCbuild/pythoncore.vcxproj.filters --- a/PCbuild/pythoncore.vcxproj.filters +++ b/PCbuild/pythoncore.vcxproj.filters @@ -216,6 +216,9 @@ Include + + Include + Include @@ -890,6 +893,9 @@ Python + + Python + Python -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 02:05:24 2014 From: python-checkins at python.org (antoine.pitrou) Date: Fri, 21 Nov 2014 01:05:24 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Add_regression?= =?utf-8?q?_issue_number_to_Misc/NEWS_entry=2E?= Message-ID: <20141121010514.119880.40076@psf.io> https://hg.python.org/cpython/rev/c9b4dc1ab7ae changeset: 93527:c9b4dc1ab7ae branch: 2.7 user: Antoine Pitrou date: Fri Nov 21 02:05:06 2014 +0100 summary: Add regression issue number to Misc/NEWS entry. files: Misc/NEWS | 8 ++++---- 1 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,10 +10,10 @@ Core and Builtins ----------------- -- Backout issue #1856 patch (avoid crashes and lockups when daemon threads - run while the interpreter is shutting down; instead, these threads are - now killed when they try to take the GIL), as it seems to break some - existing code. +- Issue #21963: backout issue #1856 patch (avoid crashes and lockups when + daemon threads run while the interpreter is shutting down; instead, these + threads are now killed when they try to take the GIL), as it seems to + break some existing code. 
- Issue #22604: Fix assertion error in debug mode when dividing a complex number by (nan+0j). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 02:05:24 2014 From: python-checkins at python.org (antoine.pitrou) Date: Fri, 21 Nov 2014 01:05:24 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIxOTYz?= =?utf-8?q?=3A_backout_issue_=231856_patch_=28avoid_crashes_and_lockups_wh?= =?utf-8?q?en?= Message-ID: <20141121010514.68812.96958@psf.io> https://hg.python.org/cpython/rev/4ceca79d1c63 changeset: 93526:4ceca79d1c63 branch: 2.7 parent: 93521:8bc29f5ebeff user: Antoine Pitrou date: Fri Nov 21 02:04:21 2014 +0100 summary: Issue #21963: backout issue #1856 patch (avoid crashes and lockups when daemon threads run while the interpreter is shutting down; instead, these threads are now killed when they try to take the GIL), as it seems to break some existing code. files: Include/pythonrun.h | 2 - Lib/test/test_threading.py | 43 -------------------------- Misc/NEWS | 9 +++-- Python/ceval.c | 12 ------- Python/pythonrun.c | 9 +---- Python/thread_pthread.h | 4 +- 6 files changed, 8 insertions(+), 71 deletions(-) diff --git a/Include/pythonrun.h b/Include/pythonrun.h --- a/Include/pythonrun.h +++ b/Include/pythonrun.h @@ -147,8 +147,6 @@ PyAPI_FUNC(void) PyByteArray_Fini(void); PyAPI_FUNC(void) _PyRandom_Fini(void); -PyAPI_DATA(PyThreadState *) _Py_Finalizing; - /* Stuff with no proper home (yet) */ PyAPI_FUNC(char *) PyOS_Readline(FILE *, FILE *, char *); PyAPI_DATA(int) (*PyOS_InputHook)(void); diff --git a/Lib/test/test_threading.py b/Lib/test/test_threading.py --- a/Lib/test/test_threading.py +++ b/Lib/test/test_threading.py @@ -700,49 +700,6 @@ output = "end of worker thread\nend of main thread\n" self.assertScriptHasOutput(script, output) - @unittest.skipIf(sys.platform in platforms_to_skip, "due to known OS bug") - def test_6_daemon_threads(self): - # Check that a daemon thread cannot crash the interpreter on shutdown - # by manipulating internal structures that are being disposed of in - # the main thread. - script = """if True: - import os - import random - import sys - import time - import threading - - thread_has_run = set() - - def random_io(): - '''Loop for a while sleeping random tiny amounts and doing some I/O.''' - while True: - in_f = open(os.__file__, 'rb') - stuff = in_f.read(200) - null_f = open(os.devnull, 'wb') - null_f.write(stuff) - time.sleep(random.random() / 1995) - null_f.close() - in_f.close() - thread_has_run.add(threading.current_thread()) - - def main(): - count = 0 - for _ in range(40): - new_thread = threading.Thread(target=random_io) - new_thread.daemon = True - new_thread.start() - count += 1 - while len(thread_has_run) < count: - time.sleep(0.001) - # Trigger process shutdown - sys.exit(0) - - main() - """ - rc, out, err = assert_python_ok('-c', script) - self.assertFalse(err) - @unittest.skipUnless(hasattr(os, 'fork'), "needs os.fork()") @unittest.skipIf(sys.platform in platforms_to_skip, "due to known OS bug") def test_reinit_tls_after_fork(self): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,6 +10,11 @@ Core and Builtins ----------------- +- Backout issue #1856 patch (avoid crashes and lockups when daemon threads + run while the interpreter is shutting down; instead, these threads are + now killed when they try to take the GIL), as it seems to break some + existing code. + - Issue #22604: Fix assertion error in debug mode when dividing a complex number by (nan+0j). 
@@ -360,10 +365,6 @@ - Issue #21831: Avoid integer overflow when large sizes and offsets are given to the buffer type. CVE-2014-7185. -- Issue #1856: Avoid crashes and lockups when daemon threads run while the - interpreter is shutting down; instead, these threads are now killed when they - try to take the GIL. - - Issue #19656: Running Python with the -3 option now also warns about non-ascii bytes literals. diff --git a/Python/ceval.c b/Python/ceval.c --- a/Python/ceval.c +++ b/Python/ceval.c @@ -355,12 +355,6 @@ if (interpreter_lock) { int err = errno; PyThread_acquire_lock(interpreter_lock, 1); - /* _Py_Finalizing is protected by the GIL */ - if (_Py_Finalizing && tstate != _Py_Finalizing) { - PyThread_release_lock(interpreter_lock); - PyThread_exit_thread(); - assert(0); /* unreachable */ - } errno = err; } #endif @@ -1025,12 +1019,6 @@ PyThread_acquire_lock(interpreter_lock, 1); - /* Check if we should make a quick exit. */ - if (_Py_Finalizing && _Py_Finalizing != tstate) { - PyThread_release_lock(interpreter_lock); - PyThread_exit_thread(); - } - if (PyThreadState_Swap(tstate) != NULL) Py_FatalError("ceval: orphan tstate"); diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -91,8 +91,6 @@ int Py_NoUserSiteDirectory = 0; /* for -s and site.py */ int Py_HashRandomizationFlag = 0; /* for -R and PYTHONHASHSEED */ -PyThreadState *_Py_Finalizing = NULL; - /* Hack to force loading of object files */ int (*_PyOS_mystrnicmp_hack)(const char *, const char *, Py_ssize_t) = \ @@ -165,7 +163,6 @@ if (initialized) return; initialized = 1; - _Py_Finalizing = NULL; if ((p = Py_GETENV("PYTHONDEBUG")) && *p != '\0') Py_DebugFlag = add_flag(Py_DebugFlag, p); @@ -425,16 +422,12 @@ * the threads created via Threading. */ call_sys_exitfunc(); + initialized = 0; /* Get current thread state and interpreter pointer */ tstate = PyThreadState_GET(); interp = tstate->interp; - /* Remaining threads (e.g. daemon threads) will automatically exit - after taking the GIL (in PyEval_RestoreThread()). */ - _Py_Finalizing = tstate; - initialized = 0; - /* Disable signal handling */ PyOS_FiniInterrupts(); diff --git a/Python/thread_pthread.h b/Python/thread_pthread.h --- a/Python/thread_pthread.h +++ b/Python/thread_pthread.h @@ -242,9 +242,9 @@ PyThread_exit_thread(void) { dprintf(("PyThread_exit_thread called\n")); - if (!initialized) + if (!initialized) { exit(0); - pthread_exit(0); + } } #ifdef USE_SEMAPHORES -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 06:14:23 2014 From: python-checkins at python.org (guido.van.rossum) Date: Fri, 21 Nov 2014 05:14:23 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_479=3A_Fix_formatting_of_?= =?utf-8?q?examples=2E?= Message-ID: <20141121051422.130917.96819@psf.io> https://hg.python.org/peps/rev/73625fa16b36 changeset: 5609:73625fa16b36 user: Guido van Rossum date: Thu Nov 20 21:14:17 2014 -0800 summary: PEP 479: Fix formatting of examples. files: pep-0479.txt | 17 +++++++++++++++++ 1 files changed, 17 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -106,25 +106,33 @@ existing Python versions, and will not be affected by __future__. 
Lib/ipaddress.py:: + if other == self: raise StopIteration + Becomes:: + if other == self: return In some cases, this can be combined with ``yield from`` to simplify the code, such as Lib/difflib.py:: + if context is None: while True: yield next(line_pair_iterator) + Becomes:: + if context is None: yield from line_pair_iterator return + (The ``return`` is necessary for a strictly-equivalent translation, though in this particular file, there is no further code, and the ``return`` can be elided.) For compatibility with pre-3.3 versions of Python, this could be written with an explicit ``for`` loop:: + if context is None: for line in line_pair_iterator: yield line @@ -132,6 +140,7 @@ More complicated iteration patterns will need explicit try/catch constructs. For example, a parser construct like this:: + def unwrap(f): while True: data = next(f) @@ -140,7 +149,9 @@ if line == "- end -": break data += line yield data + would need to be rewritten as:: + def parser(f): while True: try: @@ -152,7 +163,9 @@ yield data except StopIteration: return + or possibly:: + def parser(f): for data in f: while True: @@ -186,9 +199,11 @@ raise ``AttributeError``), ``__getitem__`` (can raise ``KeyError``), and so on. A helper function for an iterator can be written to follow the same protocol; for example:: + def helper(x, y): if x > y: return 1 / (x - y) raise StopIteration + def __next__(self): if self.a: return helper(self.b, self.c) return helper(self.d, self.e) @@ -201,8 +216,10 @@ Each time it is (re)started, it may either yield a value, or return (including "falling off the end"). A helper function for a generator can also be written, but it must also follow generator protocol:: + def helper(x, y): if x > y: yield 1 / (x - y) + def gen(self): if self.a: return (yield from helper(self.b, self.c)) return (yield from helper(self.d, self.e)) -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Fri Nov 21 06:14:23 2014 From: python-checkins at python.org (guido.van.rossum) Date: Fri, 21 Nov 2014 05:14:23 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_New_examples=2C_explanations_?= =?utf-8?q?and_a_few_edits=2C_all_by_Chris=2E?= Message-ID: <20141121051422.43944.79292@psf.io> https://hg.python.org/peps/rev/43d99a738fa1 changeset: 5608:43d99a738fa1 user: Guido van Rossum date: Thu Nov 20 21:07:18 2014 -0800 summary: New examples, explanations and a few edits, all by Chris. files: pep-0479.txt | 127 +++++++++++++++++++++++++++++++++++++- 1 files changed, 122 insertions(+), 5 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -98,6 +98,120 @@ proposal. Once the feature becomes standard, the flag may be dropped; code should not inspect generators for it. +Examples +-------- + +Generators which explicitly raise StopIteration can generally be +changed to simply return instead. This will be compatible with all +existing Python versions, and will not be affected by __future__. + +Lib/ipaddress.py:: + if other == self: + raise StopIteration +Becomes:: + if other == self: + return + +In some cases, this can be combined with ``yield from`` to simplify +the code, such as Lib/difflib.py:: + if context is None: + while True: + yield next(line_pair_iterator) +Becomes:: + if context is None: + yield from line_pair_iterator + return +(The ``return`` is necessary for a strictly-equivalent translation, +though in this particular file, there is no further code, and the +``return`` can be elided.) 
For compatibility with pre-3.3 versions +of Python, this could be written with an explicit ``for`` loop:: + if context is None: + for line in line_pair_iterator: + yield line + return + +More complicated iteration patterns will need explicit try/catch +constructs. For example, a parser construct like this:: + def unwrap(f): + while True: + data = next(f) + while True: + line = next(f) + if line == "- end -": break + data += line + yield data +would need to be rewritten as:: + def parser(f): + while True: + try: + data = next(f) + while True: + line = next(f) + if line == "- end -": break + data += line + yield data + except StopIteration: + return +or possibly:: + def parser(f): + for data in f: + while True: + line = next(f) + if line == "- end -": break + data += line + yield data + +The latter form obscures the iteration by purporting to iterate over +the file with a ``for`` loop, but then also fetches more data from +the same iterator during the loop body. It does, however, clearly +differentiate between a "normal" termination (``StopIteration`` +instead of the initial line) and an "abnormal" termination (failing +to find the end marker in the inner loop, which will now raise +``RuntimeError``). + + +Explanation of generators, iterators, and StopIteration +======================================================= + +Under this proposal, generators and iterators would be distinct, but +related, concepts. Like the mixing of text and bytes in Python 2, +the mixing of generators and iterators has resulted in certain +perceived conveniences, but proper separation will make bugs more +visible. + +An iterator is an object with a ``__next__`` method. Like many other +dunder methods, it may either return a value, or raise a specific +exception - in this case, ``StopIteration`` - to signal that it has +no value to return. In this, it is similar to ``__getattr__`` (can +raise ``AttributeError``), ``__getitem__`` (can raise ``KeyError``), +and so on. A helper function for an iterator can be written to +follow the same protocol; for example:: + def helper(x, y): + if x > y: return 1 / (x - y) + raise StopIteration + def __next__(self): + if self.a: return helper(self.b, self.c) + return helper(self.d, self.e) + +Both forms of signalling are carried through: a returned value is +returned, an exception bubbles up. The helper is written to match +the protocol of the calling function. + +A generator function is one which contains a ``yield`` expression. +Each time it is (re)started, it may either yield a value, or return +(including "falling off the end"). A helper function for a generator +can also be written, but it must also follow generator protocol:: + def helper(x, y): + if x > y: yield 1 / (x - y) + def gen(self): + if self.a: return (yield from helper(self.b, self.c)) + return (yield from helper(self.d, self.e)) + +In both cases, any unexpected exception will bubble up. Due to the +nature of generators and iterators, an unexpected ``StopIteration`` +inside a generator will be converted into ``RuntimeError``, but +beyond that, all exceptions will propagate normally. + Alternate proposals =================== @@ -137,17 +251,20 @@ [7]_ that if an ``asyncio`` coroutine [8]_ accidentally raises ``StopIteration``, it currently terminates silently, which may present a hard-to-debug mystery to the developer. 
The main proposal turns -such accidents in clearly distinguishable ``RuntimeError`` exceptions, +such accidents into clearly distinguishable ``RuntimeError`` exceptions, but if that is rejected, this alternate proposal would enable ``asyncio`` to distinguish between a ``return`` statement and an accidentally-raised ``StopIteration`` exception. -Of the three outcomes listed above: +Of the three outcomes listed above, two change: -* A yielded value, obviously, would still be returned. -* If the frame is returned from, ``GeneratorReturn`` is raised. +* If a yield point is reached, the value, obviously, would still be + returned. +* If the frame is returned from, ``GeneratorReturn`` (rather than + ``StopIteration``) is raised. * If an instance of ``GeneratorReturn`` would be raised, instead an - instance of ``StopIteration`` would be raised. + instance of ``StopIteration`` would be raised. Any other exception + bubbles up normally. In the third case, the ``StopIteration`` would have the ``value`` of the original ``GeneratorReturn``, and would reference the original -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Fri Nov 21 11:00:32 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Fri, 21 Nov 2014 11:00:32 +0100 Subject: [Python-checkins] Daily reference leaks (31fd106bb68a): sum=3 Message-ID: results for 31fd106bb68a on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogw_yCNJ', '-x'] From python-checkins at python.org Fri Nov 21 18:19:38 2014 From: python-checkins at python.org (brett.cannon) Date: Fri, 21 Nov 2014 17:19:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322834=3A_Have_imp?= =?utf-8?q?ort_suppress_FileNotFoundError_when_the_current?= Message-ID: <20141121171937.7124.50147@psf.io> https://hg.python.org/cpython/rev/8558fff73032 changeset: 93528:8558fff73032 parent: 93525:31fd106bb68a user: Brett Cannon date: Fri Nov 21 12:19:28 2014 -0500 summary: Issue #22834: Have import suppress FileNotFoundError when the current working directory no longer exists. Thanks to Martin Panter for the bug report. files: Doc/library/importlib.rst | 5 + Doc/reference/import.rst | 9 + Doc/whatsnew/3.5.rst | 6 + Lib/importlib/_bootstrap.py | 7 +- Lib/test/test_importlib/import_/test_path.py | 12 + Misc/NEWS | 5 +- Python/importlib.h | 2002 +++++---- 7 files changed, 1044 insertions(+), 1002 deletions(-) diff --git a/Doc/library/importlib.rst b/Doc/library/importlib.rst --- a/Doc/library/importlib.rst +++ b/Doc/library/importlib.rst @@ -794,6 +794,11 @@ .. versionadded:: 3.4 + .. versionchanged:: 3.5 + If the current working directory -- represented by an empty string -- + is no longer valid then ``None`` is returned but no value is cached + in :data:`sys.path_importer_cache`. + .. classmethod:: find_module(fullname, path=None) A legacy wrapper around :meth:`find_spec`. diff --git a/Doc/reference/import.rst b/Doc/reference/import.rst --- a/Doc/reference/import.rst +++ b/Doc/reference/import.rst @@ -754,6 +754,15 @@ to ask the finder for a module spec, which is then used when loading the module. +The current working directory -- denoted by an empty string -- is handled +slightly differently from other entries on :data:`sys.path`. First, if the +current working directory is found to not exist, no value is stored in +:data:`sys.path_importer_cache`. 
Second, the value for the current working +directory is looked up fresh for each module lookup. Third, the path used for +:data:`sys.path_importer_cache` and returned by +:meth:`importlib.machinery.PathFinder.find_spec` will be the actual current +working directory and not the empty string. + Path entry finder protocol -------------------------- diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -436,6 +436,12 @@ bytes-like object is required, not 'sometype'". (Contributed by Ezio Melotti in :issue:`16518`.) +* If the current directory is set to a directory that no longer exists then + :exc:`FileNotFoundError` will no longer be raised and instead + :meth:`~importlib.machinery.FileFinder.find_spec` will return ``None`` + **without** caching ``None`` in :data:`sys.path_importer_cache` which is + different than the typical case (:issue:`22834`). + Changes in the C API -------------------- diff --git a/Lib/importlib/_bootstrap.py b/Lib/importlib/_bootstrap.py --- a/Lib/importlib/_bootstrap.py +++ b/Lib/importlib/_bootstrap.py @@ -1825,7 +1825,12 @@ """ if path == '': - path = _os.getcwd() + try: + path = _os.getcwd() + except FileNotFoundError: + # Don't cache the failure as the cwd can easily change to + # a valid directory later on. + return None try: finder = sys.path_importer_cache[path] except KeyError: diff --git a/Lib/test/test_importlib/import_/test_path.py b/Lib/test/test_importlib/import_/test_path.py --- a/Lib/test/test_importlib/import_/test_path.py +++ b/Lib/test/test_importlib/import_/test_path.py @@ -5,6 +5,7 @@ import os import sys +import tempfile from types import ModuleType import unittest import warnings @@ -158,6 +159,17 @@ got = self.machinery.PathFinder.find_spec('whatever', [path]) self.assertEqual(got, success_finder.spec) + def test_deleted_cwd(self): + # Issue #22834 + self.addCleanup(os.chdir, os.getcwd()) + with tempfile.TemporaryDirectory() as path: + os.chdir(path) + with util.import_state(path=['']): + # Do not want FileNotFoundError raised. + self.assertIsNone(self.machinery.PathFinder.find_spec('whatever')) + + + (Frozen_FinderTests, Source_FinderTests diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -10,6 +10,9 @@ Core and Builtins ----------------- +- Issue #22834: If the current working directory ends up being set to a + non-existent directory then import will no longer raise FileNotFoundError. + - Issue #22869: Move the interpreter startup & shutdown code to a new dedicated pylifecycle.c module @@ -235,7 +238,7 @@ - Issue #22776: Brought excluded code into the scope of a try block in SysLogHandler.emit(). - + - Issue #22665: Add missing get_terminal_size and SameFileError to shutil.__all__. diff --git a/Python/importlib.h b/Python/importlib.h --- a/Python/importlib.h +++ b/Python/importlib.h [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 19:36:20 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 21 Nov 2014 18:36:20 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2319720=3A_Suppress?= =?utf-8?q?ed_context_for_some_exceptions_in_importlib=2E?= Message-ID: <20141121183618.7142.71588@psf.io> https://hg.python.org/cpython/rev/2de3c659a979 changeset: 93529:2de3c659a979 user: Serhiy Storchaka date: Fri Nov 21 20:33:57 2014 +0200 summary: Issue #19720: Suppressed context for some exceptions in importlib. 
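Before the patch itself, a brief sketch of the ``raise ... from None`` idiom this changeset applies; the function and message are hypothetical and not taken from importlib::

    def lookup(mapping, key):
        try:
            return mapping[key]
        except KeyError:
            # Without "from None" the ValueError would carry the KeyError as
            # its __context__ and the traceback would display both exceptions.
            raise ValueError('unknown key: {!r}'.format(key)) from None

    lookup({}, 'spam')   # the traceback now shows only the ValueError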
files: Lib/importlib/__init__.py | 5 +++-- Lib/importlib/_bootstrap.py | 2 +- Lib/importlib/util.py | 4 ++-- 3 files changed, 6 insertions(+), 5 deletions(-) diff --git a/Lib/importlib/__init__.py b/Lib/importlib/__init__.py --- a/Lib/importlib/__init__.py +++ b/Lib/importlib/__init__.py @@ -73,7 +73,7 @@ except KeyError: pass except AttributeError: - raise ValueError('{}.__loader__ is not set'.format(name)) + raise ValueError('{}.__loader__ is not set'.format(name)) from None spec = _bootstrap._find_spec(name, path) # We won't worry about malformed specs (missing attributes). @@ -138,7 +138,8 @@ parent = sys.modules[parent_name] except KeyError: msg = "parent {!r} not in sys.modules" - raise ImportError(msg.format(parent_name), name=parent_name) + raise ImportError(msg.format(parent_name), + name=parent_name) from None else: pkgpath = parent.__path__ else: diff --git a/Lib/importlib/_bootstrap.py b/Lib/importlib/_bootstrap.py --- a/Lib/importlib/_bootstrap.py +++ b/Lib/importlib/_bootstrap.py @@ -2172,7 +2172,7 @@ path = parent_module.__path__ except AttributeError: msg = (_ERR_MSG + '; {!r} is not a package').format(name, parent) - raise ImportError(msg, name=name) + raise ImportError(msg, name=name) from None spec = _find_spec(name, path) if spec is None: raise ImportError(_ERR_MSG.format(name), name=name) diff --git a/Lib/importlib/util.py b/Lib/importlib/util.py --- a/Lib/importlib/util.py +++ b/Lib/importlib/util.py @@ -56,7 +56,7 @@ try: spec = module.__spec__ except AttributeError: - raise ValueError('{}.__spec__ is not set'.format(name)) + raise ValueError('{}.__spec__ is not set'.format(name)) from None else: if spec is None: raise ValueError('{}.__spec__ is None'.format(name)) @@ -96,7 +96,7 @@ try: spec = module.__spec__ except AttributeError: - raise ValueError('{}.__spec__ is not set'.format(name)) + raise ValueError('{}.__spec__ is not set'.format(name)) from None else: if spec is None: raise ValueError('{}.__spec__ is None'.format(name)) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 19:53:22 2014 From: python-checkins at python.org (guido.van.rossum) Date: Fri, 21 Nov 2014 18:53:22 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Added_myself_as_PEP_479_co-au?= =?utf-8?q?thor=2E?= Message-ID: <20141121185318.43946.14453@psf.io> https://hg.python.org/peps/rev/aef3daffdeb0 changeset: 5610:aef3daffdeb0 user: Guido van Rossum date: Fri Nov 21 10:53:13 2014 -0800 summary: Added myself as PEP 479 co-author. 
files: pep-0479.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -2,7 +2,7 @@ Title: Change StopIteration handling inside generators Version: $Revision$ Last-Modified: $Date$ -Author: Chris Angelico +Author: Chris Angelico , Guido van Rossum Status: Draft Type: Standards Track Content-Type: text/x-rst -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Fri Nov 21 21:00:08 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 21 Nov 2014 20:00:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE3Mjkz?= =?utf-8?q?=3A_socket=2Egethostbyname=28=29_can_raise_an_exception_of_Free?= =?utf-8?q?BSD=2E?= Message-ID: <20141121200006.130915.85451@psf.io> https://hg.python.org/cpython/rev/97ceab0bd6f8 changeset: 93531:97ceab0bd6f8 branch: 3.4 parent: 93522:a08c3703f844 user: Serhiy Storchaka date: Fri Nov 21 21:55:39 2014 +0200 summary: Issue #17293: socket.gethostbyname() can raise an exception of FreeBSD. files: Lib/uuid.py | 5 ++++- 1 files changed, 4 insertions(+), 1 deletions(-) diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -361,7 +361,10 @@ def _arp_getnode(): """Get the hardware address on Unix by running arp.""" import os, socket - ip_addr = socket.gethostbyname(socket.gethostname()) + try: + ip_addr = socket.gethostbyname(socket.gethostname()) + except OSError: + return None # Try getting the MAC addr from arp based on our IP address (Solaris). return _find_mac('arp', '-an', [ip_addr], lambda i: -1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 21:00:08 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 21 Nov 2014 20:00:08 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE3Mjkz?= =?utf-8?q?=3A_socket=2Egethostbyname=28=29_can_raise_an_exception_of_Free?= =?utf-8?q?BSD=2E?= Message-ID: <20141121200006.119868.16120@psf.io> https://hg.python.org/cpython/rev/301d62ef5c0b changeset: 93530:301d62ef5c0b branch: 2.7 parent: 93527:c9b4dc1ab7ae user: Serhiy Storchaka date: Fri Nov 21 21:54:43 2014 +0200 summary: Issue #17293: socket.gethostbyname() can raise an exception of FreeBSD. files: Lib/uuid.py | 5 ++++- 1 files changed, 4 insertions(+), 1 deletions(-) diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -345,7 +345,10 @@ def _arp_getnode(): """Get the hardware address on Unix by running arp.""" import os, socket - ip_addr = socket.gethostbyname(socket.gethostname()) + try: + ip_addr = socket.gethostbyname(socket.gethostname()) + except EnvironmentError: + return None # Try getting the MAC addr from arp based on our IP address (Solaris). return _find_mac('arp', '-an', [ip_addr], lambda i: -1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 21 21:00:08 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Fri, 21 Nov 2014 20:00:08 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2319720=3A_Suppressed_context_for_some_exceptions?= =?utf-8?q?_in_importlib=2E?= Message-ID: <20141121200006.7140.43865@psf.io> https://hg.python.org/cpython/rev/8f77f7bb46c7 changeset: 93532:8f77f7bb46c7 parent: 93529:2de3c659a979 parent: 93531:97ceab0bd6f8 user: Serhiy Storchaka date: Fri Nov 21 21:56:57 2014 +0200 summary: Issue #19720: Suppressed context for some exceptions in importlib. 
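The Issue #17293 fixes above, and the merge whose diff follows, all apply the same defensive pattern; restated as a standalone sketch with an invented helper name::

    import socket

    def best_effort_ip():
        # Resolving the local hostname can fail on some platforms (the report
        # was against FreeBSD); treat that as "no address available" rather
        # than letting the exception escape.
        try:
            return socket.gethostbyname(socket.gethostname())
        except OSError:
            return None

On 2.7 the equivalent guard catches ``EnvironmentError``, as the branch-specific diff above shows.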
files: Lib/uuid.py | 5 ++++- 1 files changed, 4 insertions(+), 1 deletions(-) diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -359,7 +359,10 @@ def _arp_getnode(): """Get the hardware address on Unix by running arp.""" import os, socket - ip_addr = socket.gethostbyname(socket.gethostname()) + try: + ip_addr = socket.gethostbyname(socket.gethostname()) + except OSError: + return None # Try getting the MAC addr from arp based on our IP address (Solaris). return _find_mac('arp', '-an', [os.fsencode(ip_addr)], lambda i: -1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 05:34:06 2014 From: python-checkins at python.org (steve.dower) Date: Sat, 22 Nov 2014 04:34:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322869=3A_Remove_d?= =?utf-8?q?uplicate_stack_check_from_pythonrun=2Ec?= Message-ID: <20141122043405.55125.57733@psf.io> https://hg.python.org/cpython/rev/e7df0a47af16 changeset: 93533:e7df0a47af16 user: Steve Dower date: Fri Nov 21 20:33:12 2014 -0800 summary: Issue #22869: Remove duplicate stack check from pythonrun.c files: Python/pythonrun.c | 37 ---------------------------------- 1 files changed, 0 insertions(+), 37 deletions(-) diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -1376,43 +1376,6 @@ } -#if defined(USE_STACKCHECK) -#if defined(WIN32) && defined(_MSC_VER) - -/* Stack checking for Microsoft C */ - -#include -#include - -/* - * Return non-zero when we run out of memory on the stack; zero otherwise. - */ -int -PyOS_CheckStack(void) -{ - __try { - /* alloca throws a stack overflow exception if there's - not enough space left on the stack */ - alloca(PYOS_STACK_MARGIN * sizeof(void*)); - return 0; - } __except (GetExceptionCode() == STATUS_STACK_OVERFLOW ? - EXCEPTION_EXECUTE_HANDLER : - EXCEPTION_CONTINUE_SEARCH) { - int errcode = _resetstkoflw(); - if (errcode == 0) - { - Py_FatalError("Could not reset the stack!"); - } - } - return 1; -} - -#endif /* WIN32 && _MSC_VER */ - -/* Alternate implementations can be added here... */ - -#endif /* USE_STACKCHECK */ - /* Deprecated C API functions still provided for binary compatiblity */ #undef PyParser_SimpleParseFile -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 06:37:43 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 22 Nov 2014 05:37:43 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Closes_=2322869=3A_Move_Py?= =?utf-8?q?OS=5FCheckStack_back_to_pythonrun=2Ec?= Message-ID: <20141122053743.116326.88978@psf.io> https://hg.python.org/cpython/rev/406965684327 changeset: 93534:406965684327 user: Zachary Ware date: Fri Nov 21 23:35:12 2014 -0600 summary: Closes #22869: Move PyOS_CheckStack back to pythonrun.c files: Python/pylifecycle.c | 38 -------------------------------- Python/pythonrun.c | 37 +++++++++++++++++++++++++++++++ 2 files changed, 37 insertions(+), 38 deletions(-) diff --git a/Python/pylifecycle.c b/Python/pylifecycle.c --- a/Python/pylifecycle.c +++ b/Python/pylifecycle.c @@ -1431,44 +1431,6 @@ } -#if defined(USE_STACKCHECK) -#if defined(WIN32) && defined(_MSC_VER) - -/* Stack checking for Microsoft C */ - -#include -#include - -/* - * Return non-zero when we run out of memory on the stack; zero otherwise. 
- */ -int -PyOS_CheckStack(void) -{ - __try { - /* alloca throws a stack overflow exception if there's - not enough space left on the stack */ - alloca(PYOS_STACK_MARGIN * sizeof(void*)); - return 0; - } __except (GetExceptionCode() == STATUS_STACK_OVERFLOW ? - EXCEPTION_EXECUTE_HANDLER : - EXCEPTION_CONTINUE_SEARCH) { - int errcode = _resetstkoflw(); - if (errcode == 0) - { - Py_FatalError("Could not reset the stack!"); - } - } - return 1; -} - -#endif /* WIN32 && _MSC_VER */ - -/* Alternate implementations can be added here... */ - -#endif /* USE_STACKCHECK */ - - /* Wrappers around sigaction() or signal(). */ PyOS_sighandler_t diff --git a/Python/pythonrun.c b/Python/pythonrun.c --- a/Python/pythonrun.c +++ b/Python/pythonrun.c @@ -1376,6 +1376,43 @@ } +#if defined(USE_STACKCHECK) +#if defined(WIN32) && defined(_MSC_VER) + +/* Stack checking for Microsoft C */ + +#include +#include + +/* + * Return non-zero when we run out of memory on the stack; zero otherwise. + */ +int +PyOS_CheckStack(void) +{ + __try { + /* alloca throws a stack overflow exception if there's + not enough space left on the stack */ + alloca(PYOS_STACK_MARGIN * sizeof(void*)); + return 0; + } __except (GetExceptionCode() == STATUS_STACK_OVERFLOW ? + EXCEPTION_EXECUTE_HANDLER : + EXCEPTION_CONTINUE_SEARCH) { + int errcode = _resetstkoflw(); + if (errcode == 0) + { + Py_FatalError("Could not reset the stack!"); + } + } + return 1; +} + +#endif /* WIN32 && _MSC_VER */ + +/* Alternate implementations can be added here... */ + +#endif /* USE_STACKCHECK */ + /* Deprecated C API functions still provided for binary compatiblity */ #undef PyParser_SimpleParseFile -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sat Nov 22 10:32:16 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sat, 22 Nov 2014 10:32:16 +0100 Subject: [Python-checkins] Daily reference leaks (8f77f7bb46c7): sum=3 Message-ID: results for 8f77f7bb46c7 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog6Lg9_j', '-x'] From python-checkins at python.org Sat Nov 22 18:04:40 2014 From: python-checkins at python.org (zach.ware) Date: Sat, 22 Nov 2014 17:04:40 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322834=3A_cwd_can?= =?utf-8?q?=27t_not_exist_on_Windows=2C_skip_the_test?= Message-ID: <20141122170432.116332.62590@psf.io> https://hg.python.org/cpython/rev/d065e6474b67 changeset: 93535:d065e6474b67 user: Zachary Ware date: Sat Nov 22 17:03:46 2014 -0600 summary: Issue #22834: cwd can't not exist on Windows, skip the test files: Lib/test/test_importlib/import_/test_path.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_importlib/import_/test_path.py b/Lib/test/test_importlib/import_/test_path.py --- a/Lib/test/test_importlib/import_/test_path.py +++ b/Lib/test/test_importlib/import_/test_path.py @@ -159,6 +159,7 @@ got = self.machinery.PathFinder.find_spec('whatever', [path]) self.assertEqual(got, success_finder.spec) + @unittest.skipIf(sys.platform == 'win32', "cwd can't not exist on Windows") def test_deleted_cwd(self): # Issue #22834 self.addCleanup(os.chdir, os.getcwd()) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 23:27:14 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 22 Nov 2014 22:27:14 +0000 Subject: [Python-checkins] 
=?utf-8?q?cpython_=282=2E7=29=3A_Add_downloads_?= =?utf-8?q?page_link_to_OS_X_installer_README_screens=2E?= Message-ID: <20141122222714.69781.15723@psf.io> https://hg.python.org/cpython/rev/4f335a16871e changeset: 93536:4f335a16871e branch: 2.7 parent: 93530:301d62ef5c0b user: Ned Deily date: Sat Nov 22 14:17:05 2014 -0800 summary: Add downloads page link to OS X installer README screens. files: Mac/BuildScript/resources/ReadMe.txt | 3 ++- Mac/BuildScript/resources/readme.rtf | 6 ++++-- 2 files changed, 6 insertions(+), 3 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -25,7 +25,8 @@ [NEW for Python 2.7.9] ============================= -The Python installer now includes an option to automatically install or upgrade pip, a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the Customize option at the Installation Type step and uncheck the Install or ugprade pip option. +The Python installer now includes an option to automatically install or upgrade pip, a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the Customize option at the Installation Type step and uncheck the Install or ugprade pip option. For other changes in this +release, see the Release Notes link for this release at https://www.python.org/downloads/. ============================= Binary installer support for OS X 10.4 and 10.3.9 discontinued diff --git a/Mac/BuildScript/resources/readme.rtf b/Mac/BuildScript/resources/readme.rtf --- a/Mac/BuildScript/resources/readme.rtf +++ b/Mac/BuildScript/resources/readme.rtf @@ -1,4 +1,4 @@ -{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf160 {\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} {\colortbl;\red255\green255\blue255;} \margl1440\margr1440\vieww15240\viewh15540\viewkind0 @@ -50,7 +50,9 @@ \i Installation Type \i0 step and uncheck the \i Install or ugprade pip -\i0 option.\ +\i0 option. For other changes in this release, see the +\i Release Notes +\i0 link for this release at {\field{\*\fldinst{HYPERLINK "https://www.python.org/downloads/"}}{\fldrslt https://www.python.org/downloads/}}.\ \ \b \ul Binary installer support for OS X 10.4 and 10.3.9 discontinued\ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 23:27:19 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 22 Nov 2014 22:27:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Add_downloads_page_link_to_OS_X_installer_README_screens?= =?utf-8?q?=2E?= Message-ID: <20141122222718.55103.73367@psf.io> https://hg.python.org/cpython/rev/25037b214e1d changeset: 93538:25037b214e1d parent: 93535:d065e6474b67 parent: 93537:7d1bd8eed59e user: Ned Deily date: Sat Nov 22 14:26:33 2014 -0800 summary: Add downloads page link to OS X installer README screens. 
files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 23:27:19 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 22 Nov 2014 22:27:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Add_downloads_?= =?utf-8?q?page_link_to_OS_X_installer_README_screens=2E?= Message-ID: <20141122222716.69791.66969@psf.io> https://hg.python.org/cpython/rev/7d1bd8eed59e changeset: 93537:7d1bd8eed59e branch: 3.4 parent: 93531:97ceab0bd6f8 user: Ned Deily date: Sat Nov 22 14:20:30 2014 -0800 summary: Add downloads page link to OS X installer README screens. files: Mac/BuildScript/resources/ReadMe.txt | 2 ++ Mac/BuildScript/resources/readme.rtf | 15 +++++++-------- 2 files changed, 9 insertions(+), 8 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -29,6 +29,8 @@ To make it easier to use scripts installed by third-party Python packages, with pip or by other means, the Shell profile updater option is now enabled by default, as has been the case with Python 2.7.x installers. You can also turn this option off by selecting Customize and unchecking the Shell profile updater option. You can also update your shell profile later by launching the Update Shell Profile command found in the /Applications/Python $VERSION folder. You may need to start a new terminal window for the changes to take effect. +For other changes in this release, see the Release Notes link for this release at https://www.python.org/downloads/. + ============================= Python 3 and Python 2 Co-existence ============================= diff --git a/Mac/BuildScript/resources/readme.rtf b/Mac/BuildScript/resources/readme.rtf --- a/Mac/BuildScript/resources/readme.rtf +++ b/Mac/BuildScript/resources/readme.rtf @@ -1,7 +1,7 @@ -{\rtf1\ansi\ansicpg1252\cocoartf1265\cocoasubrtf210 +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf160 {\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} {\colortbl;\red255\green255\blue255;} -\margl1440\margr1440\vieww13020\viewh15160\viewkind0 +\margl1440\margr1440\vieww13380\viewh14600\viewkind0 \pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural \f0\fs24 \cf0 This package will install Python $FULL_VERSION for Mac OS X $MACOSX_DEPLOYMENT_TARGET for the following architecture(s): $ARCHITECTURES.\ @@ -41,8 +41,7 @@ \b \cf0 \ul \ulc0 New Installation Options and Defaults\ \ulnone [NEW for Python 3.4.0] \b0 \ -\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural -\cf0 \ +\ The Python installer now includes an option to automatically install or upgrade \f1 pip \f0 , a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the @@ -67,12 +66,12 @@ \f1 /Applications/Python $VERSION \f0 folder. 
You may need to start a new terminal window for the changes to take effect.\ \ -\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural +For other changes in this release, see the Release Notes link for this release at {\field{\*\fldinst{HYPERLINK "https://www.python.org/downloads/"}}{\fldrslt https://www.python.org/downloads/}}.\ +\ -\b \cf0 \ul \ulc0 Python 3 and Python 2 Co-existence\ -\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural +\b \ul Python 3 and Python 2 Co-existence\ -\b0 \cf0 \ulnone \ +\b0 \ulnone \ Python.org Python $VERSION and 2.7.x versions can both be installed on your system and will not conflict. Command names for Python 3 contain a 3 in them, \f1 python3 \f0 (or -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 23:41:54 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 22 Nov 2014 22:41:54 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Really_add_downloads_page_?= =?utf-8?q?link_to_OS_X_installer_README_screens=2E?= Message-ID: <20141122224152.69775.78793@psf.io> https://hg.python.org/cpython/rev/23f8a511050a changeset: 93540:23f8a511050a parent: 93538:25037b214e1d user: Ned Deily date: Sat Nov 22 14:41:21 2014 -0800 summary: Really add downloads page link to OS X installer README screens. files: Mac/BuildScript/resources/ReadMe.txt | 6 ++++++ Mac/BuildScript/resources/readme.rtf | 10 +++++++++- 2 files changed, 15 insertions(+), 1 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -7,6 +7,12 @@ To use IDLE or other programs that use the Tkinter graphical user interface toolkit, you need to install a newer third-party version of the Tcl/Tk frameworks. Visit https://www.python.org/download/mac/tcltk/ for current information about supported and recommended versions of Tcl/Tk for this version of Python and of Mac OS X. ============================= +New Installation Options and Defaults +============================= + +For other changes in this release, see the Release Notes link for this release at https://www.python.org/downloads/. 
+ +============================= Python 3 and Python 2 Co-existence ============================= diff --git a/Mac/BuildScript/resources/readme.rtf b/Mac/BuildScript/resources/readme.rtf --- a/Mac/BuildScript/resources/readme.rtf +++ b/Mac/BuildScript/resources/readme.rtf @@ -1,4 +1,4 @@ -{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf140 +{\rtf1\ansi\ansicpg1252\cocoartf1343\cocoasubrtf160 {\fonttbl\f0\fswiss\fcharset0 Helvetica;\f1\fmodern\fcharset0 CourierNewPSMT;} {\colortbl;\red255\green255\blue255;} \margl1440\margr1440\vieww13020\viewh15160\viewkind0 @@ -18,6 +18,14 @@ \b \ul \ \pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural +\cf0 \ulc0 New Installation Options and Defaults\ +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural +\cf0 \ulc0 \ + +\b0 \ulnone For other changes in this release, see the Release Notes link for this release at {\field{\*\fldinst{HYPERLINK "https://www.python.org/downloads/"}}{\fldrslt https://www.python.org/downloads/}}.\ + +\b \ul \ +\pard\tx720\tx1440\tx2160\tx2880\tx3600\tx4320\tx5040\tx5760\tx6480\tx7200\tx7920\tx8640\pardirnatural \cf0 \ulc0 Python 3 and Python 2 Co-existence\ \b0 \ulnone \ -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 22 23:41:54 2014 From: python-checkins at python.org (ned.deily) Date: Sat, 22 Nov 2014 22:41:54 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Remove_line_br?= =?utf-8?q?eaks_in_OS_X_installer_README_screen=2E?= Message-ID: <20141122224152.55103.9862@psf.io> https://hg.python.org/cpython/rev/b171834c63e7 changeset: 93539:b171834c63e7 branch: 2.7 parent: 93536:4f335a16871e user: Ned Deily date: Sat Nov 22 14:35:43 2014 -0800 summary: Remove line breaks in OS X installer README screen. files: Mac/BuildScript/resources/ReadMe.txt | 18 ++------------- 1 files changed, 3 insertions(+), 15 deletions(-) diff --git a/Mac/BuildScript/resources/ReadMe.txt b/Mac/BuildScript/resources/ReadMe.txt --- a/Mac/BuildScript/resources/ReadMe.txt +++ b/Mac/BuildScript/resources/ReadMe.txt @@ -25,29 +25,17 @@ [NEW for Python 2.7.9] ============================= -The Python installer now includes an option to automatically install or upgrade pip, a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the Customize option at the Installation Type step and uncheck the Install or ugprade pip option. For other changes in this -release, see the Release Notes link for this release at https://www.python.org/downloads/. +The Python installer now includes an option to automatically install or upgrade pip, a tool for installing and managing Python packages. This option is enabled by default and no Internet access is required. If you do not want the installer to do this, select the Customize option at the Installation Type step and uncheck the Install or ugprade pip option. For other changes in this release, see the Release Notes link for this release at https://www.python.org/downloads/. ============================= Binary installer support for OS X 10.4 and 10.3.9 discontinued [CHANGED for Python 2.7.9] ============================= -As previously announced, binary installers for Python 2.7.9 from python.org -no longer support Mac OS X 10.3.9 (Panther) and 10.4.x (Tiger) systems. -These systems were last updated by Apple in 2005 and 2007. 
As of 2.7.9, the -32-bit-only installer supports PPC and Intel Macs running OS X 10.5 (Leopard). -10.5 was the last OS X release for PPC machines (G4 and G5). The 64-/32-bit -installer configuration remains unchanged and should normally be used on OS X -10.6 (Snow Leopard) and later systems. This aligns Python 2.7.x installer -configurations with those currently provided with Python 3.x. If needed, -it is still possible to build Python from source for 10.3.9 and 10.4. +As previously announced, binary installers for Python 2.7.9 from python.org no longer support Mac OS X 10.3.9 (Panther) and 10.4.x (Tiger) systems. These systems were last updated by Apple in 2005 and 2007. As of 2.7.9, the 32-bit-only installer supports PPC and Intel Macs running OS X 10.5 (Leopard). 10.5 was the last OS X release for PPC machines (G4 and G5). The 64-/32-bit installer configuration remains unchanged and should normally be used on OS X 10.6 (Snow Leopard) and later systems. This aligns Python 2.7.x installer configurations with those currently provided with Python 3.x. If needed, it is still possible to build Python from source for 10.3.9 and 10.4. ============================= Python 3 and Python 2 Co-existence ============================= -Python.org Python 2.7 and 3.x versions can both be installed on your system and -will not conflict. Python 2 command names contain a 2 or no digit: python2 (or -python2.7 or python), idle2 (or idle2.7 or idle), pip2 (or pip2.7 or pip), etc. -Command names for Python 3 contain a 3 in them: python3, idle3, pip3, etc. +Python.org Python 2.7 and 3.x versions can both be installed on your system and will not conflict. Python 2 command names contain a 2 or no digit: python2 (or python2.7 or python), idle2 (or idle2.7 or idle), pip2 (or pip2.7 or pip), etc. Command names for Python 3 contain a 3 in them: python3, idle3, pip3, etc. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 01:04:45 2014 From: python-checkins at python.org (ned.deily) Date: Sun, 23 Nov 2014 00:04:45 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Fix_2to3_refer?= =?utf-8?q?ence_link_in_pyporting=2Erst=2E?= Message-ID: <20141123000439.69777.28845@psf.io> https://hg.python.org/cpython/rev/414332e55f6c changeset: 93541:414332e55f6c branch: 2.7 parent: 93539:b171834c63e7 user: Ned Deily date: Sat Nov 22 16:03:40 2014 -0800 summary: Fix 2to3 reference link in pyporting.rst. files: Doc/howto/pyporting.rst | 7 +++---- 1 files changed, 3 insertions(+), 4 deletions(-) diff --git a/Doc/howto/pyporting.rst b/Doc/howto/pyporting.rst --- a/Doc/howto/pyporting.rst +++ b/Doc/howto/pyporting.rst @@ -565,10 +565,9 @@ --------------------------------------------------------- If you have Python 2 code but going forward only want to improve it as Python 3 -code, then you can use 2to3_ to translate your Python 2 code to Python 3 code. -This is only recommended, though, if your current version of your project is -going into maintenance mode and you want all new features to be exclusive to -Python 3. +code, then you can use :ref:`2to3 <2to3-reference>` to translate your Python 2 +code to Python 3 code. This is only recommended, though, if your current +version of your project is going into maintenance mode and you want all new features to be exclusive to Python 3. 
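A hedged illustration of the 2to3 translation step that paragraph recommends, driven through ``lib2to3`` so it runs as ordinary Python 3 code; the snippet being converted is made up::

    from lib2to3.refactor import RefactoringTool, get_fixers_from_package

    source = 'print "hello"\n'          # Python 2 only syntax
    tool = RefactoringTool(get_fixers_from_package('lib2to3.fixes'))
    print(tool.refactor_string(source, '<example>'))   # -> print("hello")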
Backporting Python 3 code to Python 2 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 06:56:38 2014 From: python-checkins at python.org (raymond.hettinger) Date: Sun, 23 Nov 2014 05:56:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_PEP_479=3A__Don=27t_let_St?= =?utf-8?q?opIteration_bubble_out_of_calls_to_next=28=29_inside_a?= Message-ID: <20141123055630.84289.59648@psf.io> https://hg.python.org/cpython/rev/9eb0d0eb0992 changeset: 93542:9eb0d0eb0992 parent: 93540:23f8a511050a user: Raymond Hettinger date: Sat Nov 22 21:56:23 2014 -0800 summary: PEP 479: Don't let StopIteration bubble out of calls to next() inside a generator. files: Doc/library/itertools.rst | 20 ++++++++++++++++---- Lib/xml/etree/ElementPath.py | 15 ++++++++++++--- 2 files changed, 28 insertions(+), 7 deletions(-) diff --git a/Doc/library/itertools.rst b/Doc/library/itertools.rst --- a/Doc/library/itertools.rst +++ b/Doc/library/itertools.rst @@ -104,7 +104,10 @@ # accumulate([1,2,3,4,5]) --> 1 3 6 10 15 # accumulate([1,2,3,4,5], operator.mul) --> 1 2 6 24 120 it = iter(iterable) - total = next(it) + try: + total = next(it) + except StopIteration: + return yield total for element in it: total = func(total, element) @@ -405,7 +408,10 @@ def _grouper(self, tgtkey): while self.currkey == tgtkey: yield self.currvalue - self.currvalue = next(self.it) # Exit on StopIteration + try: + self.currvalue = next(self.it) + except StopIteration: + return self.currkey = self.keyfunc(self.currvalue) @@ -429,7 +435,10 @@ # islice('ABCDEFG', 0, None, 2) --> A C E G s = slice(*args) it = iter(range(s.start or 0, s.stop or sys.maxsize, s.step or 1)) - nexti = next(it) + try: + nexti = next(it) + except StopIteration: + return for i, element in enumerate(iterable): if i == nexti: yield element @@ -587,7 +596,10 @@ def gen(mydeque): while True: if not mydeque: # when the local deque is empty - newval = next(it) # fetch a new value and + try: + newval = next(it) # fetch a new value and + except StopIteration: + return for d in deques: # load it to all the deques d.append(newval) yield mydeque.popleft() diff --git a/Lib/xml/etree/ElementPath.py b/Lib/xml/etree/ElementPath.py --- a/Lib/xml/etree/ElementPath.py +++ b/Lib/xml/etree/ElementPath.py @@ -114,7 +114,10 @@ return select def prepare_descendant(next, token): - token = next() + try: + token = next() + except StopIteration: + return if token[0] == "*": tag = "*" elif not token[0]: @@ -148,7 +151,10 @@ signature = [] predicate = [] while 1: - token = next() + try: + token = next() + except StopIteration: + return if token[0] == "]": break if token[0] and token[0][:1] in "'\"": @@ -261,7 +267,10 @@ if path[:1] == "/": raise SyntaxError("cannot use absolute path on element") next = iter(xpath_tokenizer(path, namespaces)).__next__ - token = next() + try: + token = next() + except StopIteration: + return selector = [] while 1: try: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 07:14:48 2014 From: python-checkins at python.org (raymond.hettinger) Date: Sun, 23 Nov 2014 06:14:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_PEP_479=3A__Use_the_return?= =?utf-8?q?-keyword_instead_of_raising_StopIteration_inside_a?= Message-ID: <20141123061447.84279.4879@psf.io> https://hg.python.org/cpython/rev/e8b3083bb148 changeset: 93543:e8b3083bb148 user: Raymond Hettinger date: Sat Nov 22 22:14:41 2014 -0800 summary: PEP 479: Use the return-keyword instead of raising StopIteration inside a 
generators. files: Lib/ipaddress.py | 2 +- Lib/mailbox.py | 2 +- Lib/test/test_buffer.py | 2 +- Lib/test/test_collections.py | 2 +- Lib/test/test_itertools.py | 2 -- Lib/test/test_sys_setprofile.py | 1 - 6 files changed, 4 insertions(+), 7 deletions(-) diff --git a/Lib/ipaddress.py b/Lib/ipaddress.py --- a/Lib/ipaddress.py +++ b/Lib/ipaddress.py @@ -808,7 +808,7 @@ other.broadcast_address <= self.broadcast_address): raise ValueError('%s not contained in %s' % (other, self)) if other == self: - raise StopIteration + return # Make sure we're comparing the network of other. other = other.__class__('%s/%s' % (other.network_address, diff --git a/Lib/mailbox.py b/Lib/mailbox.py --- a/Lib/mailbox.py +++ b/Lib/mailbox.py @@ -1949,7 +1949,7 @@ while True: line = self.readline() if not line: - raise StopIteration + return yield line def tell(self): diff --git a/Lib/test/test_buffer.py b/Lib/test/test_buffer.py --- a/Lib/test/test_buffer.py +++ b/Lib/test/test_buffer.py @@ -216,7 +216,7 @@ for t in iter_mode(nitems, testobj): yield t if testobj != 'ndarray': - raise StopIteration + return yield struct_items(nitems, testobj) diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -511,7 +511,7 @@ class NextOnly: def __next__(self): yield 1 - raise StopIteration + return self.assertNotIsInstance(NextOnly(), Iterator) def test_Sized(self): diff --git a/Lib/test/test_itertools.py b/Lib/test/test_itertools.py --- a/Lib/test/test_itertools.py +++ b/Lib/test/test_itertools.py @@ -1803,8 +1803,6 @@ hist.append(3) yield 2 hist.append(4) - if x: - raise StopIteration hist = [] self.assertRaises(AssertionError, list, chain(gen1(), gen2(False))) diff --git a/Lib/test/test_sys_setprofile.py b/Lib/test/test_sys_setprofile.py --- a/Lib/test/test_sys_setprofile.py +++ b/Lib/test/test_sys_setprofile.py @@ -260,7 +260,6 @@ def f(): for i in range(2): yield i - raise StopIteration def g(p): for i in f(): pass -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sun Nov 23 10:34:12 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sun, 23 Nov 2014 10:34:12 +0100 Subject: [Python-checkins] Daily reference leaks (23f8a511050a): sum=3 Message-ID: results for 23f8a511050a on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogFDz2UQ', '-x'] From python-checkins at python.org Sun Nov 23 15:50:40 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 14:50:40 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Null_merge?= Message-ID: <20141123145039.84295.54126@psf.io> https://hg.python.org/cpython/rev/334659e8a625 changeset: 93545:334659e8a625 parent: 93543:e8b3083bb148 parent: 93544:653dfb1240d5 user: Antoine Pitrou date: Sun Nov 23 15:50:21 2014 +0100 summary: Null merge files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 15:50:40 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 14:50:40 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjM4?= =?utf-8?q?=3A_SSLv3_is_now_disabled_throughout_the_standard_library=2E?= Message-ID: <20141123145039.84283.5766@psf.io> https://hg.python.org/cpython/rev/653dfb1240d5 changeset: 93544:653dfb1240d5 branch: 3.4 
parent: 93537:7d1bd8eed59e user: Antoine Pitrou date: Fri Oct 17 19:28:30 2014 +0200 summary: Issue #22638: SSLv3 is now disabled throughout the standard library. It can still be enabled by instantiating a SSLContext manually. files: Lib/ssl.py | 3 +++ Misc/NEWS | 3 +++ 2 files changed, 6 insertions(+), 0 deletions(-) diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -458,6 +458,9 @@ context = SSLContext(protocol) # SSLv2 considered harmful. context.options |= OP_NO_SSLv2 + # SSLv3 has problematic security and is only required for really old + # clients such as IE6 on Windows XP + context.options |= OP_NO_SSLv3 if cert_reqs is not None: context.verify_mode = cert_reqs diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22638: SSLv3 is now disabled throughout the standard library. + It can still be enabled by instantiating a SSLContext manually. + - Issue #22370: Windows detection in pathlib is now more robust. - Issue #22841: Reject coroutines in asyncio add_signal_handler(). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 16:01:30 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 15:01:30 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322894=3A_TestCase=2EsubTest=28=29_would_cause_t?= =?utf-8?q?he_test_suite_to_be_stopped_when?= Message-ID: <20141123150128.84299.90937@psf.io> https://hg.python.org/cpython/rev/04103cece49d changeset: 93547:04103cece49d parent: 93545:334659e8a625 parent: 93546:993e8f795194 user: Antoine Pitrou date: Sun Nov 23 15:56:41 2014 +0100 summary: Issue #22894: TestCase.subTest() would cause the test suite to be stopped when in failfast mode, even in the absence of failures. files: Lib/unittest/result.py | 3 +- Lib/unittest/test/test_case.py | 28 ++++++++++++++++++++++ Misc/NEWS | 3 ++ 3 files changed, 33 insertions(+), 1 deletions(-) diff --git a/Lib/unittest/result.py b/Lib/unittest/result.py --- a/Lib/unittest/result.py +++ b/Lib/unittest/result.py @@ -121,7 +121,6 @@ self.failures.append((test, self._exc_info_to_string(err, test))) self._mirrorOutput = True - @failfast def addSubTest(self, test, subtest, err): """Called at the end of a subtest. 'err' is None if the subtest ended successfully, otherwise it's a @@ -130,6 +129,8 @@ # By default, we don't do anything with successful subtests, but # more sophisticated test results might want to record them. 
if err is not None: + if getattr(self, 'failfast', False): + self.stop() if issubclass(err[0], test.failureException): errors = self.failures else: diff --git a/Lib/unittest/test/test_case.py b/Lib/unittest/test/test_case.py --- a/Lib/unittest/test/test_case.py +++ b/Lib/unittest/test/test_case.py @@ -397,6 +397,34 @@ Foo(events).run(result) self.assertEqual(events, expected) + def test_subtests_failfast(self): + # Ensure proper test flow with subtests and failfast (issue #22894) + events = [] + + class Foo(unittest.TestCase): + def test_a(self): + with self.subTest(): + events.append('a1') + events.append('a2') + + def test_b(self): + with self.subTest(): + events.append('b1') + with self.subTest(): + self.fail('failure') + events.append('b2') + + def test_c(self): + events.append('c') + + result = unittest.TestResult() + result.failfast = True + suite = unittest.makeSuite(Foo) + suite.run(result) + + expected = ['a1', 'a2', 'b1'] + self.assertEqual(events, expected) + # "This class attribute gives the exception raised by the test() method. # If a test framework needs to use a specialized exception, possibly to # carry additional information, it must subclass this exception in diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,9 @@ Library ------- +- Issue #22894: TestCase.subTest() would cause the test suite to be stopped + when in failfast mode, even in the absence of failures. + - Issue #22796: HTTP cookie parsing is now stricter, in order to protect against potential injection attacks. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 16:01:30 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 15:01:30 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyODk0?= =?utf-8?q?=3A_TestCase=2EsubTest=28=29_would_cause_the_test_suite_to_be_s?= =?utf-8?q?topped_when?= Message-ID: <20141123150128.116320.52021@psf.io> https://hg.python.org/cpython/rev/993e8f795194 changeset: 93546:993e8f795194 branch: 3.4 parent: 93544:653dfb1240d5 user: Antoine Pitrou date: Sun Nov 23 15:55:11 2014 +0100 summary: Issue #22894: TestCase.subTest() would cause the test suite to be stopped when in failfast mode, even in the absence of failures. files: Lib/unittest/result.py | 3 +- Lib/unittest/test/test_case.py | 28 ++++++++++++++++++++++ Misc/NEWS | 3 ++ 3 files changed, 33 insertions(+), 1 deletions(-) diff --git a/Lib/unittest/result.py b/Lib/unittest/result.py --- a/Lib/unittest/result.py +++ b/Lib/unittest/result.py @@ -121,7 +121,6 @@ self.failures.append((test, self._exc_info_to_string(err, test))) self._mirrorOutput = True - @failfast def addSubTest(self, test, subtest, err): """Called at the end of a subtest. 'err' is None if the subtest ended successfully, otherwise it's a @@ -130,6 +129,8 @@ # By default, we don't do anything with successful subtests, but # more sophisticated test results might want to record them. 
if err is not None: + if getattr(self, 'failfast', False): + self.stop() if issubclass(err[0], test.failureException): errors = self.failures else: diff --git a/Lib/unittest/test/test_case.py b/Lib/unittest/test/test_case.py --- a/Lib/unittest/test/test_case.py +++ b/Lib/unittest/test/test_case.py @@ -397,6 +397,34 @@ Foo(events).run(result) self.assertEqual(events, expected) + def test_subtests_failfast(self): + # Ensure proper test flow with subtests and failfast (issue #22894) + events = [] + + class Foo(unittest.TestCase): + def test_a(self): + with self.subTest(): + events.append('a1') + events.append('a2') + + def test_b(self): + with self.subTest(): + events.append('b1') + with self.subTest(): + self.fail('failure') + events.append('b2') + + def test_c(self): + events.append('c') + + result = unittest.TestResult() + result.failfast = True + suite = unittest.makeSuite(Foo) + suite.run(result) + + expected = ['a1', 'a2', 'b1'] + self.assertEqual(events, expected) + # "This class attribute gives the exception raised by the test() method. # If a test framework needs to use a specialized exception, possibly to # carry additional information, it must subclass this exception in diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22894: TestCase.subTest() would cause the test suite to be stopped + when in failfast mode, even in the absence of failures. + - Issue #22638: SSLv3 is now disabled throughout the standard library. It can still be enabled by instantiating a SSLContext manually. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 16:01:30 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 15:01:30 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Update_importlib=2Eh?= Message-ID: <20141123150128.69795.80190@psf.io> https://hg.python.org/cpython/rev/dfe7d9fee0b5 changeset: 93548:dfe7d9fee0b5 user: Antoine Pitrou date: Sun Nov 23 16:01:20 2014 +0100 summary: Update importlib.h files: Python/importlib.h | 860 ++++++++++++++++---------------- 1 files changed, 430 insertions(+), 430 deletions(-) diff --git a/Python/importlib.h b/Python/importlib.h --- a/Python/importlib.h +++ b/Python/importlib.h [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 16:26:30 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sun, 23 Nov 2014 15:26:30 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Backport_disab?= =?utf-8?q?ling_of_SSLv3_in_ssl=2E=5Fcreate=5Fstdlib=5Fcontext=28=29_=28is?= =?utf-8?b?c3VlICMyMjYzOCku?= Message-ID: <20141123152629.84281.55327@psf.io> https://hg.python.org/cpython/rev/f762cbb712de changeset: 93549:f762cbb712de branch: 2.7 parent: 93541:414332e55f6c user: Antoine Pitrou date: Fri Oct 17 19:28:30 2014 +0200 summary: Backport disabling of SSLv3 in ssl._create_stdlib_context() (issue #22638). The backport currently doesn't achieve anything since the function isn't used (yet). files: Lib/ssl.py | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -445,6 +445,9 @@ context = SSLContext(protocol) # SSLv2 considered harmful. 
context.options |= OP_NO_SSLv2 + # SSLv3 has problematic security and is only required for really old + # clients such as IE6 on Windows XP + context.options |= OP_NO_SSLv3 if cert_reqs is not None: context.verify_mode = cert_reqs -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 18:46:28 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 17:46:28 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogaW5pdGlhbGl6ZSBf?= =?utf-8?q?makefile=5Frefs_earlier_so_things_don=27t_blow_up_when_close=28?= =?utf-8?q?=29_is?= Message-ID: <20141123174628.84295.16860@psf.io> https://hg.python.org/cpython/rev/588ebc8fd3da changeset: 93550:588ebc8fd3da branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 11:16:48 2014 -0600 summary: initialize _makefile_refs earlier so things don't blow up when close() is called in the constructor files: Lib/ssl.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -483,6 +483,7 @@ server_hostname=None, _context=None): + self._makefile_refs = 0 if _context: self._context = _context else: @@ -565,7 +566,6 @@ except (OSError, ValueError): self.close() raise - self._makefile_refs = 0 @property def context(self): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 18:46:28 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 17:46:28 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141123174628.84287.23211@psf.io> https://hg.python.org/cpython/rev/ebfb966c8979 changeset: 93552:ebfb966c8979 parent: 93548:dfe7d9fee0b5 parent: 93551:3cc8b7227db4 user: Benjamin Peterson date: Sun Nov 23 11:43:43 2014 -0600 summary: merge 3.4 files: Doc/library/urllib.request.rst | 5 +---- 1 files changed, 1 insertions(+), 4 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -57,10 +57,7 @@ point to a directory of hashed certificate files. More information can be found in :meth:`ssl.SSLContext.load_verify_locations`. - The *cadefault* parameter specifies whether to fall back to loading a - default certificate store defined by the underlying OpenSSL library if the - *cafile* and *capath* parameters are omitted. This will only work on - some non-Windows platforms. + The *cadefault* parameter is ignored. 
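A hedged usage sketch for the verification-related parameters discussed in this run of changesets; the URL is only a placeholder, and the stdlib's default contexts also leave SSLv2 and SSLv3 disabled, in line with the Issue #22638 changes above::

    import ssl
    import urllib.request

    context = ssl.create_default_context()   # certificate and hostname checks on
    with urllib.request.urlopen('https://www.python.org/', context=context) as response:
        print(response.status)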
For http and https urls, this function returns a :class:`http.client.HTTPResponse` object which has the following -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 18:46:29 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 17:46:29 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_document_that_?= =?utf-8?q?cadefault_does_nothing_now?= Message-ID: <20141123174628.55099.14448@psf.io> https://hg.python.org/cpython/rev/3cc8b7227db4 changeset: 93551:3cc8b7227db4 branch: 3.4 parent: 93546:993e8f795194 user: Benjamin Peterson date: Sun Nov 23 11:43:33 2014 -0600 summary: document that cadefault does nothing now files: Doc/library/urllib.request.rst | 5 +---- 1 files changed, 1 insertions(+), 4 deletions(-) diff --git a/Doc/library/urllib.request.rst b/Doc/library/urllib.request.rst --- a/Doc/library/urllib.request.rst +++ b/Doc/library/urllib.request.rst @@ -57,10 +57,7 @@ point to a directory of hashed certificate files. More information can be found in :meth:`ssl.SSLContext.load_verify_locations`. - The *cadefault* parameter specifies whether to fall back to loading a - default certificate store defined by the underlying OpenSSL library if the - *cafile* and *capath* parameters are omitted. This will only work on - some non-Windows platforms. + The *cadefault* parameter is ignored. For http and https urls, this function returns a :class:`http.client.HTTPResponse` object which has the following -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 18:46:29 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 17:46:29 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_allow_passing_?= =?utf-8?q?cert/ssl_information_to_urllib2=2Eurlopen_and?= Message-ID: <20141123174628.84299.85124@psf.io> https://hg.python.org/cpython/rev/1882157b298a changeset: 93553:1882157b298a branch: 2.7 parent: 93550:588ebc8fd3da user: Benjamin Peterson date: Sun Nov 23 11:42:45 2014 -0600 summary: allow passing cert/ssl information to urllib2.urlopen and httplib.HTTPSConnection This is basically a backport of issues #9003 and #22366. files: Doc/library/httplib.rst | 24 +- Doc/library/urllib2.rst | 32 +- Lib/httplib.py | 35 ++- Lib/test/keycert2.pem | 31 ++ Lib/test/selfsigned_pythontestdotnet.pem | 16 + Lib/test/test_httplib.py | 158 +++++++++- Lib/test/test_ssl.py | 9 +- Lib/test/test_urllib2.py | 13 + Lib/test/test_urllib2_localnet.py | 59 ++++- Lib/urllib2.py | 48 ++- Misc/NEWS | 5 + 11 files changed, 378 insertions(+), 52 deletions(-) diff --git a/Doc/library/httplib.rst b/Doc/library/httplib.rst --- a/Doc/library/httplib.rst +++ b/Doc/library/httplib.rst @@ -70,12 +70,25 @@ *source_address* was added. -.. class:: HTTPSConnection(host[, port[, key_file[, cert_file[, strict[, timeout[, source_address]]]]]]) +.. class:: HTTPSConnection(host[, port[, key_file[, cert_file[, strict[, timeout[, source_address, context, check_hostname]]]]]]) A subclass of :class:`HTTPConnection` that uses SSL for communication with - secure servers. Default port is ``443``. *key_file* is the name of a PEM - formatted file that contains your private key. *cert_file* is a PEM formatted - certificate chain file. + secure servers. Default port is ``443``. If *context* is specified, it must + be a :class:`ssl.SSLContext` instance describing the various SSL options. 
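A minimal sketch of a connection built this way (assuming Python 2.7.9 or later,
network access, and python.org purely as an example host):

    import httplib
    import ssl

    ctx = ssl.create_default_context()    # verifies certificates and host names
    conn = httplib.HTTPSConnection("www.python.org", 443, context=ctx)
    conn.request("GET", "/")
    print conn.getresponse().status
    conn.close()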
+ + *key_file* and *cert_file* are deprecated, please use + :meth:`ssl.SSLContext.load_cert_chain` instead, or let + :func:`ssl.create_default_context` select the system's trusted CA + certificates for you. + + Please read :ref:`ssl-security` for more information on best practices. + + .. note:: + If *context* is specified and has a :attr:`~ssl.SSLContext.verify_mode` + of either :data:`~ssl.CERT_OPTIONAL` or :data:`~ssl.CERT_REQUIRED`, then + by default *host* is matched against the host name(s) allowed by the + server's certificate. If you want to change that behaviour, you can + explicitly set *check_hostname* to False. .. warning:: This does not do any verification of the server's certificate. @@ -88,6 +101,9 @@ .. versionchanged:: 2.7 *source_address* was added. + .. versionchanged:: 2.7.9 + *context* and *check_hostname* was added. + .. class:: HTTPResponse(sock, debuglevel=0, strict=0) diff --git a/Doc/library/urllib2.rst b/Doc/library/urllib2.rst --- a/Doc/library/urllib2.rst +++ b/Doc/library/urllib2.rst @@ -22,13 +22,10 @@ The :mod:`urllib2` module defines the following functions: -.. function:: urlopen(url[, data][, timeout]) +.. function:: urlopen(url[, data[, timeout[, cafile[, capath[, cadefault[, context]]]]]) Open the URL *url*, which can be either a string or a :class:`Request` object. - .. warning:: - HTTPS requests do not do any verification of the server's certificate. - *data* may be a string specifying additional data to send to the server, or ``None`` if no such data is needed. Currently HTTP requests are the only ones that use *data*; the HTTP request will be a POST instead of a GET when the @@ -41,7 +38,19 @@ The optional *timeout* parameter specifies a timeout in seconds for blocking operations like the connection attempt (if not specified, the global default timeout setting will be used). This actually only works for HTTP, HTTPS and - FTP connections. + FTP connections. + + If *context* is specified, it must be a :class:`ssl.SSLContext` instance + describing the various SSL options. See :class:`~httplib.HTTPSConnection` for + more details. + + The optional *cafile* and *capath* parameters specify a set of trusted CA + certificates for HTTPS requests. *cafile* should point to a single file + containing a bundle of CA certificates, whereas *capath* should point to a + directory of hashed certificate files. More information can be found in + :meth:`ssl.SSLContext.load_verify_locations`. + + The *cadefault* parameter is ignored. This function returns a file-like object with three additional methods: @@ -66,7 +75,10 @@ handled through the proxy. .. versionchanged:: 2.6 - *timeout* was added. + *timeout* was added. + + .. versionchanged:: 2.7.9 + *cafile*, *capath*, *cadefault*, and *context* were added. .. function:: install_opener(opener) @@ -280,9 +292,13 @@ A class to handle opening of HTTP URLs. -.. class:: HTTPSHandler() +.. class:: HTTPSHandler([debuglevel[, context[, check_hostname]]]) - A class to handle opening of HTTPS URLs. + A class to handle opening of HTTPS URLs. *context* and *check_hostname* have + the same meaning as for :class:`httplib.HTTPSConnection`. + + .. versionchanged:: 2.7.9 + *context* and *check_hostname* were added. .. 
class:: FileHandler() diff --git a/Lib/httplib.py b/Lib/httplib.py --- a/Lib/httplib.py +++ b/Lib/httplib.py @@ -1187,21 +1187,44 @@ def __init__(self, host, port=None, key_file=None, cert_file=None, strict=None, timeout=socket._GLOBAL_DEFAULT_TIMEOUT, - source_address=None): + source_address=None, context=None, check_hostname=None): HTTPConnection.__init__(self, host, port, strict, timeout, source_address) self.key_file = key_file self.cert_file = cert_file + if context is None: + context = ssl.create_default_context() + will_verify = context.verify_mode != ssl.CERT_NONE + if check_hostname is None: + check_hostname = will_verify + elif check_hostname and not will_verify: + raise ValueError("check_hostname needs a SSL context with " + "either CERT_OPTIONAL or CERT_REQUIRED") + if key_file or cert_file: + context.load_cert_chain(cert_file, key_file) + self._context = context + self._check_hostname = check_hostname def connect(self): "Connect to a host on a given (SSL) port." - sock = self._create_connection((self.host, self.port), - self.timeout, self.source_address) + HTTPConnection.connect(self) + if self._tunnel_host: - self.sock = sock - self._tunnel() - self.sock = ssl.wrap_socket(sock, self.key_file, self.cert_file) + server_hostname = self._tunnel_host + else: + server_hostname = self.host + sni_hostname = server_hostname if ssl.HAS_SNI else None + + self.sock = self._context.wrap_socket(self.sock, + server_hostname=sni_hostname) + if not self._context.check_hostname and self._check_hostname: + try: + ssl.match_hostname(self.sock.getpeercert(), server_hostname) + except Exception: + self.sock.shutdown(socket.SHUT_RDWR) + self.sock.close() + raise __all__.append("HTTPSConnection") diff --git a/Lib/test/keycert2.pem b/Lib/test/keycert2.pem new file mode 100644 --- /dev/null +++ b/Lib/test/keycert2.pem @@ -0,0 +1,31 @@ +-----BEGIN PRIVATE KEY----- +MIICdQIBADANBgkqhkiG9w0BAQEFAASCAl8wggJbAgEAAoGBANcLaMB7T/Wi9DBc +PltGzgt8cxsv55m7PQPHMZvn6Ke8xmNqcmEzib8opRwKGrCV6TltKeFlNSg8dwQK +Tl4ktyTkGCVweRQJ37AkBayvEBml5s+QD4vlhqkJPsL/Nsd+fnqngOGc5+59+C6r +s3XpiLlF5ah/z8q92Mnw54nypw1JAgMBAAECgYBE3t2Mj7GbDLZB6rj5yKJioVfI +BD6bSJEQ7bGgqdQkLFwpKMU7BiN+ekjuwvmrRkesYZ7BFgXBPiQrwhU5J28Tpj5B +EOMYSIOHfzdalhxDGM1q2oK9LDFiCotTaSdEzMYadel5rmKXJ0zcK2Jho0PCuECf +tf/ghRxK+h1Hm0tKgQJBAO6MdGDSmGKYX6/5kPDje7we/lSLorSDkYmV0tmVShsc +JxgaGaapazceA/sHL3Myx7Eenkip+yPYDXEDFvAKNDECQQDmxsT9NOp6mo7ISvky +GFr2vVHsJ745BMWoma4rFjPBVnS8RkgK+b2EpDCdZSrQ9zw2r8sKTgrEyrDiGTEg +wJyZAkA8OOc0flYMJg2aHnYR6kwVjPmGHI5h5gk648EMPx0rROs1sXkiUwkHLCOz +HvhCq+Iv+9vX2lnVjbiu/CmxRdIxAkA1YEfzoKeTD+hyXxTgB04Sv5sRGegfXAEz +i8gC4zG5R/vcCA1lrHmvEiLEZL/QcT6WD3bQvVg0SAU9ZkI8pxARAkA7yqMSvP1l +gJXy44R+rzpLYb1/PtiLkIkaKG3x9TUfPnfD2jY09fPkZlfsRU3/uS09IkhSwimV +d5rWoljEfdou +-----END PRIVATE KEY----- +-----BEGIN CERTIFICATE----- +MIICXTCCAcagAwIBAgIJALVQzebTtrXFMA0GCSqGSIb3DQEBBQUAMGIxCzAJBgNV +BAYTAlhZMRcwFQYDVQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9u +IFNvZnR3YXJlIEZvdW5kYXRpb24xFTATBgNVBAMMDGZha2Vob3N0bmFtZTAeFw0x +NDExMjMxNzAwMDdaFw0yNDExMjAxNzAwMDdaMGIxCzAJBgNVBAYTAlhZMRcwFQYD +VQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9uIFNvZnR3YXJlIEZv +dW5kYXRpb24xFTATBgNVBAMMDGZha2Vob3N0bmFtZTCBnzANBgkqhkiG9w0BAQEF +AAOBjQAwgYkCgYEA1wtowHtP9aL0MFw+W0bOC3xzGy/nmbs9A8cxm+fop7zGY2py +YTOJvyilHAoasJXpOW0p4WU1KDx3BApOXiS3JOQYJXB5FAnfsCQFrK8QGaXmz5AP +i+WGqQk+wv82x35+eqeA4Zzn7n34LquzdemIuUXlqH/Pyr3YyfDnifKnDUkCAwEA +AaMbMBkwFwYDVR0RBBAwDoIMZmFrZWhvc3RuYW1lMA0GCSqGSIb3DQEBBQUAA4GB +AKuay3vDKfWzt5+ch/HHBsert84ISot4fUjzXDA/oOgTOEjVcSShHxqNShMOW1oA 
+QYBpBB/5Kx5RkD/w6imhucxt2WQPRgjX4x4bwMipVH/HvFDp03mG51/Cpi1TyZ74 +El7qa/Pd4lHhOLzMKBA6503fpeYSFUIBxZbGLqylqRK7 +-----END CERTIFICATE----- diff --git a/Lib/test/selfsigned_pythontestdotnet.pem b/Lib/test/selfsigned_pythontestdotnet.pem new file mode 100644 --- /dev/null +++ b/Lib/test/selfsigned_pythontestdotnet.pem @@ -0,0 +1,16 @@ +-----BEGIN CERTIFICATE----- +MIIChzCCAfCgAwIBAgIJAKGU95wKR8pSMA0GCSqGSIb3DQEBBQUAMHAxCzAJBgNV +BAYTAlhZMRcwFQYDVQQHDA5DYXN0bGUgQW50aHJheDEjMCEGA1UECgwaUHl0aG9u +IFNvZnR3YXJlIEZvdW5kYXRpb24xIzAhBgNVBAMMGnNlbGYtc2lnbmVkLnB5dGhv +bnRlc3QubmV0MB4XDTE0MTEwMjE4MDkyOVoXDTI0MTAzMDE4MDkyOVowcDELMAkG +A1UEBhMCWFkxFzAVBgNVBAcMDkNhc3RsZSBBbnRocmF4MSMwIQYDVQQKDBpQeXRo +b24gU29mdHdhcmUgRm91bmRhdGlvbjEjMCEGA1UEAwwac2VsZi1zaWduZWQucHl0 +aG9udGVzdC5uZXQwgZ8wDQYJKoZIhvcNAQEBBQADgY0AMIGJAoGBANDXQXW9tjyZ +Xt0Iv2tLL1+jinr4wGg36ioLDLFkMf+2Y1GL0v0BnKYG4N1OKlAU15LXGeGer8vm +Sv/yIvmdrELvhAbbo3w4a9TMYQA4XkIVLdvu3mvNOAet+8PMJxn26dbDhG809ALv +EHY57lQsBS3G59RZyBPVqAqmImWNJnVzAgMBAAGjKTAnMCUGA1UdEQQeMByCGnNl +bGYtc2lnbmVkLnB5dGhvbnRlc3QubmV0MA0GCSqGSIb3DQEBBQUAA4GBAIOXmdtM +eG9qzP9TiXW/Gc/zI4cBfdCpC+Y4gOfC9bQUC7hefix4iO3+iZjgy3X/FaRxUUoV +HKiXcXIaWqTSUWp45cSh0MbwZXudp6JIAptzdAhvvCrPKeC9i9GvxsPD4LtDAL97 +vSaxQBezA7hdxZd90/EeyMgVZgAnTCnvAWX9 +-----END CERTIFICATE----- diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -1,6 +1,7 @@ import httplib import array import httplib +import os import StringIO import socket import errno @@ -10,6 +11,14 @@ from test import test_support +here = os.path.dirname(__file__) +# Self-signed cert file for 'localhost' +CERT_localhost = os.path.join(here, 'keycert.pem') +# Self-signed cert file for 'fakehostname' +CERT_fakehostname = os.path.join(here, 'keycert2.pem') +# Self-signed cert file for self-signed.pythontest.net +CERT_selfsigned_pythontestdotnet = os.path.join(here, 'selfsigned_pythontestdotnet.pem') + HOST = test_support.HOST class FakeSocket: @@ -506,36 +515,140 @@ self.assertEqual(httpConn.sock.gettimeout(), 30) httpConn.close() +class HTTPSTest(TestCase): -class HTTPSTimeoutTest(TestCase): -# XXX Here should be tests for HTTPS, there isn't any right now! 
+ def setUp(self): + if not hasattr(httplib, 'HTTPSConnection'): + self.skipTest('ssl support required') + + def make_server(self, certfile): + from test.ssl_servers import make_https_server + return make_https_server(self, certfile=certfile) def test_attributes(self): - # simple test to check it's storing it - if hasattr(httplib, 'HTTPSConnection'): - h = httplib.HTTPSConnection(HOST, TimeoutTest.PORT, timeout=30) - self.assertEqual(h.timeout, 30) + # simple test to check it's storing the timeout + h = httplib.HTTPSConnection(HOST, TimeoutTest.PORT, timeout=30) + self.assertEqual(h.timeout, 30) - @unittest.skipIf(not hasattr(httplib, 'HTTPS'), 'httplib.HTTPS not available') + def test_networked(self): + # Default settings: requires a valid cert from a trusted CA + import ssl + test_support.requires('network') + with test_support.transient_internet('self-signed.pythontest.net'): + h = httplib.HTTPSConnection('self-signed.pythontest.net', 443) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_networked_noverification(self): + # Switch off cert verification + import ssl + test_support.requires('network') + with test_support.transient_internet('self-signed.pythontest.net'): + context = ssl._create_stdlib_context() + h = httplib.HTTPSConnection('self-signed.pythontest.net', 443, + context=context) + h.request('GET', '/') + resp = h.getresponse() + self.assertIn('nginx', resp.getheader('server')) + + def test_networked_trusted_by_default_cert(self): + # Default settings: requires a valid cert from a trusted CA + test_support.requires('network') + with test_support.transient_internet('www.python.org'): + h = httplib.HTTPSConnection('www.python.org', 443) + h.request('GET', '/') + resp = h.getresponse() + content_type = resp.getheader('content-type') + self.assertIn('text/html', content_type) + + def test_networked_good_cert(self): + # We feed the server's cert as a validating cert + import ssl + test_support.requires('network') + with test_support.transient_internet('self-signed.pythontest.net'): + context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) + context.verify_mode = ssl.CERT_REQUIRED + context.load_verify_locations(CERT_selfsigned_pythontestdotnet) + h = httplib.HTTPSConnection('self-signed.pythontest.net', 443, context=context) + h.request('GET', '/') + resp = h.getresponse() + server_string = resp.getheader('server') + self.assertIn('nginx', server_string) + + def test_networked_bad_cert(self): + # We feed a "CA" cert that is unrelated to the server's cert + import ssl + test_support.requires('network') + with test_support.transient_internet('self-signed.pythontest.net'): + context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) + context.verify_mode = ssl.CERT_REQUIRED + context.load_verify_locations(CERT_localhost) + h = httplib.HTTPSConnection('self-signed.pythontest.net', 443, context=context) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_local_unknown_cert(self): + # The custom cert isn't known to the default trust bundle + import ssl + server = self.make_server(CERT_localhost) + h = httplib.HTTPSConnection('localhost', server.port) + with self.assertRaises(ssl.SSLError) as exc_info: + h.request('GET', '/') + self.assertEqual(exc_info.exception.reason, 'CERTIFICATE_VERIFY_FAILED') + + def test_local_good_hostname(self): + # The (valid) cert validates the HTTP hostname + 
import ssl + server = self.make_server(CERT_localhost) + context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) + context.verify_mode = ssl.CERT_REQUIRED + context.load_verify_locations(CERT_localhost) + h = httplib.HTTPSConnection('localhost', server.port, context=context) + h.request('GET', '/nonexistent') + resp = h.getresponse() + self.assertEqual(resp.status, 404) + + def test_local_bad_hostname(self): + # The (valid) cert doesn't validate the HTTP hostname + import ssl + server = self.make_server(CERT_fakehostname) + context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) + context.verify_mode = ssl.CERT_REQUIRED + context.load_verify_locations(CERT_fakehostname) + h = httplib.HTTPSConnection('localhost', server.port, context=context) + with self.assertRaises(ssl.CertificateError): + h.request('GET', '/') + # Same with explicit check_hostname=True + h = httplib.HTTPSConnection('localhost', server.port, context=context, + check_hostname=True) + with self.assertRaises(ssl.CertificateError): + h.request('GET', '/') + # With check_hostname=False, the mismatching is ignored + h = httplib.HTTPSConnection('localhost', server.port, context=context, + check_hostname=False) + h.request('GET', '/nonexistent') + resp = h.getresponse() + self.assertEqual(resp.status, 404) + def test_host_port(self): # Check invalid host_port - # Note that httplib does not accept user:password@ in the host-port. for hp in ("www.python.org:abc", "user:password at www.python.org"): - self.assertRaises(httplib.InvalidURL, httplib.HTTP, hp) + self.assertRaises(httplib.InvalidURL, httplib.HTTPSConnection, hp) - for hp, h, p in (("[fe80::207:e9ff:fe9b]:8000", "fe80::207:e9ff:fe9b", - 8000), - ("pypi.python.org:443", "pypi.python.org", 443), - ("pypi.python.org", "pypi.python.org", 443), - ("pypi.python.org:", "pypi.python.org", 443), - ("[fe80::207:e9ff:fe9b]", "fe80::207:e9ff:fe9b", 443)): - http = httplib.HTTPS(hp) - c = http._conn - if h != c.host: - self.fail("Host incorrectly parsed: %s != %s" % (h, c.host)) - if p != c.port: - self.fail("Port incorrectly parsed: %s != %s" % (p, c.host)) + for hp, h, p in (("[fe80::207:e9ff:fe9b]:8000", + "fe80::207:e9ff:fe9b", 8000), + ("www.python.org:443", "www.python.org", 443), + ("www.python.org:", "www.python.org", 443), + ("www.python.org", "www.python.org", 443), + ("[fe80::207:e9ff:fe9b]", "fe80::207:e9ff:fe9b", 443), + ("[fe80::207:e9ff:fe9b]:", "fe80::207:e9ff:fe9b", + 443)): + c = httplib.HTTPSConnection(hp) + self.assertEqual(h, c.host) + self.assertEqual(p, c.port) class TunnelTests(TestCase): @@ -577,9 +690,10 @@ self.assertTrue('Host: destination.com' in conn.sock.data) + at test_support.reap_threads def test_main(verbose=None): test_support.run_unittest(HeaderTests, OfflineTest, BasicTest, TimeoutTest, - HTTPSTimeoutTest, SourceAddressTest, TunnelTests) + HTTPSTest, SourceAddressTest, TunnelTests) if __name__ == '__main__': test_main() diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -14,7 +14,7 @@ import errno import pprint import tempfile -import urllib +import urllib2 import traceback import weakref import platform @@ -2388,10 +2388,11 @@ d1 = f.read() d2 = '' # now fetch the same data from the HTTPS server - url = 'https://%s:%d/%s' % ( - HOST, server.port, os.path.split(CERTFILE)[1]) + url = 'https://localhost:%d/%s' % ( + server.port, os.path.split(CERTFILE)[1]) + context = ssl.create_default_context(cafile=CERTFILE) with support.check_py3k_warnings(): - f = urllib.urlopen(url) + f = urllib2.urlopen(url, 
context=context) try: dlen = f.info().getheader("content-length") if dlen and (int(dlen) > 0): diff --git a/Lib/test/test_urllib2.py b/Lib/test/test_urllib2.py --- a/Lib/test/test_urllib2.py +++ b/Lib/test/test_urllib2.py @@ -8,6 +8,11 @@ import urllib2 from urllib2 import Request, OpenerDirector +try: + import ssl +except ImportError: + ssl = None + # XXX # Request # CacheFTPHandler (hard to write) @@ -47,6 +52,14 @@ for string, list in tests: self.assertEqual(urllib2.parse_http_list(string), list) + @unittest.skipUnless(ssl, "ssl module required") + def test_cafile_and_context(self): + context = ssl.create_default_context() + with self.assertRaises(ValueError): + urllib2.urlopen( + "https://localhost", cafile="/nonexistent/path", context=context + ) + def test_request_headers_dict(): """ diff --git a/Lib/test/test_urllib2_localnet.py b/Lib/test/test_urllib2_localnet.py --- a/Lib/test/test_urllib2_localnet.py +++ b/Lib/test/test_urllib2_localnet.py @@ -1,3 +1,4 @@ +import os import base64 import urlparse import urllib2 @@ -10,6 +11,17 @@ mimetools = test_support.import_module('mimetools', deprecated=True) threading = test_support.import_module('threading') +try: + import ssl +except ImportError: + ssl = None + +here = os.path.dirname(__file__) +# Self-signed cert file for 'localhost' +CERT_localhost = os.path.join(here, 'keycert.pem') +# Self-signed cert file for 'fakehostname' +CERT_fakehostname = os.path.join(here, 'keycert2.pem') + # Loopback http server infrastructure class LoopbackHttpServer(BaseHTTPServer.HTTPServer): @@ -24,7 +36,7 @@ # Set the timeout of our listening socket really low so # that we can stop the server easily. - self.socket.settimeout(1.0) + self.socket.settimeout(0.1) def get_request(self): """BaseHTTPServer method, overridden.""" @@ -433,6 +445,19 @@ urllib2.install_opener(opener) super(TestUrlopen, self).setUp() + def urlopen(self, url, data=None, **kwargs): + l = [] + f = urllib2.urlopen(url, data, **kwargs) + try: + # Exercise various methods + l.extend(f.readlines(200)) + l.append(f.readline()) + l.append(f.read(1024)) + l.append(f.read()) + finally: + f.close() + return b"".join(l) + def start_server(self, responses): handler = GetRequestHandler(responses) @@ -443,6 +468,16 @@ handler.port = port return handler + def start_https_server(self, responses=None, **kwargs): + if not hasattr(urllib2, 'HTTPSHandler'): + self.skipTest('ssl support required') + from test.ssl_servers import make_https_server + if responses is None: + responses = [(200, [], b"we care a bit")] + handler = GetRequestHandler(responses) + server = make_https_server(self, handler_class=handler, **kwargs) + handler.port = server.port + return handler def test_redirection(self): expected_response = 'We got here...' 
@@ -513,6 +548,28 @@ finally: self.server.stop() + def test_https(self): + handler = self.start_https_server() + context = ssl.create_default_context(cafile=CERT_localhost) + data = self.urlopen("https://localhost:%s/bizarre" % handler.port, context=context) + self.assertEqual(data, b"we care a bit") + + def test_https_with_cafile(self): + handler = self.start_https_server(certfile=CERT_localhost) + import ssl + # Good cert + data = self.urlopen("https://localhost:%s/bizarre" % handler.port, + cafile=CERT_localhost) + self.assertEqual(data, b"we care a bit") + # Bad cert + with self.assertRaises(urllib2.URLError) as cm: + self.urlopen("https://localhost:%s/bizarre" % handler.port, + cafile=CERT_fakehostname) + # Good cert, but mismatching hostname + handler = self.start_https_server(certfile=CERT_fakehostname) + with self.assertRaises(ssl.CertificateError) as cm: + self.urlopen("https://localhost:%s/bizarre" % handler.port, + cafile=CERT_fakehostname) def test_sending_headers(self): handler = self.start_server([(200, [], "we don't care")]) diff --git a/Lib/urllib2.py b/Lib/urllib2.py --- a/Lib/urllib2.py +++ b/Lib/urllib2.py @@ -109,6 +109,14 @@ except ImportError: from StringIO import StringIO +# check for SSL +try: + import ssl +except ImportError: + _have_ssl = False +else: + _have_ssl = True + from urllib import (unwrap, unquote, splittype, splithost, quote, addinfourl, splitport, splittag, toBytes, splitattr, ftpwrapper, splituser, splitpasswd, splitvalue) @@ -120,11 +128,30 @@ __version__ = sys.version[:3] _opener = None -def urlopen(url, data=None, timeout=socket._GLOBAL_DEFAULT_TIMEOUT): +def urlopen(url, data=None, timeout=socket._GLOBAL_DEFAULT_TIMEOUT, + cafile=None, capath=None, cadefault=False, context=None): global _opener - if _opener is None: - _opener = build_opener() - return _opener.open(url, data, timeout) + if cafile or capath or cadefault: + if context is not None: + raise ValueError( + "You can't pass both context and any of cafile, capath, and " + "cadefault" + ) + if not _have_ssl: + raise ValueError('SSL support not available') + context = ssl._create_stdlib_context(cert_reqs=ssl.CERT_REQUIRED, + cafile=cafile, + capath=capath) + https_handler = HTTPSHandler(context=context, check_hostname=True) + opener = build_opener(https_handler) + elif context: + https_handler = HTTPSHandler(context=context) + opener = build_opener(https_handler) + elif _opener is None: + _opener = opener = build_opener() + else: + opener = _opener + return opener.open(url, data, timeout) def install_opener(opener): global _opener @@ -1121,7 +1148,7 @@ return request - def do_open(self, http_class, req): + def do_open(self, http_class, req, **http_conn_args): """Return an addinfourl object for the request, using http_class. http_class must implement the HTTPConnection API from httplib. 
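A rough sketch, from the caller's side, of what the new urlopen() assembles when
*cafile* or *capath* is given (assuming Python 2.7.9 or later; the URL and the
CA bundle path below are only placeholders):

    import ssl
    import urllib2

    ctx = ssl.create_default_context(cafile="/path/to/ca-bundle.pem")
    opener = urllib2.build_opener(urllib2.HTTPSHandler(context=ctx))
    response = opener.open("https://example.org/")
    print response.getcode()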
@@ -1135,7 +1162,8 @@ if not host: raise URLError('no host given') - h = http_class(host, timeout=req.timeout) # will parse host:port + # will parse host:port + h = http_class(host, timeout=req.timeout, **http_conn_args) h.set_debuglevel(self._debuglevel) headers = dict(req.unredirected_hdrs) @@ -1203,8 +1231,14 @@ if hasattr(httplib, 'HTTPS'): class HTTPSHandler(AbstractHTTPHandler): + def __init__(self, debuglevel=0, context=None, check_hostname=None): + AbstractHTTPHandler.__init__(self, debuglevel) + self._context = context + self._check_hostname = check_hostname + def https_open(self, req): - return self.do_open(httplib.HTTPSConnection, req) + return self.do_open(httplib.HTTPSConnection, req, + context=self._context, check_hostname=self._check_hostname) https_request = AbstractHTTPHandler.do_request_ diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -42,6 +42,11 @@ Library ------- +- Issue #9003 and #22366: httplib.HTTPSConnection, urllib2.HTTPSHandler and + urllib2.urlopen now take optional arguments to allow for server certificate + checking, as recommended in public uses of HTTPS. This backport is part of PEP + 467. + - Issue #12728: Different Unicode characters having the same uppercase but different lowercase are now matched in case-insensitive regular expressions. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 18:52:58 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 17:52:58 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_remove_py3k_wa?= =?utf-8?q?rning_guard?= Message-ID: <20141123175258.69787.67727@psf.io> https://hg.python.org/cpython/rev/e6d63cfcd8e8 changeset: 93554:e6d63cfcd8e8 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 11:52:46 2014 -0600 summary: remove py3k warning guard files: Lib/test/test_ssl.py | 3 +-- 1 files changed, 1 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -2391,8 +2391,7 @@ url = 'https://localhost:%d/%s' % ( server.port, os.path.split(CERTFILE)[1]) context = ssl.create_default_context(cafile=CERTFILE) - with support.check_py3k_warnings(): - f = urllib2.urlopen(url, context=context) + f = urllib2.urlopen(url, context=context) try: dlen = f.info().getheader("content-length") if dlen and (int(dlen) > 0): -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 19:59:08 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 18:59:08 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_remove_strange?= =?utf-8?q?_casts?= Message-ID: <20141123185907.69805.23514@psf.io> https://hg.python.org/cpython/rev/863a7bf95f18 changeset: 93555:863a7bf95f18 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 12:58:54 2014 -0600 summary: remove strange casts files: Objects/intobject.c | 8 ++++---- 1 files changed, 4 insertions(+), 4 deletions(-) diff --git a/Objects/intobject.c b/Objects/intobject.c --- a/Objects/intobject.c +++ b/Objects/intobject.c @@ -208,7 +208,7 @@ { #if SIZEOF_SIZE_T != SIZEOF_LONG PyNumberMethods *nb; - PyIntObject *io; + PyObject *io; Py_ssize_t val; #endif @@ -232,15 +232,15 @@ } if (nb->nb_long != 0) - io = (PyIntObject*) (*nb->nb_long) (op); + io = (*nb->nb_long)(op); else - io = (PyIntObject*) (*nb->nb_int) (op); + io = (*nb->nb_int)(op); if (io == NULL) return -1; if (!PyInt_Check(io)) { if (PyLong_Check(io)) { /* got a long? 
=> retry int conversion */ - val = _PyLong_AsSsize_t((PyObject *)io); + val = _PyLong_AsSsize_t(io); Py_DECREF(io); if ((val == -1) && PyErr_Occurred()) return -1; -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 23 20:05:58 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 19:05:58 +0000 Subject: [Python-checkins] =?utf-8?q?test=3A_testing?= Message-ID: <20141123190557.116322.78141@psf.io> https://hg.python.org/test/rev/b2abdad5f699 changeset: 218:b2abdad5f699 user: Benjamin Peterson date: Sun Nov 23 13:05:47 2014 -0600 summary: testing files: g | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/g b/g --- a/g +++ b/g @@ -1,1 +1,2 @@ gg +h -- Repository URL: https://hg.python.org/test From python-checkins at python.org Sun Nov 23 20:18:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 19:18:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_fix_this_test_?= =?utf-8?q?when_sizeof=28long=29_=3C_sizeof=28size=5Ft=29?= Message-ID: <20141123191812.55107.24508@psf.io> https://hg.python.org/cpython/rev/a69da17e7060 changeset: 93556:a69da17e7060 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 13:17:57 2014 -0600 summary: fix this test when sizeof(long) < sizeof(size_t) files: Lib/test/test_sys.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_sys.py b/Lib/test/test_sys.py --- a/Lib/test/test_sys.py +++ b/Lib/test/test_sys.py @@ -507,7 +507,7 @@ sentinel = ["sentinel"] self.assertIs(sys.getsizeof(InvalidSizeof(), sentinel), sentinel) - class OverflowSizeof(int): + class OverflowSizeof(long): def __sizeof__(self): return int(self) self.assertEqual(sys.getsizeof(OverflowSizeof(sys.maxsize)), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 00:06:59 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 23:06:59 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI5MjEp?= Message-ID: <20141123230654.84283.86983@psf.io> https://hg.python.org/cpython/rev/24dfe7310cc1 changeset: 93558:24dfe7310cc1 parent: 93552:ebfb966c8979 parent: 93557:f2d4beb90a5b user: Benjamin Peterson date: Sun Nov 23 17:06:39 2014 -0600 summary: merge 3.4 (#22921) files: Doc/library/ssl.rst | 14 ++++---- Lib/asyncio/selector_events.py | 2 +- Lib/ftplib.py | 6 +-- Lib/http/client.py | 3 +- Lib/imaplib.py | 6 +-- Lib/nntplib.py | 3 +- Lib/poplib.py | 6 +-- Lib/smtplib.py | 6 +-- Lib/ssl.py | 7 +--- Lib/test/test_asyncio/test_events.py | 8 ----- Lib/test/test_asyncio/test_selector_events.py | 2 +- Lib/test/test_ftplib.py | 4 -- Lib/test/test_imaplib.py | 4 -- Lib/test/test_poplib.py | 4 -- Lib/test/test_ssl.py | 16 ++------- Modules/_ssl.c | 12 ------- 16 files changed, 24 insertions(+), 79 deletions(-) diff --git a/Doc/library/ssl.rst b/Doc/library/ssl.rst --- a/Doc/library/ssl.rst +++ b/Doc/library/ssl.rst @@ -680,8 +680,7 @@ .. data:: HAS_SNI Whether the OpenSSL library has built-in support for the *Server Name - Indication* extension (as defined in :rfc:`4366`). When true, you can - use the *server_hostname* argument to :meth:`SSLContext.wrap_socket`. + Indication* extension (as defined in :rfc:`4366`). .. versionadded:: 3.2 @@ -1259,11 +1258,12 @@ On client connections, the optional parameter *server_hostname* specifies the hostname of the service which we are connecting to. 
This allows a single server to host multiple SSL-based services with distinct certificates, - quite similarly to HTTP virtual hosts. Specifying *server_hostname* - will raise a :exc:`ValueError` if the OpenSSL library doesn't have support - for it (that is, if :data:`HAS_SNI` is :const:`False`). Specifying - *server_hostname* will also raise a :exc:`ValueError` if *server_side* - is true. + quite similarly to HTTP virtual hosts. Specifying *server_hostname* will + raise a :exc:`ValueError` if *server_side* is true. + + .. versionchanged:: 3.5 + Always allow a server_hostname to be passed, even if OpenSSL does not + have SNI. .. method:: SSLContext.wrap_bio(incoming, outgoing, server_side=False, \ server_hostname=None) diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -708,7 +708,7 @@ 'server_side': server_side, 'do_handshake_on_connect': False, } - if server_hostname and not server_side and ssl.HAS_SNI: + if server_hostname and not server_side: wrap_kwargs['server_hostname'] = server_hostname sslsock = sslcontext.wrap_socket(rawsock, **wrap_kwargs) diff --git a/Lib/ftplib.py b/Lib/ftplib.py --- a/Lib/ftplib.py +++ b/Lib/ftplib.py @@ -747,9 +747,8 @@ resp = self.voidcmd('AUTH TLS') else: resp = self.voidcmd('AUTH SSL') - server_hostname = self.host if ssl.HAS_SNI else None self.sock = self.context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile(mode='r', encoding=self.encoding) return resp @@ -788,9 +787,8 @@ def ntransfercmd(self, cmd, rest=None): conn, size = FTP.ntransfercmd(self, cmd, rest) if self._prot_p: - server_hostname = self.host if ssl.HAS_SNI else None conn = self.context.wrap_socket(conn, - server_hostname=server_hostname) + server_hostname=self.host) return conn, size def abort(self): diff --git a/Lib/http/client.py b/Lib/http/client.py --- a/Lib/http/client.py +++ b/Lib/http/client.py @@ -1288,10 +1288,9 @@ server_hostname = self._tunnel_host else: server_hostname = self.host - sni_hostname = server_hostname if ssl.HAS_SNI else None self.sock = self._context.wrap_socket(self.sock, - server_hostname=sni_hostname) + server_hostname=server_hostname) if not self._context.check_hostname and self._check_hostname: try: ssl.match_hostname(self.sock.getpeercert(), server_hostname) diff --git a/Lib/imaplib.py b/Lib/imaplib.py --- a/Lib/imaplib.py +++ b/Lib/imaplib.py @@ -753,9 +753,8 @@ ssl_context = ssl._create_stdlib_context() typ, dat = self._simple_command(name) if typ == 'OK': - server_hostname = self.host if ssl.HAS_SNI else None self.sock = ssl_context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile('rb') self._tls_established = True self._get_capabilities() @@ -1231,9 +1230,8 @@ def _create_socket(self): sock = IMAP4._create_socket(self) - server_hostname = self.host if ssl.HAS_SNI else None return self.ssl_context.wrap_socket(sock, - server_hostname=server_hostname) + server_hostname=self.host) def open(self, host='', port=IMAP4_SSL_PORT): """Setup connection to remote server on "host:port". diff --git a/Lib/nntplib.py b/Lib/nntplib.py --- a/Lib/nntplib.py +++ b/Lib/nntplib.py @@ -289,8 +289,7 @@ # Generate a default SSL context if none was passed. 
if context is None: context = ssl._create_stdlib_context() - server_hostname = hostname if ssl.HAS_SNI else None - return context.wrap_socket(sock, server_hostname=server_hostname) + return context.wrap_socket(sock, server_hostname=hostname) # The classes themselves diff --git a/Lib/poplib.py b/Lib/poplib.py --- a/Lib/poplib.py +++ b/Lib/poplib.py @@ -387,9 +387,8 @@ if context is None: context = ssl._create_stdlib_context() resp = self._shortcmd('STLS') - server_hostname = self.host if ssl.HAS_SNI else None self.sock = context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile('rb') self._tls_established = True return resp @@ -430,9 +429,8 @@ def _create_socket(self, timeout): sock = POP3._create_socket(self, timeout) - server_hostname = self.host if ssl.HAS_SNI else None sock = self.context.wrap_socket(sock, - server_hostname=server_hostname) + server_hostname=self.host) return sock def stls(self, keyfile=None, certfile=None, context=None): diff --git a/Lib/smtplib.py b/Lib/smtplib.py --- a/Lib/smtplib.py +++ b/Lib/smtplib.py @@ -709,9 +709,8 @@ if context is None: context = ssl._create_stdlib_context(certfile=certfile, keyfile=keyfile) - server_hostname = self._host if ssl.HAS_SNI else None self.sock = context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self._host) self.file = None # RFC 3207: # The client MUST discard any knowledge obtained from @@ -940,9 +939,8 @@ print('connect:', (host, port), file=stderr) new_socket = socket.create_connection((host, port), timeout, self.source_address) - server_hostname = self._host if ssl.HAS_SNI else None new_socket = self.context.wrap_socket(new_socket, - server_hostname=server_hostname) + server_hostname=self._host) return new_socket __all__.append("SMTP_SSL") diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -655,12 +655,7 @@ raise ValueError("server_hostname can only be specified " "in client mode") if self._context.check_hostname and not server_hostname: - if HAS_SNI: - raise ValueError("check_hostname requires server_hostname") - else: - raise ValueError("check_hostname requires server_hostname, " - "but it's not supported by your OpenSSL " - "library") + raise ValueError("check_hostname requires server_hostname") self.server_side = server_side self.server_hostname = server_hostname self.do_handshake_on_connect = do_handshake_on_connect diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -12,9 +12,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI import subprocess import sys import threading @@ -857,7 +854,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_verify_failed(self): proto = MyProto(loop=self.loop) server, host, port = self._make_ssl_server( @@ -882,7 +878,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') @unittest.skipUnless(hasattr(socket, 'AF_UNIX'), 'No UNIX Sockets') def test_create_unix_server_ssl_verify_failed(self): proto = MyProto(loop=self.loop) @@ -909,7 +904,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_match_failed(self): proto = 
MyProto(loop=self.loop) server, host, port = self._make_ssl_server( @@ -937,7 +931,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') @unittest.skipUnless(hasattr(socket, 'AF_UNIX'), 'No UNIX Sockets') def test_create_unix_server_ssl_verified(self): proto = MyProto(loop=self.loop) @@ -963,7 +956,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_verified(self): proto = MyProto(loop=self.loop) server, host, port = self._make_ssl_server( diff --git a/Lib/test/test_asyncio/test_selector_events.py b/Lib/test/test_asyncio/test_selector_events.py --- a/Lib/test/test_asyncio/test_selector_events.py +++ b/Lib/test/test_asyncio/test_selector_events.py @@ -1408,7 +1408,7 @@ self.assertEqual(tr._conn_lost, 1) self.assertEqual(1, self.loop.remove_reader_count[1]) - @unittest.skipIf(ssl is None or not ssl.HAS_SNI, 'No SNI support') + @unittest.skipIf(ssl is None, 'No SSL support') def test_server_hostname(self): _SelectorSslTransport( self.loop, self.sock, self.protocol, self.sslcontext, diff --git a/Lib/test/test_ftplib.py b/Lib/test/test_ftplib.py --- a/Lib/test/test_ftplib.py +++ b/Lib/test/test_ftplib.py @@ -15,9 +15,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI from unittest import TestCase, skipUnless from test import support @@ -927,7 +924,6 @@ self.client.ccc() self.assertRaises(ValueError, self.client.sock.unwrap) - @skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_check_hostname(self): self.client.quit() ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) diff --git a/Lib/test/test_imaplib.py b/Lib/test/test_imaplib.py --- a/Lib/test/test_imaplib.py +++ b/Lib/test/test_imaplib.py @@ -19,9 +19,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI CERTFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "keycert3.pem") CAFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "pycacert.pem") @@ -387,7 +384,6 @@ imap_class = IMAP4_SSL @reap_threads - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_ssl_verified(self): ssl_context = ssl.SSLContext(ssl.PROTOCOL_SSLv23) ssl_context.verify_mode = ssl.CERT_REQUIRED diff --git a/Lib/test/test_poplib.py b/Lib/test/test_poplib.py --- a/Lib/test/test_poplib.py +++ b/Lib/test/test_poplib.py @@ -21,13 +21,10 @@ SUPPORTS_SSL = False if hasattr(poplib, 'POP3_SSL'): import ssl - from ssl import HAS_SNI SUPPORTS_SSL = True CERTFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "keycert3.pem") CAFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "pycacert.pem") -else: - HAS_SNI = False requires_ssl = skipUnless(SUPPORTS_SSL, 'SSL not supported') @@ -334,7 +331,6 @@ self.assertEqual(resp, expected) @requires_ssl - @skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_stls_context(self): expected = b'+OK Begin TLS negotiation' ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -1428,11 +1428,8 @@ # Same with a server hostname s = ctx.wrap_socket(socket.socket(socket.AF_INET), server_hostname="svn.python.org") - if ssl.HAS_SNI: - s.connect(("svn.python.org", 443)) - s.close() - else: - self.assertRaises(ValueError, s.connect, ("svn.python.org", 443)) + s.connect(("svn.python.org", 443)) + s.close() # This should fail because 
we have no verification certs ctx.verify_mode = ssl.CERT_REQUIRED s = ctx.wrap_socket(socket.socket(socket.AF_INET)) @@ -1696,12 +1693,8 @@ ctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) ctx.verify_mode = ssl.CERT_REQUIRED ctx.load_verify_locations(SVN_PYTHON_ORG_ROOT_CERT) - if ssl.HAS_SNI: - ctx.check_hostname = True - sslobj = ctx.wrap_bio(incoming, outgoing, False, 'svn.python.org') - else: - ctx.check_hostname = False - sslobj = ctx.wrap_bio(incoming, outgoing, False) + ctx.check_hostname = True + sslobj = ctx.wrap_bio(incoming, outgoing, False, 'svn.python.org') self.assertIs(sslobj._sslobj.owner, sslobj) self.assertIsNone(sslobj.cipher()) self.assertRaises(ValueError, sslobj.getpeercert) @@ -2283,7 +2276,6 @@ cert = s.getpeercert() self.assertTrue(cert, "Can't get peer certificate.") - @needs_sni def test_check_hostname(self): if support.verbose: sys.stdout.write("\n") diff --git a/Modules/_ssl.c b/Modules/_ssl.c --- a/Modules/_ssl.c +++ b/Modules/_ssl.c @@ -2922,12 +2922,6 @@ &sock, &server_side, "idna", &hostname)) return NULL; -#if !HAVE_SNI - PyMem_Free(hostname); - PyErr_SetString(PyExc_ValueError, "server_hostname is not supported " - "by your OpenSSL library"); - return NULL; -#endif } res = (PyObject *) newPySSLSocket(self, sock, server_side, hostname, @@ -2955,14 +2949,8 @@ &server_side, &hostname_obj)) return NULL; if (hostname_obj != Py_None) { -#if HAVE_SNI if (!PyArg_Parse(hostname_obj, "et", "idna", &hostname)) return NULL; -#else - PyErr_SetString(PyExc_ValueError, "server_hostname is not supported " - "by your OpenSSL library"); - return NULL; -#endif } res = (PyObject *) newPySSLSocket(self, NULL, server_side, hostname, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 00:06:59 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 23 Nov 2014 23:06:59 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogZG9uJ3QgcmVxdWly?= =?utf-8?q?e_OpenSSL_SNI_to_pass_hostname_to_ssl_functions_=28=2322921=29?= Message-ID: <20141123230654.116324.46636@psf.io> https://hg.python.org/cpython/rev/f2d4beb90a5b changeset: 93557:f2d4beb90a5b branch: 3.4 parent: 93551:3cc8b7227db4 user: Benjamin Peterson date: Sun Nov 23 17:04:34 2014 -0600 summary: don't require OpenSSL SNI to pass hostname to ssl functions (#22921) Patch by Donald Stufft. files: Doc/library/ssl.rst | 14 +++++----- Lib/asyncio/selector_events.py | 2 +- Lib/ftplib.py | 6 +-- Lib/http/client.py | 3 +- Lib/imaplib.py | 6 +-- Lib/nntplib.py | 3 +- Lib/poplib.py | 6 +-- Lib/smtplib.py | 6 +-- Lib/ssl.py | 7 +---- Lib/test/test_asyncio/test_events.py | 8 ----- Lib/test/test_asyncio/test_selector_events.py | 2 +- Lib/test/test_ftplib.py | 4 -- Lib/test/test_imaplib.py | 4 -- Lib/test/test_poplib.py | 4 -- Lib/test/test_ssl.py | 8 +---- Modules/_ssl.c | 6 ---- 16 files changed, 22 insertions(+), 67 deletions(-) diff --git a/Doc/library/ssl.rst b/Doc/library/ssl.rst --- a/Doc/library/ssl.rst +++ b/Doc/library/ssl.rst @@ -664,8 +664,7 @@ .. data:: HAS_SNI Whether the OpenSSL library has built-in support for the *Server Name - Indication* extension (as defined in :rfc:`4366`). When true, you can - use the *server_hostname* argument to :meth:`SSLContext.wrap_socket`. + Indication* extension (as defined in :rfc:`4366`). .. versionadded:: 3.2 @@ -1227,11 +1226,12 @@ On client connections, the optional parameter *server_hostname* specifies the hostname of the service which we are connecting to. 
This allows a single server to host multiple SSL-based services with distinct certificates, - quite similarly to HTTP virtual hosts. Specifying *server_hostname* - will raise a :exc:`ValueError` if the OpenSSL library doesn't have support - for it (that is, if :data:`HAS_SNI` is :const:`False`). Specifying - *server_hostname* will also raise a :exc:`ValueError` if *server_side* - is true. + quite similarly to HTTP virtual hosts. Specifying *server_hostname* will + raise a :exc:`ValueError` if *server_side* is true. + + .. versionchanged:: 3.5 + Always allow a server_hostname to be passed, even if OpenSSL does not + have SNI. .. method:: SSLContext.session_stats() diff --git a/Lib/asyncio/selector_events.py b/Lib/asyncio/selector_events.py --- a/Lib/asyncio/selector_events.py +++ b/Lib/asyncio/selector_events.py @@ -708,7 +708,7 @@ 'server_side': server_side, 'do_handshake_on_connect': False, } - if server_hostname and not server_side and ssl.HAS_SNI: + if server_hostname and not server_side: wrap_kwargs['server_hostname'] = server_hostname sslsock = sslcontext.wrap_socket(rawsock, **wrap_kwargs) diff --git a/Lib/ftplib.py b/Lib/ftplib.py --- a/Lib/ftplib.py +++ b/Lib/ftplib.py @@ -747,9 +747,8 @@ resp = self.voidcmd('AUTH TLS') else: resp = self.voidcmd('AUTH SSL') - server_hostname = self.host if ssl.HAS_SNI else None self.sock = self.context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile(mode='r', encoding=self.encoding) return resp @@ -788,9 +787,8 @@ def ntransfercmd(self, cmd, rest=None): conn, size = FTP.ntransfercmd(self, cmd, rest) if self._prot_p: - server_hostname = self.host if ssl.HAS_SNI else None conn = self.context.wrap_socket(conn, - server_hostname=server_hostname) + server_hostname=self.host) return conn, size def abort(self): diff --git a/Lib/http/client.py b/Lib/http/client.py --- a/Lib/http/client.py +++ b/Lib/http/client.py @@ -1224,10 +1224,9 @@ server_hostname = self._tunnel_host else: server_hostname = self.host - sni_hostname = server_hostname if ssl.HAS_SNI else None self.sock = self._context.wrap_socket(self.sock, - server_hostname=sni_hostname) + server_hostname=server_hostname) if not self._context.check_hostname and self._check_hostname: try: ssl.match_hostname(self.sock.getpeercert(), server_hostname) diff --git a/Lib/imaplib.py b/Lib/imaplib.py --- a/Lib/imaplib.py +++ b/Lib/imaplib.py @@ -745,9 +745,8 @@ ssl_context = ssl._create_stdlib_context() typ, dat = self._simple_command(name) if typ == 'OK': - server_hostname = self.host if ssl.HAS_SNI else None self.sock = ssl_context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile('rb') self._tls_established = True self._get_capabilities() @@ -1223,9 +1222,8 @@ def _create_socket(self): sock = IMAP4._create_socket(self) - server_hostname = self.host if ssl.HAS_SNI else None return self.ssl_context.wrap_socket(sock, - server_hostname=server_hostname) + server_hostname=self.host) def open(self, host='', port=IMAP4_SSL_PORT): """Setup connection to remote server on "host:port". diff --git a/Lib/nntplib.py b/Lib/nntplib.py --- a/Lib/nntplib.py +++ b/Lib/nntplib.py @@ -289,8 +289,7 @@ # Generate a default SSL context if none was passed. 
if context is None: context = ssl._create_stdlib_context() - server_hostname = hostname if ssl.HAS_SNI else None - return context.wrap_socket(sock, server_hostname=server_hostname) + return context.wrap_socket(sock, server_hostname=hostname) # The classes themselves diff --git a/Lib/poplib.py b/Lib/poplib.py --- a/Lib/poplib.py +++ b/Lib/poplib.py @@ -387,9 +387,8 @@ if context is None: context = ssl._create_stdlib_context() resp = self._shortcmd('STLS') - server_hostname = self.host if ssl.HAS_SNI else None self.sock = context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self.host) self.file = self.sock.makefile('rb') self._tls_established = True return resp @@ -430,9 +429,8 @@ def _create_socket(self, timeout): sock = POP3._create_socket(self, timeout) - server_hostname = self.host if ssl.HAS_SNI else None sock = self.context.wrap_socket(sock, - server_hostname=server_hostname) + server_hostname=self.host) return sock def stls(self, keyfile=None, certfile=None, context=None): diff --git a/Lib/smtplib.py b/Lib/smtplib.py --- a/Lib/smtplib.py +++ b/Lib/smtplib.py @@ -684,9 +684,8 @@ if context is None: context = ssl._create_stdlib_context(certfile=certfile, keyfile=keyfile) - server_hostname = self._host if ssl.HAS_SNI else None self.sock = context.wrap_socket(self.sock, - server_hostname=server_hostname) + server_hostname=self._host) self.file = None # RFC 3207: # The client MUST discard any knowledge obtained from @@ -915,9 +914,8 @@ print('connect:', (host, port), file=stderr) new_socket = socket.create_connection((host, port), timeout, self.source_address) - server_hostname = self._host if ssl.HAS_SNI else None new_socket = self.context.wrap_socket(new_socket, - server_hostname=server_hostname) + server_hostname=self._host) return new_socket __all__.append("SMTP_SSL") diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -538,12 +538,7 @@ raise ValueError("server_hostname can only be specified " "in client mode") if self._context.check_hostname and not server_hostname: - if HAS_SNI: - raise ValueError("check_hostname requires server_hostname") - else: - raise ValueError("check_hostname requires server_hostname, " - "but it's not supported by your OpenSSL " - "library") + raise ValueError("check_hostname requires server_hostname") self.server_side = server_side self.server_hostname = server_hostname self.do_handshake_on_connect = do_handshake_on_connect diff --git a/Lib/test/test_asyncio/test_events.py b/Lib/test/test_asyncio/test_events.py --- a/Lib/test/test_asyncio/test_events.py +++ b/Lib/test/test_asyncio/test_events.py @@ -12,9 +12,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI import subprocess import sys import threading @@ -857,7 +854,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_verify_failed(self): proto = MyProto(loop=self.loop) server, host, port = self._make_ssl_server( @@ -882,7 +878,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') @unittest.skipUnless(hasattr(socket, 'AF_UNIX'), 'No UNIX Sockets') def test_create_unix_server_ssl_verify_failed(self): proto = MyProto(loop=self.loop) @@ -909,7 +904,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_match_failed(self): proto = 
MyProto(loop=self.loop) server, host, port = self._make_ssl_server( @@ -937,7 +931,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') @unittest.skipUnless(hasattr(socket, 'AF_UNIX'), 'No UNIX Sockets') def test_create_unix_server_ssl_verified(self): proto = MyProto(loop=self.loop) @@ -963,7 +956,6 @@ server.close() @unittest.skipIf(ssl is None, 'No ssl module') - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_create_server_ssl_verified(self): proto = MyProto(loop=self.loop) server, host, port = self._make_ssl_server( diff --git a/Lib/test/test_asyncio/test_selector_events.py b/Lib/test/test_asyncio/test_selector_events.py --- a/Lib/test/test_asyncio/test_selector_events.py +++ b/Lib/test/test_asyncio/test_selector_events.py @@ -1408,7 +1408,7 @@ self.assertEqual(tr._conn_lost, 1) self.assertEqual(1, self.loop.remove_reader_count[1]) - @unittest.skipIf(ssl is None or not ssl.HAS_SNI, 'No SNI support') + @unittest.skipIf(ssl is None, 'No SSL support') def test_server_hostname(self): _SelectorSslTransport( self.loop, self.sock, self.protocol, self.sslcontext, diff --git a/Lib/test/test_ftplib.py b/Lib/test/test_ftplib.py --- a/Lib/test/test_ftplib.py +++ b/Lib/test/test_ftplib.py @@ -15,9 +15,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI from unittest import TestCase, skipUnless from test import support @@ -927,7 +924,6 @@ self.client.ccc() self.assertRaises(ValueError, self.client.sock.unwrap) - @skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_check_hostname(self): self.client.quit() ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) diff --git a/Lib/test/test_imaplib.py b/Lib/test/test_imaplib.py --- a/Lib/test/test_imaplib.py +++ b/Lib/test/test_imaplib.py @@ -18,9 +18,6 @@ import ssl except ImportError: ssl = None - HAS_SNI = False -else: - from ssl import HAS_SNI CERTFILE = None CAFILE = None @@ -352,7 +349,6 @@ imap_class = IMAP4_SSL @reap_threads - @unittest.skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_ssl_verified(self): ssl_context = ssl.SSLContext(ssl.PROTOCOL_SSLv23) ssl_context.verify_mode = ssl.CERT_REQUIRED diff --git a/Lib/test/test_poplib.py b/Lib/test/test_poplib.py --- a/Lib/test/test_poplib.py +++ b/Lib/test/test_poplib.py @@ -21,13 +21,10 @@ SUPPORTS_SSL = False if hasattr(poplib, 'POP3_SSL'): import ssl - from ssl import HAS_SNI SUPPORTS_SSL = True CERTFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "keycert3.pem") CAFILE = os.path.join(os.path.dirname(__file__) or os.curdir, "pycacert.pem") -else: - HAS_SNI = False requires_ssl = skipUnless(SUPPORTS_SSL, 'SSL not supported') @@ -334,7 +331,6 @@ self.assertEqual(resp, expected) @requires_ssl - @skipUnless(HAS_SNI, 'No SNI support in ssl module') def test_stls_context(self): expected = b'+OK Begin TLS negotiation' ctx = ssl.SSLContext(ssl.PROTOCOL_TLSv1) diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -1281,11 +1281,8 @@ # Same with a server hostname s = ctx.wrap_socket(socket.socket(socket.AF_INET), server_hostname="svn.python.org") - if ssl.HAS_SNI: - s.connect(("svn.python.org", 443)) - s.close() - else: - self.assertRaises(ValueError, s.connect, ("svn.python.org", 443)) + s.connect(("svn.python.org", 443)) + s.close() # This should fail because we have no verification certs ctx.verify_mode = ssl.CERT_REQUIRED s = ctx.wrap_socket(socket.socket(socket.AF_INET)) @@ -2038,7 
+2035,6 @@ cert = s.getpeercert() self.assertTrue(cert, "Can't get peer certificate.") - @needs_sni def test_check_hostname(self): if support.verbose: sys.stdout.write("\n") diff --git a/Modules/_ssl.c b/Modules/_ssl.c --- a/Modules/_ssl.c +++ b/Modules/_ssl.c @@ -2806,12 +2806,6 @@ &sock, &server_side, "idna", &hostname)) return NULL; -#if !HAVE_SNI - PyMem_Free(hostname); - PyErr_SetString(PyExc_ValueError, "server_hostname is not supported " - "by your OpenSSL library"); - return NULL; -#endif } res = (PyObject *) newPySSLSocket(self, sock, server_side, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:10:38 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:10:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_correct_versio?= =?utf-8?q?nchanged_version?= Message-ID: <20141124021037.84295.92859@psf.io> https://hg.python.org/cpython/rev/9ec68665ca7e changeset: 93559:9ec68665ca7e branch: 3.4 parent: 93557:f2d4beb90a5b user: Benjamin Peterson date: Sun Nov 23 20:09:31 2014 -0600 summary: correct versionchanged version files: Doc/library/ssl.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/ssl.rst b/Doc/library/ssl.rst --- a/Doc/library/ssl.rst +++ b/Doc/library/ssl.rst @@ -1229,7 +1229,7 @@ quite similarly to HTTP virtual hosts. Specifying *server_hostname* will raise a :exc:`ValueError` if *server_side* is true. - .. versionchanged:: 3.5 + .. versionchanged:: 3.4.3 Always allow a server_hostname to be passed, even if OpenSSL does not have SNI. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:10:38 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:10:38 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40IChudWxsKQ==?= Message-ID: <20141124021038.55125.22714@psf.io> https://hg.python.org/cpython/rev/fc81a4b381e1 changeset: 93560:fc81a4b381e1 parent: 93558:24dfe7310cc1 parent: 93559:9ec68665ca7e user: Benjamin Peterson date: Sun Nov 23 20:10:25 2014 -0600 summary: merge 3.4 (null) files: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:13:47 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:13:47 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_allow_hostname?= =?utf-8?q?_to_be_passed_to_SSLContext_even_if_OpenSSL_doesn=27t_support_S?= =?utf-8?q?NI?= Message-ID: <20141124021345.116304.82317@psf.io> https://hg.python.org/cpython/rev/ce4073afd992 changeset: 93561:ce4073afd992 branch: 2.7 parent: 93556:a69da17e7060 user: Benjamin Peterson date: Sun Nov 23 20:13:31 2014 -0600 summary: allow hostname to be passed to SSLContext even if OpenSSL doesn't support SNI (closes #22921) Patch from Donald Stufft. files: Doc/library/ssl.rst | 14 +++++++------- Lib/httplib.py | 3 +-- Lib/ssl.py | 7 +------ Lib/test/test_ssl.py | 8 ++------ Modules/_ssl.c | 6 ------ 5 files changed, 11 insertions(+), 27 deletions(-) diff --git a/Doc/library/ssl.rst b/Doc/library/ssl.rst --- a/Doc/library/ssl.rst +++ b/Doc/library/ssl.rst @@ -645,8 +645,7 @@ .. data:: HAS_SNI Whether the OpenSSL library has built-in support for the *Server Name - Indication* extension (as defined in :rfc:`4366`). When true, you can - use the *server_hostname* argument to :meth:`SSLContext.wrap_socket`. + Indication* extension (as defined in :rfc:`4366`). .. 
versionadded:: 2.7.9 @@ -1136,11 +1135,12 @@ On client connections, the optional parameter *server_hostname* specifies the hostname of the service which we are connecting to. This allows a single server to host multiple SSL-based services with distinct certificates, - quite similarly to HTTP virtual hosts. Specifying *server_hostname* - will raise a :exc:`ValueError` if the OpenSSL library doesn't have support - for it (that is, if :data:`HAS_SNI` is :const:`False`). Specifying - *server_hostname* will also raise a :exc:`ValueError` if *server_side* - is true. + quite similarly to HTTP virtual hosts. Specifying *server_hostname* will + raise a :exc:`ValueError` if *server_side* is true. + + .. versionchanged:: 3.5 + Always allow a server_hostname to be passed, even if OpenSSL does not + have SNI. .. method:: SSLContext.session_stats() diff --git a/Lib/httplib.py b/Lib/httplib.py --- a/Lib/httplib.py +++ b/Lib/httplib.py @@ -1214,10 +1214,9 @@ server_hostname = self._tunnel_host else: server_hostname = self.host - sni_hostname = server_hostname if ssl.HAS_SNI else None self.sock = self._context.wrap_socket(self.sock, - server_hostname=sni_hostname) + server_hostname=server_hostname) if not self._context.check_hostname and self._check_hostname: try: ssl.match_hostname(self.sock.getpeercert(), server_hostname) diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -527,12 +527,7 @@ raise ValueError("server_hostname can only be specified " "in client mode") if self._context.check_hostname and not server_hostname: - if HAS_SNI: - raise ValueError("check_hostname requires server_hostname") - else: - raise ValueError("check_hostname requires server_hostname, " - "but it's not supported by your OpenSSL " - "library") + raise ValueError("check_hostname requires server_hostname") self.server_side = server_side self.server_hostname = server_hostname self.do_handshake_on_connect = do_handshake_on_connect diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -1323,11 +1323,8 @@ # Same with a server hostname s = ctx.wrap_socket(socket.socket(socket.AF_INET), server_hostname="svn.python.org") - if ssl.HAS_SNI: - s.connect(("svn.python.org", 443)) - s.close() - else: - self.assertRaises(ValueError, s.connect, ("svn.python.org", 443)) + s.connect(("svn.python.org", 443)) + s.close() # This should fail because we have no verification certs ctx.verify_mode = ssl.CERT_REQUIRED s = ctx.wrap_socket(socket.socket(socket.AF_INET)) @@ -2089,7 +2086,6 @@ cert = s.getpeercert() self.assertTrue(cert, "Can't get peer certificate.") - @needs_sni def test_check_hostname(self): if support.verbose: sys.stdout.write("\n") diff --git a/Modules/_ssl.c b/Modules/_ssl.c --- a/Modules/_ssl.c +++ b/Modules/_ssl.c @@ -2824,12 +2824,6 @@ &sock, &server_side, "idna", &hostname, &ssl_sock)) return NULL; -#if !HAVE_SNI - PyMem_Free(hostname); - PyErr_SetString(PyExc_ValueError, "server_hostname is not supported " - "by your OpenSSL library"); - return NULL; -#endif } res = (PyObject *) newPySSLSocket(self, sock, server_side, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:14:11 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:14:11 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_fix_versioncha?= =?utf-8?q?nged_version?= Message-ID: <20141124021409.55125.71050@psf.io> https://hg.python.org/cpython/rev/e94f407efd76 changeset: 93562:e94f407efd76 branch: 
2.7 user: Benjamin Peterson date: Sun Nov 23 20:13:55 2014 -0600 summary: fix versionchanged version files: Doc/library/ssl.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/ssl.rst b/Doc/library/ssl.rst --- a/Doc/library/ssl.rst +++ b/Doc/library/ssl.rst @@ -1138,7 +1138,7 @@ quite similarly to HTTP virtual hosts. Specifying *server_hostname* will raise a :exc:`ValueError` if *server_side* is true. - .. versionchanged:: 3.5 + .. versionchanged:: 2.7.9 Always allow a server_hostname to be passed, even if OpenSSL does not have SNI. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:17:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:17:23 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_add_NEWS_note_?= =?utf-8?q?for_=2322921?= Message-ID: <20141124021723.116324.31065@psf.io> https://hg.python.org/cpython/rev/060fd5d09063 changeset: 93564:060fd5d09063 branch: 3.4 parent: 93559:9ec68665ca7e user: Benjamin Peterson date: Sun Nov 23 20:15:31 2014 -0600 summary: add NEWS note for #22921 files: Misc/NEWS | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22921: Allow SSLContext to take the *hostname* parameter even if + OpenSSL doesn't support SNI. + - Issue #22894: TestCase.subTest() would cause the test suite to be stopped when in failfast mode, even in the absence of failures. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:17:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:17:23 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141124021723.116320.71861@psf.io> https://hg.python.org/cpython/rev/8cb4d114ae82 changeset: 93565:8cb4d114ae82 parent: 93560:fc81a4b381e1 parent: 93564:060fd5d09063 user: Benjamin Peterson date: Sun Nov 23 20:17:06 2014 -0600 summary: merge 3.4 files: Misc/NEWS | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,9 @@ Library ------- +- Issue #22921: Allow SSLContext to take the *hostname* parameter even if + OpenSSL doesn't support SNI. + - Issue #22894: TestCase.subTest() would cause the test suite to be stopped when in failfast mode, even in the absence of failures. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:17:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:17:23 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_add_NEWS_note_?= =?utf-8?q?for_=2322921?= Message-ID: <20141124021722.84285.31489@psf.io> https://hg.python.org/cpython/rev/40f9e91f3626 changeset: 93563:40f9e91f3626 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 20:15:31 2014 -0600 summary: add NEWS note for #22921 files: Misc/NEWS | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -42,6 +42,9 @@ Library ------- +- Issue #22921: Allow SSLContext to take the *hostname* parameter even if + OpenSSL doesn't support SNI. 
+ - Issue #9003 and #22366: httplib.HTTPSConnection, urllib2.HTTPSHandler and urllib2.urlopen now take optional arguments to allow for server certificate checking, as recommended in public uses of HTTPS. This backport is part of PEP -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:38:29 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:38:29 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI3ODgp?= Message-ID: <20141124023829.116322.39438@psf.io> https://hg.python.org/cpython/rev/ec4d19736b15 changeset: 93567:ec4d19736b15 parent: 93565:8cb4d114ae82 parent: 93566:5864ec6ba484 user: Benjamin Peterson date: Sun Nov 23 20:38:13 2014 -0600 summary: merge 3.4 (#22788) files: Doc/library/logging.handlers.rst | 15 ++++++++++----- Lib/logging/handlers.py | 9 +++++++-- Lib/test/test_logging.py | 19 +++++-------------- Misc/NEWS | 2 ++ 4 files changed, 24 insertions(+), 21 deletions(-) diff --git a/Doc/library/logging.handlers.rst b/Doc/library/logging.handlers.rst --- a/Doc/library/logging.handlers.rst +++ b/Doc/library/logging.handlers.rst @@ -839,17 +839,22 @@ ``POST`` semantics. -.. class:: HTTPHandler(host, url, method='GET', secure=False, credentials=None) +.. class:: HTTPHandler(host, url, method='GET', secure=False, credentials=None, context=None) Returns a new instance of the :class:`HTTPHandler` class. The *host* can be - of the form ``host:port``, should you need to use a specific port number. - If no *method* is specified, ``GET`` is used. If *secure* is true, an HTTPS - connection will be used. If *credentials* is specified, it should be a - 2-tuple consisting of userid and password, which will be placed in an HTTP + of the form ``host:port``, should you need to use a specific port number. If + no *method* is specified, ``GET`` is used. If *secure* is true, a HTTPS + connection will be used. The *context* parameter may be set to a + :class:`ssl.SSLContext` instance to configure the SSL settings used for the + HTTPS connection. If *credentials* is specified, it should be a 2-tuple + consisting of userid and password, which will be placed in a HTTP 'Authorization' header using Basic authentication. If you specify credentials, you should also specify secure=True so that your userid and password are not passed in cleartext across the wire. + .. versionchanged:: 3.4.3 + The *context* parameter was added. + .. method:: mapLogRecord(record) Provides a dictionary, based on ``record``, which is to be URL-encoded diff --git a/Lib/logging/handlers.py b/Lib/logging/handlers.py --- a/Lib/logging/handlers.py +++ b/Lib/logging/handlers.py @@ -1089,7 +1089,8 @@ A class which sends records to a Web server, using either GET or POST semantics. 
""" - def __init__(self, host, url, method="GET", secure=False, credentials=None): + def __init__(self, host, url, method="GET", secure=False, credentials=None, + context=None): """ Initialize the instance with the host, the request URL, and the method ("GET" or "POST") @@ -1098,11 +1099,15 @@ method = method.upper() if method not in ["GET", "POST"]: raise ValueError("method must be GET or POST") + if not secure and context is not None: + raise ValueError("context parameter only makes sense " + "with secure=True") self.host = host self.url = url self.method = method self.secure = secure self.credentials = credentials + self.context = context def mapLogRecord(self, record): """ @@ -1122,7 +1127,7 @@ import http.client, urllib.parse host = self.host if self.secure: - h = http.client.HTTPSConnection(host) + h = http.client.HTTPSConnection(host, context=self.context) else: h = http.client.HTTPConnection(host) url = self.url diff --git a/Lib/test/test_logging.py b/Lib/test/test_logging.py --- a/Lib/test/test_logging.py +++ b/Lib/test/test_logging.py @@ -1663,21 +1663,11 @@ localhost_cert = os.path.join(here, "keycert.pem") sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) sslctx.load_cert_chain(localhost_cert) - # Unfortunately, HTTPHandler doesn't allow us to change the - # SSLContext used by HTTPSConnection, so we have to - # monkeypatch. This can be cleaned up if issue 22788 is - # fixed. - old = ssl._create_default_https_context - def restore_handler(): - ssl._create_default_https_context = old - self.addCleanup(restore_handler) - def hack_create_ctx(): - ctx = old() - ctx.load_verify_locations(localhost_cert) - return ctx - ssl._create_default_https_context = hack_create_ctx + + context = ssl.create_default_context(cafile=localhost_cert) else: sslctx = None + context = None self.server = server = TestHTTPServer(addr, self.handle_request, 0.01, sslctx=sslctx) server.start() @@ -1685,7 +1675,8 @@ host = 'localhost:%d' % server.server_port secure_client = secure and sslctx self.h_hdlr = logging.handlers.HTTPHandler(host, '/frob', - secure=secure_client) + secure=secure_client, + context=context) self.log_data = None root_logger.addHandler(self.h_hdlr) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,8 @@ Library ------- +- Issue #22788: Add *context* parameter to logging.handlers.HTTPHandler. + - Issue #22921: Allow SSLContext to take the *hostname* parameter even if OpenSSL doesn't support SNI. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:38:29 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:38:29 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_add_context_pa?= =?utf-8?q?rameter_to_HTTPHandler_=28closes_=2322788=29?= Message-ID: <20141124023828.55113.13@psf.io> https://hg.python.org/cpython/rev/5864ec6ba484 changeset: 93566:5864ec6ba484 branch: 3.4 parent: 93564:060fd5d09063 user: Benjamin Peterson date: Sun Nov 23 20:36:44 2014 -0600 summary: add context parameter to HTTPHandler (closes #22788) files: Doc/library/logging.handlers.rst | 15 ++++++++++----- Lib/logging/handlers.py | 9 +++++++-- Lib/test/test_logging.py | 19 +++++-------------- Misc/NEWS | 2 ++ 4 files changed, 24 insertions(+), 21 deletions(-) diff --git a/Doc/library/logging.handlers.rst b/Doc/library/logging.handlers.rst --- a/Doc/library/logging.handlers.rst +++ b/Doc/library/logging.handlers.rst @@ -839,17 +839,22 @@ ``POST`` semantics. -.. 
class:: HTTPHandler(host, url, method='GET', secure=False, credentials=None) +.. class:: HTTPHandler(host, url, method='GET', secure=False, credentials=None, context=None) Returns a new instance of the :class:`HTTPHandler` class. The *host* can be - of the form ``host:port``, should you need to use a specific port number. - If no *method* is specified, ``GET`` is used. If *secure* is true, an HTTPS - connection will be used. If *credentials* is specified, it should be a - 2-tuple consisting of userid and password, which will be placed in an HTTP + of the form ``host:port``, should you need to use a specific port number. If + no *method* is specified, ``GET`` is used. If *secure* is true, a HTTPS + connection will be used. The *context* parameter may be set to a + :class:`ssl.SSLContext` instance to configure the SSL settings used for the + HTTPS connection. If *credentials* is specified, it should be a 2-tuple + consisting of userid and password, which will be placed in a HTTP 'Authorization' header using Basic authentication. If you specify credentials, you should also specify secure=True so that your userid and password are not passed in cleartext across the wire. + .. versionchanged:: 3.4.3 + The *context* parameter was added. + .. method:: mapLogRecord(record) Provides a dictionary, based on ``record``, which is to be URL-encoded diff --git a/Lib/logging/handlers.py b/Lib/logging/handlers.py --- a/Lib/logging/handlers.py +++ b/Lib/logging/handlers.py @@ -1089,7 +1089,8 @@ A class which sends records to a Web server, using either GET or POST semantics. """ - def __init__(self, host, url, method="GET", secure=False, credentials=None): + def __init__(self, host, url, method="GET", secure=False, credentials=None, + context=None): """ Initialize the instance with the host, the request URL, and the method ("GET" or "POST") @@ -1098,11 +1099,15 @@ method = method.upper() if method not in ["GET", "POST"]: raise ValueError("method must be GET or POST") + if not secure and context is not None: + raise ValueError("context parameter only makes sense " + "with secure=True") self.host = host self.url = url self.method = method self.secure = secure self.credentials = credentials + self.context = context def mapLogRecord(self, record): """ @@ -1122,7 +1127,7 @@ import http.client, urllib.parse host = self.host if self.secure: - h = http.client.HTTPSConnection(host) + h = http.client.HTTPSConnection(host, context=self.context) else: h = http.client.HTTPConnection(host) url = self.url diff --git a/Lib/test/test_logging.py b/Lib/test/test_logging.py --- a/Lib/test/test_logging.py +++ b/Lib/test/test_logging.py @@ -1667,21 +1667,11 @@ localhost_cert = os.path.join(here, "keycert.pem") sslctx = ssl.SSLContext(ssl.PROTOCOL_SSLv23) sslctx.load_cert_chain(localhost_cert) - # Unfortunately, HTTPHandler doesn't allow us to change the - # SSLContext used by HTTPSConnection, so we have to - # monkeypatch. This can be cleaned up if issue 22788 is - # fixed. 
- old = ssl._create_default_https_context - def restore_handler(): - ssl._create_default_https_context = old - self.addCleanup(restore_handler) - def hack_create_ctx(): - ctx = old() - ctx.load_verify_locations(localhost_cert) - return ctx - ssl._create_default_https_context = hack_create_ctx + + context = ssl.create_default_context(cafile=localhost_cert) else: sslctx = None + context = None self.server = server = TestHTTPServer(addr, self.handle_request, 0.01, sslctx=sslctx) server.start() @@ -1689,7 +1679,8 @@ host = 'localhost:%d' % server.server_port secure_client = secure and sslctx self.h_hdlr = logging.handlers.HTTPHandler(host, '/frob', - secure=secure_client) + secure=secure_client, + context=context) self.log_data = None root_logger.addHandler(self.h_hdlr) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22788: Add *context* parameter to logging.handlers.HTTPHandler. + - Issue #22921: Allow SSLContext to take the *hostname* parameter even if OpenSSL doesn't support SNI. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:38:49 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:38:49 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_update_versionchanged?= Message-ID: <20141124023848.55113.97207@psf.io> https://hg.python.org/cpython/rev/91b4dc856011 changeset: 93568:91b4dc856011 user: Benjamin Peterson date: Sun Nov 23 20:38:37 2014 -0600 summary: update versionchanged files: Doc/library/logging.handlers.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/logging.handlers.rst b/Doc/library/logging.handlers.rst --- a/Doc/library/logging.handlers.rst +++ b/Doc/library/logging.handlers.rst @@ -852,7 +852,7 @@ credentials, you should also specify secure=True so that your userid and password are not passed in cleartext across the wire. - .. versionchanged:: 3.4.3 + .. versionchanged:: 3.5 The *context* parameter was added. .. method:: mapLogRecord(record) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 03:55:41 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 02:55:41 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogZ2l2ZSB1cmxsaWIu?= =?utf-8?q?urlopen_a_context_parameter_=28closes_=2322927=29?= Message-ID: <20141124025537.55121.51077@psf.io> https://hg.python.org/cpython/rev/c84f36a5f556 changeset: 93569:c84f36a5f556 branch: 2.7 parent: 93563:40f9e91f3626 user: Benjamin Peterson date: Sun Nov 23 20:55:24 2014 -0600 summary: give urllib.urlopen a context parameter (closes #22927) files: Doc/library/urllib.rst | 18 ++++++++++++++---- Lib/httplib.py | 5 +++-- Lib/test/test_urllibnet.py | 20 +++++++++++++++++++- Lib/urllib.py | 24 +++++++++++++++--------- Misc/NEWS | 3 +++ 5 files changed, 54 insertions(+), 16 deletions(-) diff --git a/Doc/library/urllib.rst b/Doc/library/urllib.rst --- a/Doc/library/urllib.rst +++ b/Doc/library/urllib.rst @@ -31,7 +31,7 @@ High-level interface -------------------- -.. function:: urlopen(url[, data[, proxies]]) +.. function:: urlopen(url[, data[, proxies[, context]]]) Open a network object denoted by a URL for reading. 
If the URL does not have a scheme identifier, or if it has :file:`file:` as its scheme @@ -122,8 +122,12 @@ filehandle = urllib.urlopen(some_url, proxies=None) filehandle = urllib.urlopen(some_url) - Proxies which require authentication for use are not currently supported; this - is considered an implementation limitation. + Proxies which require authentication for use are not currently supported; + this is considered an implementation limitation. + + The *context* parameter may be set to a :class:`ssl.SSLContext` instance to + configure the SSL settings that are used if :func:`urlopen` makes a HTTPS + connection. .. versionchanged:: 2.3 Added the *proxies* support. @@ -132,6 +136,9 @@ Added :meth:`getcode` to returned object and support for the :envvar:`no_proxy` environment variable. + .. versionchanged:: 2.7.9 + The *context* parameter was added. + .. deprecated:: 2.6 The :func:`urlopen` function has been removed in Python 3 in favor of :func:`urllib2.urlopen`. @@ -292,7 +299,7 @@ URL Opener objects ------------------ -.. class:: URLopener([proxies[, **x509]]) +.. class:: URLopener([proxies[, context[, **x509]]]) Base class for opening and reading URLs. Unless you need to support opening objects using schemes other than :file:`http:`, :file:`ftp:`, or :file:`file:`, @@ -309,6 +316,9 @@ value is ``None``, in which case environmental proxy settings will be used if present, as discussed in the definition of :func:`urlopen`, above. + The *context* parameter may be a :class:`ssl.SSLContext` instance. If given, + it defines the SSL settings the opener uses to make HTTPS connections. + Additional keyword parameters, collected in *x509*, may be used for authentication of the client when using the :file:`https:` scheme. The keywords *key_file* and *cert_file* are supported to provide an SSL key and certificate; diff --git a/Lib/httplib.py b/Lib/httplib.py --- a/Lib/httplib.py +++ b/Lib/httplib.py @@ -1238,14 +1238,15 @@ _connection_class = HTTPSConnection def __init__(self, host='', port=None, key_file=None, cert_file=None, - strict=None): + strict=None, context=None): # provide a default host, pass the X509 cert info # urf. compensate for bad input. if port == 0: port = None self._setup(self._connection_class(host, port, key_file, - cert_file, strict)) + cert_file, strict, + context=context)) # we never actually use these for anything, but we keep them # here for compatibility with post-1.5.2 CVS. diff --git a/Lib/test/test_urllibnet.py b/Lib/test/test_urllibnet.py --- a/Lib/test/test_urllibnet.py +++ b/Lib/test/test_urllibnet.py @@ -7,6 +7,15 @@ import os import time +try: + import ssl +except ImportError: + ssl = None + +here = os.path.dirname(__file__) +# Self-signed cert file for self-signed.pythontest.net +CERT_selfsigned_pythontestdotnet = os.path.join(here, 'selfsigned_pythontestdotnet.pem') + mimetools = test_support.import_module("mimetools", deprecated=True) @@ -195,6 +204,14 @@ self.fail('Date value not in %r format', dateformat) + at unittest.skipIf(ssl is None, "requires ssl") +class urlopen_HttpsTests(unittest.TestCase): + + def test_context_argument(self): + context = ssl.create_default_context(cafile=CERT_selfsigned_pythontestdotnet) + response = urllib.urlopen("https://self-signed.pythontest.net", context=context) + self.assertIn("Python", response.read()) + def test_main(): test_support.requires('network') @@ -202,7 +219,8 @@ ("urllib.urlopen.. 
has been removed", DeprecationWarning)): test_support.run_unittest(URLTimeoutTest, urlopenNetworkTests, - urlretrieveNetworkTests) + urlretrieveNetworkTests, + urlopen_HttpsTests) if __name__ == "__main__": test_main() diff --git a/Lib/urllib.py b/Lib/urllib.py --- a/Lib/urllib.py +++ b/Lib/urllib.py @@ -69,15 +69,15 @@ # Shortcut for basic usage _urlopener = None -def urlopen(url, data=None, proxies=None): +def urlopen(url, data=None, proxies=None, context=None): """Create a file-like object for the specified URL to read from.""" from warnings import warnpy3k warnpy3k("urllib.urlopen() has been removed in Python 3.0 in " "favor of urllib2.urlopen()", stacklevel=2) global _urlopener - if proxies is not None: - opener = FancyURLopener(proxies=proxies) + if proxies is not None or context is not None: + opener = FancyURLopener(proxies=proxies, context=context) elif not _urlopener: opener = FancyURLopener() _urlopener = opener @@ -87,11 +87,15 @@ return opener.open(url) else: return opener.open(url, data) -def urlretrieve(url, filename=None, reporthook=None, data=None): +def urlretrieve(url, filename=None, reporthook=None, data=None, context=None): global _urlopener - if not _urlopener: - _urlopener = FancyURLopener() - return _urlopener.retrieve(url, filename, reporthook, data) + if context is not None: + opener = FancyURLopener(context=context) + elif not _urlopener: + _urlopener = opener = FancyURLopener() + else: + opener = _urlopener + return opener.retrieve(url, filename, reporthook, data) def urlcleanup(): if _urlopener: _urlopener.cleanup() @@ -126,13 +130,14 @@ version = "Python-urllib/%s" % __version__ # Constructor - def __init__(self, proxies=None, **x509): + def __init__(self, proxies=None, context=None, **x509): if proxies is None: proxies = getproxies() assert hasattr(proxies, 'has_key'), "proxies must be a mapping" self.proxies = proxies self.key_file = x509.get('key_file') self.cert_file = x509.get('cert_file') + self.context = context self.addheaders = [('User-Agent', self.version)] self.__tempfiles = [] self.__unlink = os.unlink # See cleanup() @@ -422,7 +427,8 @@ auth = None h = httplib.HTTPS(host, 0, key_file=self.key_file, - cert_file=self.cert_file) + cert_file=self.cert_file, + context=self.context) if data is not None: h.putrequest('POST', selector) h.putheader('Content-Type', diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -42,6 +42,9 @@ Library ------- +- Issue #22927: Allow urllib.urlopen to take a *context* parameter to control + SSL settings for HTTPS connections. + - Issue #22921: Allow SSLContext to take the *hostname* parameter even if OpenSSL doesn't support SNI. 
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 04:02:22 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 03:02:22 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogcGVwIDQ3NjogdmVy?= =?utf-8?q?ify_certificates_by_default_=28=2322417=29?= Message-ID: <20141124030214.69797.92049@psf.io> https://hg.python.org/cpython/rev/fb83916c3ea1 changeset: 93570:fb83916c3ea1 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 21:02:02 2014 -0600 summary: pep 476: verify certificates by default (#22417) files: Doc/library/httplib.rst | 8 +++-- Doc/library/xmlrpclib.rst | 7 ++-- Doc/whatsnew/2.7.rst | 23 ++++++++++++++++ Lib/httplib.py | 2 +- Lib/ssl.py | 11 ++++++- Lib/test/test_httplib.py | 3 +- Lib/test/test_urllib2_localnet.py | 27 +++++++++++++++++- Misc/NEWS | 2 + 8 files changed, 69 insertions(+), 14 deletions(-) diff --git a/Doc/library/httplib.rst b/Doc/library/httplib.rst --- a/Doc/library/httplib.rst +++ b/Doc/library/httplib.rst @@ -90,9 +90,6 @@ server's certificate. If you want to change that behaviour, you can explicitly set *check_hostname* to False. - .. warning:: - This does not do any verification of the server's certificate. - .. versionadded:: 2.0 .. versionchanged:: 2.6 @@ -104,6 +101,11 @@ .. versionchanged:: 2.7.9 *context* and *check_hostname* was added. + This class now performs all the necessary certificate and hostname checks + by default. To revert to the previous, unverified, behavior + :func:`ssl._create_unverified_context` can be passed to the *context* + parameter. + .. class:: HTTPResponse(sock, debuglevel=0, strict=0) diff --git a/Doc/library/xmlrpclib.rst b/Doc/library/xmlrpclib.rst --- a/Doc/library/xmlrpclib.rst +++ b/Doc/library/xmlrpclib.rst @@ -34,11 +34,10 @@ constructed data. If you need to parse untrusted or unauthenticated data see :ref:`xml-vulnerabilities`. -.. warning:: +.. versionchanged:: 2.7.9 - In the case of https URIs, :mod:`xmlrpclib` does not do any verification of - the server's certificate. - + For https URIs, :mod:`xmlrpclib` now performs all the necessary certificate + and hostname checks by default .. class:: ServerProxy(uri[, transport[, encoding[, verbose[, allow_none[, use_datetime]]]]]) diff --git a/Doc/whatsnew/2.7.rst b/Doc/whatsnew/2.7.rst --- a/Doc/whatsnew/2.7.rst +++ b/Doc/whatsnew/2.7.rst @@ -2646,6 +2646,29 @@ PEP written by Donald Stufft and Nick Coghlan, implemented by Donald Stufft, Nick Coghlan, Martin von L?wis and Ned Deily. +PEP 476: Enabling certificate verification by default for stdlib http clients +----------------------------------------------------------------------------- + +:mod:`httplib` and modules which use it, such as :mod:`urllib2` and +:mod:`xmlrpclib`, will now verify that the server presents a certificate +which is signed by a CA in the platform trust store and whose hostname matches +the hostname being requested by default, significantly improving security for +many applications. + +For applications which require the old previous behavior, they can pass an +alternate context:: + + import urllib2 + import ssl + + # This disables all verification + context = ssl._create_unverified_context() + + # This allows using a specific certificate for the host, which doesn't need + # to be in the trust store + context = ssl.create_default_context(cafile="/path/to/file.crt") + + urllib2.urlopen("https://invalid-cert", context=context) .. 
====================================================================== diff --git a/Lib/httplib.py b/Lib/httplib.py --- a/Lib/httplib.py +++ b/Lib/httplib.py @@ -1193,7 +1193,7 @@ self.key_file = key_file self.cert_file = cert_file if context is None: - context = ssl.create_default_context() + context = ssl._create_default_https_context() will_verify = context.verify_mode != ssl.CERT_NONE if check_hostname is None: check_hostname = will_verify diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -427,8 +427,7 @@ context.load_default_certs(purpose) return context - -def _create_stdlib_context(protocol=PROTOCOL_SSLv23, cert_reqs=None, +def _create_unverified_context(protocol=PROTOCOL_SSLv23, cert_reqs=None, check_hostname=False, purpose=Purpose.SERVER_AUTH, certfile=None, keyfile=None, cafile=None, capath=None, cadata=None): @@ -469,6 +468,14 @@ return context +# Used by http.client if no context is explicitly passed. +_create_default_https_context = create_default_context + + +# Backwards compatibility alias, even though it's not a public name. +_create_stdlib_context = _create_unverified_context + + class SSLSocket(socket): """This class implements a subtype of socket.socket that wraps the underlying OS socket in an SSL context when necessary, and diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -1,10 +1,9 @@ import httplib import array -import httplib -import os import StringIO import socket import errno +import os import unittest TestCase = unittest.TestCase diff --git a/Lib/test/test_urllib2_localnet.py b/Lib/test/test_urllib2_localnet.py --- a/Lib/test/test_urllib2_localnet.py +++ b/Lib/test/test_urllib2_localnet.py @@ -5,6 +5,7 @@ import BaseHTTPServer import unittest import hashlib +import ssl from test import test_support @@ -562,15 +563,37 @@ cafile=CERT_localhost) self.assertEqual(data, b"we care a bit") # Bad cert - with self.assertRaises(urllib2.URLError) as cm: + with self.assertRaises(urllib2.URLError): self.urlopen("https://localhost:%s/bizarre" % handler.port, cafile=CERT_fakehostname) # Good cert, but mismatching hostname handler = self.start_https_server(certfile=CERT_fakehostname) - with self.assertRaises(ssl.CertificateError) as cm: + with self.assertRaises(ssl.CertificateError): self.urlopen("https://localhost:%s/bizarre" % handler.port, cafile=CERT_fakehostname) + def test_https_with_cadefault(self): + handler = self.start_https_server(certfile=CERT_localhost) + # Self-signed cert should fail verification with system certificate store + with self.assertRaises(urllib2.URLError): + self.urlopen("https://localhost:%s/bizarre" % handler.port, + cadefault=True) + + def test_https_sni(self): + if ssl is None: + self.skipTest("ssl module required") + if not ssl.HAS_SNI: + self.skipTest("SNI support required in OpenSSL") + sni_name = [None] + def cb_sni(ssl_sock, server_name, initial_context): + sni_name[0] = server_name + context = ssl.SSLContext(ssl.PROTOCOL_TLSv1) + context.set_servername_callback(cb_sni) + handler = self.start_https_server(context=context, certfile=CERT_localhost) + context = ssl.create_default_context(cafile=CERT_localhost) + self.urlopen("https://localhost:%s" % handler.port, context=context) + self.assertEqual(sni_name[0], "localhost") + def test_sending_headers(self): handler = self.start_server([(200, [], "we don't care")]) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -42,6 +42,8 @@ Library ------- +- Issue #22417: Verify 
certificates by default in httplib (PEP 476). + - Issue #22927: Allow urllib.urlopen to take a *context* parameter to control SSL settings for HTTPS connections. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 04:05:54 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 03:05:54 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_mark_476_finished?= Message-ID: <20141124030554.84295.65488@psf.io> https://hg.python.org/peps/rev/aa68cfb92e9e changeset: 5611:aa68cfb92e9e user: Benjamin Peterson date: Sun Nov 23 21:05:32 2014 -0600 summary: mark 476 finished files: pep-0476.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0476.txt b/pep-0476.txt --- a/pep-0476.txt +++ b/pep-0476.txt @@ -3,7 +3,7 @@ Version: $Revision$ Last-Modified: $Date$ Author: Alex Gaynor -Status: Accepted +Status: Final Type: Standards Track Content-Type: text/x-rst Created: 28-August-2014 -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Mon Nov 24 05:03:10 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 04:03:10 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogc2tpcCB0ZXN0X2dk?= =?utf-8?q?b_on_OpenIndiana?= Message-ID: <20141124040259.55109.46471@psf.io> https://hg.python.org/cpython/rev/38acbe503145 changeset: 93571:38acbe503145 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 22:02:47 2014 -0600 summary: skip test_gdb on OpenIndiana files: Lib/test/test_gdb.py | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_gdb.py b/Lib/test/test_gdb.py --- a/Lib/test/test_gdb.py +++ b/Lib/test/test_gdb.py @@ -25,6 +25,9 @@ if gdb_major_version < 7: raise unittest.SkipTest("gdb versions before 7.0 didn't support python embedding" " Saw:\n" + gdb_version) +if sys.platform == "solaris": + raise unittest.SkipTest("test doesn't work very well on Solaris") + # Location of custom hooks file in a repository checkout. 
checkout_hook_path = os.path.join(os.path.dirname(sys.executable), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 05:23:11 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 04:23:11 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_loosen_solaris?= =?utf-8?q?_test?= Message-ID: <20141124042310.69779.90363@psf.io> https://hg.python.org/cpython/rev/f0cc690f9d33 changeset: 93572:f0cc690f9d33 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 22:22:59 2014 -0600 summary: loosen solaris test files: Lib/test/test_gdb.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_gdb.py b/Lib/test/test_gdb.py --- a/Lib/test/test_gdb.py +++ b/Lib/test/test_gdb.py @@ -25,7 +25,7 @@ if gdb_major_version < 7: raise unittest.SkipTest("gdb versions before 7.0 didn't support python embedding" " Saw:\n" + gdb_version) -if sys.platform == "solaris": +if sys.platform.startswith("solaris"): raise unittest.SkipTest("test doesn't work very well on Solaris") -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 05:34:17 2014 From: python-checkins at python.org (benjamin.peterson) Date: Mon, 24 Nov 2014 04:34:17 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_is_OpenIndiana?= =?utf-8?q?_actually_sunos=3F?= Message-ID: <20141124043416.116316.56897@psf.io> https://hg.python.org/cpython/rev/d1b4e523a163 changeset: 93573:d1b4e523a163 branch: 2.7 user: Benjamin Peterson date: Sun Nov 23 22:34:04 2014 -0600 summary: is OpenIndiana actually sunos? files: Lib/test/test_gdb.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_gdb.py b/Lib/test/test_gdb.py --- a/Lib/test/test_gdb.py +++ b/Lib/test/test_gdb.py @@ -25,7 +25,7 @@ if gdb_major_version < 7: raise unittest.SkipTest("gdb versions before 7.0 didn't support python embedding" " Saw:\n" + gdb_version) -if sys.platform.startswith("solaris"): +if sys.platform.startswith("sunos"): raise unittest.SkipTest("test doesn't work very well on Solaris") -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 05:56:22 2014 From: python-checkins at python.org (ned.deily) Date: Mon, 24 Nov 2014 04:56:22 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Fix_faulty_ind?= =?utf-8?q?ent=2E?= Message-ID: <20141124045622.126778.48672@psf.io> https://hg.python.org/cpython/rev/41ea764e8321 changeset: 93574:41ea764e8321 branch: 2.7 user: Ned Deily date: Sun Nov 23 20:55:55 2014 -0800 summary: Fix faulty indent. files: Doc/library/urllib2.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/urllib2.rst b/Doc/library/urllib2.rst --- a/Doc/library/urllib2.rst +++ b/Doc/library/urllib2.rst @@ -38,7 +38,7 @@ The optional *timeout* parameter specifies a timeout in seconds for blocking operations like the connection attempt (if not specified, the global default timeout setting will be used). This actually only works for HTTP, HTTPS and - FTP connections. + FTP connections. If *context* is specified, it must be a :class:`ssl.SSLContext` instance describing the various SSL options. 
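Taken together with the PEP 476 change recorded above, a hedged sketch of how
2.7.9 code might opt a single connection back out of certificate verification
(the host name is made up; ssl._create_unverified_context is the private helper
introduced by that patch)::

    import ssl
    import httplib

    # Explicitly request the old, unverified behaviour for this connection only.
    ctx = ssl._create_unverified_context()
    conn = httplib.HTTPSConnection("self-signed.example.net", context=ctx)
    conn.request("GET", "/")
    print conn.getresponse().status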
See :class:`~httplib.HTTPSConnection` for -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Mon Nov 24 10:31:59 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Mon, 24 Nov 2014 10:31:59 +0100 Subject: [Python-checkins] Daily reference leaks (8cb4d114ae82): sum=1 Message-ID: results for 8cb4d114ae82 on branch "default" -------------------------------------------- test_collections leaked [-2, -2, 2] references, sum=-2 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog72Ezzs', '-x'] From python-checkins at python.org Mon Nov 24 22:26:03 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 24 Nov 2014 21:26:03 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322934=3A_Update_t?= =?utf-8?q?he_comment_to_mention_Programs/=5Ffreeze=5Fimportlib=2Ec=2E?= Message-ID: <20141124212554.126774.19937@psf.io> https://hg.python.org/cpython/rev/0ddcc455e001 changeset: 93575:0ddcc455e001 parent: 93568:91b4dc856011 user: Berker Peksag date: Mon Nov 24 23:26:08 2014 +0200 summary: Issue #22934: Update the comment to mention Programs/_freeze_importlib.c. files: Programs/_freeze_importlib.c | 2 +- Python/importlib.h | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Programs/_freeze_importlib.c b/Programs/_freeze_importlib.c --- a/Programs/_freeze_importlib.c +++ b/Programs/_freeze_importlib.c @@ -28,7 +28,7 @@ const struct _frozen *PyImport_FrozenModules; #endif -const char header[] = "/* Auto-generated by Modules/_freeze_importlib.c */"; +const char header[] = "/* Auto-generated by Programs/_freeze_importlib.c */"; int main(int argc, char *argv[]) diff --git a/Python/importlib.h b/Python/importlib.h --- a/Python/importlib.h +++ b/Python/importlib.h [stripped] -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 22:46:58 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 24 Nov 2014 21:46:58 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIwMzUx?= =?utf-8?q?=3A_Add_examples_for_csv=2EDictReader_and_csv=2EDictWriter=2E?= Message-ID: <20141124214651.116308.16284@psf.io> https://hg.python.org/cpython/rev/268ceaa78cf9 changeset: 93576:268ceaa78cf9 branch: 3.4 parent: 93566:5864ec6ba484 user: Berker Peksag date: Mon Nov 24 23:46:30 2014 +0200 summary: Issue #20351: Add examples for csv.DictReader and csv.DictWriter. Patch by Charles-Axel Dein. files: Doc/library/csv.rst | 25 +++++++++++++++++++++++++ 1 files changed, 25 insertions(+), 0 deletions(-) diff --git a/Doc/library/csv.rst b/Doc/library/csv.rst --- a/Doc/library/csv.rst +++ b/Doc/library/csv.rst @@ -158,6 +158,18 @@ the optional *restval* parameter. Any other optional or keyword arguments are passed to the underlying :class:`reader` instance. + A short usage example:: + + >>> import csv + >>> with open('names.csv') as csvfile: + ... reader = csv.DictReader(csvfile) + ... for row in reader: + ... print(row['first_name'], row['last_name']) + ... + Baked Beans + Lovely Spam + Wonderful Spam + .. class:: DictWriter(csvfile, fieldnames, restval='', extrasaction='raise', \ dialect='excel', *args, **kwds) @@ -180,6 +192,19 @@ objects are not ordered, there is not enough information available to deduce the order in which the row should be written to the *csvfile*. 
+ A short usage example:: + + import csv + + with open('names.csv', 'w') as csvfile: + fieldnames = ['first_name', 'last_name'] + writer = csv.DictWriter(csvfile, fieldnames=fieldnames) + + writer.writeheader() + writer.writerow({'first_name': 'Baked', 'last_name': 'Beans'}) + writer.writerow({'first_name': 'Lovely', 'last_name': 'Spam'}) + writer.writerow({'first_name': 'Wonderful', 'last_name': 'Spam'}) + .. class:: Dialect -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 22:46:58 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 24 Nov 2014 21:46:58 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2320351=3A_Add_examples_for_csv=2EDictReader_and_?= =?utf-8?q?csv=2EDictWriter=2E?= Message-ID: <20141124214651.126780.74929@psf.io> https://hg.python.org/cpython/rev/c2b36196b7f5 changeset: 93577:c2b36196b7f5 parent: 93575:0ddcc455e001 parent: 93576:268ceaa78cf9 user: Berker Peksag date: Mon Nov 24 23:47:06 2014 +0200 summary: Issue #20351: Add examples for csv.DictReader and csv.DictWriter. Patch by Charles-Axel Dein. files: Doc/library/csv.rst | 25 +++++++++++++++++++++++++ 1 files changed, 25 insertions(+), 0 deletions(-) diff --git a/Doc/library/csv.rst b/Doc/library/csv.rst --- a/Doc/library/csv.rst +++ b/Doc/library/csv.rst @@ -159,6 +159,18 @@ the optional *restval* parameter. Any other optional or keyword arguments are passed to the underlying :class:`reader` instance. + A short usage example:: + + >>> import csv + >>> with open('names.csv') as csvfile: + ... reader = csv.DictReader(csvfile) + ... for row in reader: + ... print(row['first_name'], row['last_name']) + ... + Baked Beans + Lovely Spam + Wonderful Spam + .. class:: DictWriter(csvfile, fieldnames, restval='', extrasaction='raise', \ dialect='excel', *args, **kwds) @@ -181,6 +193,19 @@ objects are not ordered, there is not enough information available to deduce the order in which the row should be written to the *csvfile*. + A short usage example:: + + import csv + + with open('names.csv', 'w') as csvfile: + fieldnames = ['first_name', 'last_name'] + writer = csv.DictWriter(csvfile, fieldnames=fieldnames) + + writer.writeheader() + writer.writerow({'first_name': 'Baked', 'last_name': 'Beans'}) + writer.writerow({'first_name': 'Lovely', 'last_name': 'Spam'}) + writer.writerow({'first_name': 'Wonderful', 'last_name': 'Spam'}) + .. class:: Dialect -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 22:50:35 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 24 Nov 2014 21:50:35 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIwMzUx?= =?utf-8?q?=3A_Add_examples_for_csv=2EDictReader_and_csv=2EDictWriter=2E?= Message-ID: <20141124215032.84275.32023@psf.io> https://hg.python.org/cpython/rev/e504c3bc6897 changeset: 93578:e504c3bc6897 branch: 2.7 parent: 93574:41ea764e8321 user: Berker Peksag date: Mon Nov 24 23:50:46 2014 +0200 summary: Issue #20351: Add examples for csv.DictReader and csv.DictWriter. Patch by Charles-Axel Dein. files: Doc/library/csv.rst | 25 +++++++++++++++++++++++++ 1 files changed, 25 insertions(+), 0 deletions(-) diff --git a/Doc/library/csv.rst b/Doc/library/csv.rst --- a/Doc/library/csv.rst +++ b/Doc/library/csv.rst @@ -180,6 +180,18 @@ of the optional *restval* parameter. Any other optional or keyword arguments are passed to the underlying :class:`reader` instance. 
+ A short usage example:: + + >>> import csv + >>> with open('names.csv') as csvfile: + ... reader = csv.DictReader(csvfile) + ... for row in reader: + ... print(row['first_name'], row['last_name']) + ... + Baked Beans + Lovely Spam + Wonderful Spam + .. class:: DictWriter(csvfile, fieldnames, restval='', extrasaction='raise', \ dialect='excel', *args, **kwds) @@ -202,6 +214,19 @@ objects are not ordered, there is not enough information available to deduce the order in which the row should be written to the *csvfile*. + A short usage example:: + + import csv + + with open('names.csv', 'w') as csvfile: + fieldnames = ['first_name', 'last_name'] + writer = csv.DictWriter(csvfile, fieldnames=fieldnames) + + writer.writeheader() + writer.writerow({'first_name': 'Baked', 'last_name': 'Beans'}) + writer.writerow({'first_name': 'Lovely', 'last_name': 'Spam'}) + writer.writerow({'first_name': 'Wonderful', 'last_name': 'Spam'}) + .. class:: Dialect -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Mon Nov 24 22:56:53 2014 From: python-checkins at python.org (berker.peksag) Date: Mon, 24 Nov 2014 21:56:53 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE2MDU2?= =?utf-8?q?=3A_Rename_test_methods_to_avoid_conflict=2E?= Message-ID: <20141124215650.69781.96246@psf.io> https://hg.python.org/cpython/rev/fd786e4e331c changeset: 93579:fd786e4e331c branch: 2.7 user: Berker Peksag date: Mon Nov 24 23:57:00 2014 +0200 summary: Issue #16056: Rename test methods to avoid conflict. files: Lib/test/test_ftplib.py | 4 -- Lib/test/test_unicode.py | 2 +- Lib/test/test_weakset.py | 54 ---------------------------- 3 files changed, 1 insertions(+), 59 deletions(-) diff --git a/Lib/test/test_ftplib.py b/Lib/test/test_ftplib.py --- a/Lib/test/test_ftplib.py +++ b/Lib/test/test_ftplib.py @@ -484,10 +484,6 @@ dir = self.client.cwd('/foo') self.assertEqual(dir, '250 cwd ok') - def test_mkd(self): - dir = self.client.mkd('/foo') - self.assertEqual(dir, '/foo') - def test_pwd(self): dir = self.client.pwd() self.assertEqual(dir, 'pwd ok') diff --git a/Lib/test/test_unicode.py b/Lib/test/test_unicode.py --- a/Lib/test/test_unicode.py +++ b/Lib/test/test_unicode.py @@ -484,7 +484,7 @@ u'X\U00010427X\U00010427') @requires_wide_build - def test_capitalize(self): + def test_capitalize_wide_build(self): string_tests.CommonTest.test_capitalize(self) self.assertEqual(u'\U0001044F'.capitalize(), u'\U00010427') self.assertEqual(u'\U0001044F\U0001044F'.capitalize(), diff --git a/Lib/test/test_weakset.py b/Lib/test/test_weakset.py --- a/Lib/test/test_weakset.py +++ b/Lib/test/test_weakset.py @@ -11,7 +11,6 @@ import collections import gc import contextlib -from UserString import UserString as ustr class Foo: @@ -449,59 +448,6 @@ self.assertGreaterEqual(n2, 0) self.assertLessEqual(n2, n1) - def test_weak_destroy_while_iterating(self): - # Issue #7105: iterators shouldn't crash when a key is implicitly removed - # Create new items to be sure no-one else holds a reference - items = [ustr(c) for c in ('a', 'b', 'c')] - s = WeakSet(items) - it = iter(s) - next(it) # Trigger internal iteration - # Destroy an item - del items[-1] - gc.collect() # just in case - # We have removed either the first consumed items, or another one - self.assertIn(len(list(it)), [len(items), len(items) - 1]) - del it - # The removal has been committed - self.assertEqual(len(s), len(items)) - - def test_weak_destroy_and_mutate_while_iterating(self): - # Issue #7105: iterators shouldn't crash when a key is 
implicitly removed - items = [ustr(c) for c in string.ascii_letters] - s = WeakSet(items) - @contextlib.contextmanager - def testcontext(): - try: - it = iter(s) - # Start iterator - yielded = ustr(str(next(it))) - # Schedule an item for removal and recreate it - u = ustr(str(items.pop())) - if yielded == u: - # The iterator still has a reference to the removed item, - # advance it (issue #20006). - next(it) - gc.collect() # just in case - yield u - finally: - it = None # should commit all removals - - with testcontext() as u: - self.assertFalse(u in s) - with testcontext() as u: - self.assertRaises(KeyError, s.remove, u) - self.assertFalse(u in s) - with testcontext() as u: - s.add(u) - self.assertTrue(u in s) - t = s.copy() - with testcontext() as u: - s.update(t) - self.assertEqual(len(s), len(t)) - with testcontext() as u: - s.clear() - self.assertEqual(len(s), 0) - def test_main(verbose=None): test_support.run_unittest(TestWeakSet) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 03:09:01 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 02:09:01 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_dl-files_has_a_new_hostname?= Message-ID: <20141125020858.126768.16006@psf.io> https://hg.python.org/peps/rev/7417d67f0750 changeset: 5612:7417d67f0750 user: Benjamin Peterson date: Mon Nov 24 20:08:44 2014 -0600 summary: dl-files has a new hostname files: pep-0101.txt | 22 +++++++++++----------- 1 files changed, 11 insertions(+), 11 deletions(-) diff --git a/pep-0101.txt b/pep-0101.txt --- a/pep-0101.txt +++ b/pep-0101.txt @@ -35,7 +35,7 @@ which hopefully will be on the "web of trust" with at least one of the other release managers. - * Access to ``dl-files.psf.io``, the server that hosts download files. + * Access to ``dl-files.iad1.psf.io``, the server that hosts download files. You'll be uploading files directly here. * Shell access to ``hg.python.org``, the Python Mercurial host. You'll @@ -335,11 +335,11 @@ - Now he runs msi.py with ActivePython or Python with pywin32. The WE checksums the files (*.msi, *.chm, *-pdb.zip), uploads them to - dl-files.psf.io together with gpg signature files, and emails you the + dl-files.iad1.psf.io together with gpg signature files, and emails you the location and md5sums. - ___ The ME builds Mac installer packages and uploads them to dl-files.psf.io - together with gpg signature files. + ___ The ME builds Mac installer packages and uploads them to + dl-files.iad1.psf.io together with gpg signature files. ___ Time to build the source tarball. Be sure to update your clone to the correct branch. E.g. @@ -367,7 +367,7 @@ tarballs and signatures in a subdirectory called 'X.Y.ZaN/src', and the built docs in 'X.Y.ZaN/docs' (for final releases). - ___ scp or rsync all the files to your home directory on dl-files.psf.io. + ___ scp or rsync all the files to your home directory on dl-files.iad1.psf.io. While you're waiting for the files to finish uploading, you can continue on with the remaining tasks. You can also ask folks on #python-dev @@ -401,13 +401,13 @@ freshly unpacked directory looks weird, you better stop now and figure out what the problem is. - ___ Now you need to go to dl-files.psf.io and move all the files in - place over there. Our policy is that every Python version gets its own + ___ Now you need to go to dl-files.iad1.psf.io and move all the files in place + over there. 
Our policy is that every Python version gets its own directory, but each directory contains all releases of that version. - ___ On dl-files.psf.io, cd /srv/www.python.org/ftp/python/X.Y.Z creating - it if necessary. Make sure it is owned by group 'downloads' and - group-writable. + ___ On dl-files.iad1.psf.io, cd /srv/www.python.org/ftp/python/X.Y.Z + creating it if necessary. Make sure it is owned by group 'downloads' + and group-writable. ___ Move the release .tgz, and .tar.xz files into place, as well as the .asc GPG signature files. The Win/Mac binaries are usually put there @@ -498,7 +498,7 @@ production release" paragraph as appropriate Note, you don't have to copy any release files into this directory; - they only live on dl-files.psf.io in the ftp directory. + they only live on dl-files.iad1.psf.io in the ftp directory. ___ Edit `download/releases/content.ht` to update the version numbers for this release. There are a bunch of places you need to touch: -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Tue Nov 25 06:25:43 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 05:25:43 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogZGVidWdnaW5nOiBw?= =?utf-8?q?rint_ca_certs_loaded_into_default_ctx?= Message-ID: <20141125052540.126770.19317@psf.io> https://hg.python.org/cpython/rev/28fecaa8a74c changeset: 93580:28fecaa8a74c branch: 2.7 user: Benjamin Peterson date: Mon Nov 24 23:25:29 2014 -0600 summary: debugging: print ca certs loaded into default ctx files: Lib/test/test_httplib.py | 3 +++ 1 files changed, 3 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -554,6 +554,9 @@ def test_networked_trusted_by_default_cert(self): # Default settings: requires a valid cert from a trusted CA test_support.requires('network') + if test_support.verbose: + import ssl + print(ssl._create_default_https_context().get_ca_certs()) with test_support.transient_internet('www.python.org'): h = httplib.HTTPSConnection('www.python.org', 443) h.request('GET', '/') -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Tue Nov 25 10:33:19 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Tue, 25 Nov 2014 10:33:19 +0100 Subject: [Python-checkins] Daily reference leaks (c2b36196b7f5): sum=3 Message-ID: results for c2b36196b7f5 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogj3EMlb', '-x'] From python-checkins at python.org Tue Nov 25 13:14:28 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Tue, 25 Nov 2014 12:14:28 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2319676=3A_Added_th?= =?utf-8?q?e_=22namereplace=22_error_handler=2E?= Message-ID: <20141125121330.84283.66481@psf.io> https://hg.python.org/cpython/rev/32d08aacffe0 changeset: 93581:32d08aacffe0 parent: 93577:c2b36196b7f5 user: Serhiy Storchaka date: Tue Nov 25 13:57:17 2014 +0200 summary: Issue #19676: Added the "namereplace" error handler. 
files: Doc/c-api/codec.rst | 5 + Doc/howto/unicode.rst | 7 +- Doc/library/codecs.rst | 17 +++ Doc/library/functions.rst | 3 + Doc/library/io.rst | 7 +- Include/codecs.h | 3 + Lib/codecs.py | 3 + Lib/test/test_codeccallbacks.py | 100 ++++++++++++++++++- Lib/test/test_codecs.py | 7 + Misc/NEWS | 2 + Python/codecs.c | 108 ++++++++++++++++++++ 11 files changed, 255 insertions(+), 7 deletions(-) diff --git a/Doc/c-api/codec.rst b/Doc/c-api/codec.rst --- a/Doc/c-api/codec.rst +++ b/Doc/c-api/codec.rst @@ -116,3 +116,8 @@ Replace the unicode encode error with backslash escapes (``\x``, ``\u`` and ``\U``). +.. c:function:: PyObject* PyCodec_NameReplaceErrors(PyObject *exc) + + Replace the unicode encode error with `\N{...}` escapes. + + .. versionadded: 3.4 diff --git a/Doc/howto/unicode.rst b/Doc/howto/unicode.rst --- a/Doc/howto/unicode.rst +++ b/Doc/howto/unicode.rst @@ -325,8 +325,9 @@ :meth:`~bytes.decode` method but supports a few more possible handlers. As well as ``'strict'``, ``'ignore'``, and ``'replace'`` (which in this case inserts a question mark instead of the unencodable character), there is -also ``'xmlcharrefreplace'`` (inserts an XML character reference) and -``backslashreplace`` (inserts a ``\uNNNN`` escape sequence). +also ``'xmlcharrefreplace'`` (inserts an XML character reference), +``backslashreplace`` (inserts a ``\uNNNN`` escape sequence) and +``namereplace`` (inserts a ``\N{...}`` escape sequence). The following example shows the different results:: @@ -346,6 +347,8 @@ b'ꀀabcd޴' >>> u.encode('ascii', 'backslashreplace') b'\\ua000abcd\\u07b4' + >>> u.encode('ascii', 'namereplace') + b'\\N{YI SYLLABLE IT}abcd\\u07b4' The low-level routines for registering and accessing the available encodings are found in the :mod:`codecs` module. Implementing new diff --git a/Doc/library/codecs.rst b/Doc/library/codecs.rst --- a/Doc/library/codecs.rst +++ b/Doc/library/codecs.rst @@ -98,6 +98,8 @@ reference (for encoding only) * ``'backslashreplace'``: replace with backslashed escape sequences (for encoding only) + * ``'namereplace'``: replace with ``\N{...}`` escape sequences (for + encoding only) * ``'surrogateescape'``: on decoding, replace with code points in the Unicode Private Use Area ranging from U+DC80 to U+DCFF. These private code points will then be turned back into the same bytes when the @@ -232,6 +234,11 @@ Implements the ``backslashreplace`` error handling (for encoding only): the unencodable character is replaced by a backslashed escape sequence. +.. function:: namereplace_errors(exception) + + Implements the ``namereplace`` error handling (for encoding only): the + unencodable character is replaced by a ``\N{...}`` escape sequence. + To simplify working with encoded files or stream, the module also defines these utility functions: @@ -363,6 +370,9 @@ | ``'backslashreplace'`` | Replace with backslashed escape sequences | | | (only for encoding). | +-------------------------+-----------------------------------------------+ +| ``'namereplace'`` | Replace with ``\N{...}`` escape sequences | +| | (only for encoding). | ++-------------------------+-----------------------------------------------+ | ``'surrogateescape'`` | Replace byte with surrogate U+DCxx, as defined| | | in :pep:`383`. | +-------------------------+-----------------------------------------------+ @@ -384,6 +394,9 @@ .. versionchanged:: 3.4 The ``'surrogatepass'`` error handlers now works with utf-16\* and utf-32\* codecs. +.. versionadded:: 3.4 + The ``'namereplace'`` error handler. 
+ The set of allowed values can be extended via :meth:`register_error`. @@ -477,6 +490,8 @@ * ``'backslashreplace'`` Replace with backslashed escape sequences. + * ``'namereplace'`` Replace with ``\N{...}`` escape sequences. + The *errors* argument will be assigned to an attribute of the same name. Assigning to this attribute makes it possible to switch between different error handling strategies during the lifetime of the :class:`IncrementalEncoder` @@ -625,6 +640,8 @@ * ``'backslashreplace'`` Replace with backslashed escape sequences. + * ``'namereplace'`` Replace with ``\N{...}`` escape sequences. + The *errors* argument will be assigned to an attribute of the same name. Assigning to this attribute makes it possible to switch between different error handling strategies during the lifetime of the :class:`StreamWriter` object. diff --git a/Doc/library/functions.rst b/Doc/library/functions.rst --- a/Doc/library/functions.rst +++ b/Doc/library/functions.rst @@ -975,6 +975,9 @@ replaces unsupported characters with Python's backslashed escape sequences. + * ``'namereplace'`` (also only supported when writing) + replaces unsupported characters with ``\N{...}`` escape sequences. + .. index:: single: universal newlines; open() built-in function diff --git a/Doc/library/io.rst b/Doc/library/io.rst --- a/Doc/library/io.rst +++ b/Doc/library/io.rst @@ -827,9 +827,10 @@ errors can lead to data loss.) ``'replace'`` causes a replacement marker (such as ``'?'``) to be inserted where there is malformed data. When writing, ``'xmlcharrefreplace'`` (replace with the appropriate XML character - reference) or ``'backslashreplace'`` (replace with backslashed escape - sequences) can be used. Any other error handling name that has been - registered with :func:`codecs.register_error` is also valid. + reference), ``'backslashreplace'`` (replace with backslashed escape + sequences) or ``'namereplace'`` (replace with ``\N{...}`` escape sequences) + can be used. Any other error handling name that has been registered with + :func:`codecs.register_error` is also valid. .. 
index:: single: universal newlines; io.TextIOWrapper class diff --git a/Include/codecs.h b/Include/codecs.h --- a/Include/codecs.h +++ b/Include/codecs.h @@ -225,6 +225,9 @@ /* replace the unicode encode error with backslash escapes (\x, \u and \U) */ PyAPI_FUNC(PyObject *) PyCodec_BackslashReplaceErrors(PyObject *exc); +/* replace the unicode encode error with backslash escapes (\N, \x, \u and \U) */ +PyAPI_FUNC(PyObject *) PyCodec_NameReplaceErrors(PyObject *exc); + PyAPI_DATA(const char *) Py_hexdigits; #ifdef __cplusplus diff --git a/Lib/codecs.py b/Lib/codecs.py --- a/Lib/codecs.py +++ b/Lib/codecs.py @@ -22,6 +22,7 @@ "BOM_UTF32", "BOM_UTF32_LE", "BOM_UTF32_BE", "strict_errors", "ignore_errors", "replace_errors", "xmlcharrefreplace_errors", + "backslashreplace_errors", "namereplace_errors", "register_error", "lookup_error"] ### Constants @@ -1085,6 +1086,7 @@ replace_errors = lookup_error("replace") xmlcharrefreplace_errors = lookup_error("xmlcharrefreplace") backslashreplace_errors = lookup_error("backslashreplace") + namereplace_errors = lookup_error("namereplace") except LookupError: # In --disable-unicode builds, these error handler are missing strict_errors = None @@ -1092,6 +1094,7 @@ replace_errors = None xmlcharrefreplace_errors = None backslashreplace_errors = None + namereplace_errors = None # Tell modulefinder that using codecs probably needs the encodings # package diff --git a/Lib/test/test_codeccallbacks.py b/Lib/test/test_codeccallbacks.py --- a/Lib/test/test_codeccallbacks.py +++ b/Lib/test/test_codeccallbacks.py @@ -158,6 +158,22 @@ sout = b"a\xac\\u1234\xa4\\u8000\\U0010ffff" self.assertEqual(sin.encode("iso-8859-15", "backslashreplace"), sout) + def test_nameescape(self): + # Does the same as backslashescape, but prefers ``\N{...}`` escape + # sequences. 
+ sin = "a\xac\u1234\u20ac\u8000\U0010ffff" + sout = (b'a\\N{NOT SIGN}\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}' + b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff') + self.assertEqual(sin.encode("ascii", "namereplace"), sout) + + sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\\N{EURO SIGN}' + b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff') + self.assertEqual(sin.encode("latin-1", "namereplace"), sout) + + sout = (b'a\xac\\N{ETHIOPIC SYLLABLE SEE}\xa4' + b'\\N{CJK UNIFIED IDEOGRAPH-8000}\\U0010ffff') + self.assertEqual(sin.encode("iso-8859-15", "namereplace"), sout) + def test_decoding_callbacks(self): # This is a test for a decoding callback handler # that allows the decoding of the invalid sequence @@ -297,7 +313,7 @@ def test_longstrings(self): # test long strings to check for memory overflow problems errors = [ "strict", "ignore", "replace", "xmlcharrefreplace", - "backslashreplace"] + "backslashreplace", "namereplace"] # register the handlers under different names, # to prevent the codec from recognizing the name for err in errors: @@ -611,6 +627,81 @@ ("\\udfff", 1) ) + def test_badandgoodnamereplaceexceptions(self): + # "namereplace" complains about a non-exception passed in + self.assertRaises( + TypeError, + codecs.namereplace_errors, + 42 + ) + # "namereplace" complains about the wrong exception types + self.assertRaises( + TypeError, + codecs.namereplace_errors, + UnicodeError("ouch") + ) + # "namereplace" can only be used for encoding + self.assertRaises( + TypeError, + codecs.namereplace_errors, + UnicodeDecodeError("ascii", bytearray(b"\xff"), 0, 1, "ouch") + ) + self.assertRaises( + TypeError, + codecs.namereplace_errors, + UnicodeTranslateError("\u3042", 0, 1, "ouch") + ) + # Use the correct exception + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\u3042", 0, 1, "ouch")), + ("\\N{HIRAGANA LETTER A}", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\x00", 0, 1, "ouch")), + ("\\x00", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\xff", 0, 1, "ouch")), + ("\\N{LATIN SMALL LETTER Y WITH DIAERESIS}", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\u0100", 0, 1, "ouch")), + ("\\N{LATIN CAPITAL LETTER A WITH MACRON}", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\uffff", 0, 1, "ouch")), + ("\\uffff", 1) + ) + if SIZEOF_WCHAR_T > 0: + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\U00010000", + 0, 1, "ouch")), + ("\\N{LINEAR B SYLLABLE B008 A}", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\U0010ffff", + 0, 1, "ouch")), + ("\\U0010ffff", 1) + ) + # Lone surrogates (regardless of unicode width) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\ud800", 0, 1, "ouch")), + ("\\ud800", 1) + ) + self.assertEqual( + codecs.namereplace_errors( + UnicodeEncodeError("ascii", "\udfff", 0, 1, "ouch")), + ("\\udfff", 1) + ) + def test_badhandlerresults(self): results = ( 42, "foo", (1,2,3), ("foo", 1, 3), ("foo", None), ("foo",), ("foo", 1, 3), ("foo", None), ("foo",) ) encs = ("ascii", "latin-1", "iso-8859-1", "iso-8859-15") @@ -651,6 +742,10 @@ codecs.backslashreplace_errors, codecs.lookup_error("backslashreplace") ) + self.assertEqual( + codecs.namereplace_errors, + codecs.lookup_error("namereplace") + ) def test_unencodablereplacement(self): def unencrepl(exc): @@ -804,7 +899,8 @@ class D(dict): def 
__getitem__(self, key): raise ValueError - for err in ("strict", "replace", "xmlcharrefreplace", "backslashreplace", "test.posreturn"): + for err in ("strict", "replace", "xmlcharrefreplace", + "backslashreplace", "namereplace", "test.posreturn"): self.assertRaises(UnicodeError, codecs.charmap_encode, "\xff", err, {0xff: None}) self.assertRaises(ValueError, codecs.charmap_encode, "\xff", err, D()) self.assertRaises(TypeError, codecs.charmap_encode, "\xff", err, {0xff: 300}) diff --git a/Lib/test/test_codecs.py b/Lib/test/test_codecs.py --- a/Lib/test/test_codecs.py +++ b/Lib/test/test_codecs.py @@ -349,6 +349,8 @@ self.assertRaises(UnicodeEncodeError, "\ud800".encode, self.encoding) self.assertEqual("[\uDC80]".encode(self.encoding, "backslashreplace"), "[\\udc80]".encode(self.encoding)) + self.assertEqual("[\uDC80]".encode(self.encoding, "namereplace"), + "[\\udc80]".encode(self.encoding)) self.assertEqual("[\uDC80]".encode(self.encoding, "xmlcharrefreplace"), "[�]".encode(self.encoding)) self.assertEqual("[\uDC80]".encode(self.encoding, "ignore"), @@ -808,6 +810,7 @@ ('\udc80', 'ignore', b''), ('\udc80', 'replace', b'?'), ('\udc80', 'backslashreplace', b'\\udc80'), + ('\udc80', 'namereplace', b'\\udc80'), ('\udc80', 'surrogatepass', b'\xed\xb2\x80'), )) else: @@ -869,6 +872,8 @@ self.assertRaises(UnicodeDecodeError, b"\xed\xa0\x80".decode, "cp65001") self.assertEqual("[\uDC80]".encode("cp65001", "backslashreplace"), b'[\\udc80]') + self.assertEqual("[\uDC80]".encode("cp65001", "namereplace"), + b'[\\udc80]') self.assertEqual("[\uDC80]".encode("cp65001", "xmlcharrefreplace"), b'[�]') self.assertEqual("[\uDC80]".encode("cp65001", "surrogateescape"), @@ -2824,6 +2829,8 @@ ('[\xff]', 'replace', b'[y]'), ('[\u20ac]', 'replace', b'[?]'), ('[\xff]', 'backslashreplace', b'[\\xff]'), + ('[\xff]', 'namereplace', + b'[\\N{LATIN SMALL LETTER Y WITH DIAERESIS}]'), ('[\xff]', 'xmlcharrefreplace', b'[ÿ]'), ('\udcff', 'strict', None), ('[\udcff]', 'surrogateescape', b'[\xff]'), diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,8 @@ Library ------- +- Issue #19676: Added the "namereplace" error handler. + - Issue #22788: Add *context* parameter to logging.handlers.HTTPHandler. 
- Issue #22921: Allow SSLContext to take the *hostname* parameter even if diff --git a/Python/codecs.c b/Python/codecs.c --- a/Python/codecs.c +++ b/Python/codecs.c @@ -9,6 +9,7 @@ ------------------------------------------------------------------------ */ #include "Python.h" +#include "ucnhash.h" #include const char *Py_hexdigits = "0123456789abcdef"; @@ -933,6 +934,97 @@ } } +static _PyUnicode_Name_CAPI *ucnhash_CAPI = NULL; +static int ucnhash_initialized = 0; + +PyObject *PyCodec_NameReplaceErrors(PyObject *exc) +{ + if (PyObject_IsInstance(exc, PyExc_UnicodeEncodeError)) { + PyObject *restuple; + PyObject *object; + Py_ssize_t i; + Py_ssize_t start; + Py_ssize_t end; + PyObject *res; + unsigned char *outp; + int ressize; + Py_UCS4 c; + char buffer[256]; /* NAME_MAXLEN */ + if (PyUnicodeEncodeError_GetStart(exc, &start)) + return NULL; + if (PyUnicodeEncodeError_GetEnd(exc, &end)) + return NULL; + if (!(object = PyUnicodeEncodeError_GetObject(exc))) + return NULL; + if (!ucnhash_initialized) { + /* load the unicode data module */ + ucnhash_CAPI = (_PyUnicode_Name_CAPI *)PyCapsule_Import( + PyUnicodeData_CAPSULE_NAME, 1); + ucnhash_initialized = 1; + } + for (i = start, ressize = 0; i < end; ++i) { + /* object is guaranteed to be "ready" */ + c = PyUnicode_READ_CHAR(object, i); + if (ucnhash_CAPI && + ucnhash_CAPI->getname(NULL, c, buffer, sizeof(buffer), 1)) { + ressize += 1+1+1+strlen(buffer)+1; + } + else if (c >= 0x10000) { + ressize += 1+1+8; + } + else if (c >= 0x100) { + ressize += 1+1+4; + } + else + ressize += 1+1+2; + } + res = PyUnicode_New(ressize, 127); + if (res==NULL) + return NULL; + for (i = start, outp = PyUnicode_1BYTE_DATA(res); + i < end; ++i) { + c = PyUnicode_READ_CHAR(object, i); + *outp++ = '\\'; + if (ucnhash_CAPI && + ucnhash_CAPI->getname(NULL, c, buffer, sizeof(buffer), 1)) { + *outp++ = 'N'; + *outp++ = '{'; + strcpy((char *)outp, buffer); + outp += strlen(buffer); + *outp++ = '}'; + continue; + } + if (c >= 0x00010000) { + *outp++ = 'U'; + *outp++ = Py_hexdigits[(c>>28)&0xf]; + *outp++ = Py_hexdigits[(c>>24)&0xf]; + *outp++ = Py_hexdigits[(c>>20)&0xf]; + *outp++ = Py_hexdigits[(c>>16)&0xf]; + *outp++ = Py_hexdigits[(c>>12)&0xf]; + *outp++ = Py_hexdigits[(c>>8)&0xf]; + } + else if (c >= 0x100) { + *outp++ = 'u'; + *outp++ = Py_hexdigits[(c>>12)&0xf]; + *outp++ = Py_hexdigits[(c>>8)&0xf]; + } + else + *outp++ = 'x'; + *outp++ = Py_hexdigits[(c>>4)&0xf]; + *outp++ = Py_hexdigits[c&0xf]; + } + + assert(_PyUnicode_CheckConsistency(res, 1)); + restuple = Py_BuildValue("(Nn)", res, end); + Py_DECREF(object); + return restuple; + } + else { + wrong_exception_type(exc); + return NULL; + } +} + #define ENC_UNKNOWN -1 #define ENC_UTF8 0 #define ENC_UTF16BE 1 @@ -1276,6 +1368,11 @@ return PyCodec_BackslashReplaceErrors(exc); } +static PyObject *namereplace_errors(PyObject *self, PyObject *exc) +{ + return PyCodec_NameReplaceErrors(exc); +} + static PyObject *surrogatepass_errors(PyObject *self, PyObject *exc) { return PyCodec_SurrogatePassErrors(exc); @@ -1346,6 +1443,17 @@ } }, { + "namereplace", + { + "namereplace_errors", + namereplace_errors, + METH_O, + PyDoc_STR("Implements the 'namereplace' error handling, " + "which replaces an unencodable character with a " + "\\N{...} escape sequence.") + } + }, + { "surrogatepass", { "surrogatepass", -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 17:25:02 2014 From: python-checkins at python.org (victor.stinner) Date: Tue, 25 Nov 2014 16:25:02 +0000 Subject: [Python-checkins] 
=?utf-8?b?Y3B5dGhvbiAoMy40KTogQ2xvc2VzICMyMjY4?= =?utf-8?q?5=2C_asyncio=3A_Set_the_transport_of_stdout_and_stderr_StreamRe?= =?utf-8?q?ader?= Message-ID: <20141125162457.116316.84886@psf.io> https://hg.python.org/cpython/rev/f75d40c02f0a changeset: 93582:f75d40c02f0a branch: 3.4 parent: 93576:268ceaa78cf9 user: Victor Stinner date: Tue Nov 25 17:20:33 2014 +0100 summary: Closes #22685, asyncio: Set the transport of stdout and stderr StreamReader objects in the SubprocessStreamProtocol. It allows to pause the transport to not buffer too much stdout or stderr data. files: Lib/asyncio/subprocess.py | 17 ++++- Lib/test/test_asyncio/test_subprocess.py | 32 ++++++++++++ 2 files changed, 44 insertions(+), 5 deletions(-) diff --git a/Lib/asyncio/subprocess.py b/Lib/asyncio/subprocess.py --- a/Lib/asyncio/subprocess.py +++ b/Lib/asyncio/subprocess.py @@ -41,15 +41,22 @@ def connection_made(self, transport): self._transport = transport - if transport.get_pipe_transport(1): + + stdout_transport = transport.get_pipe_transport(1) + if stdout_transport is not None: self.stdout = streams.StreamReader(limit=self._limit, loop=self._loop) - if transport.get_pipe_transport(2): + self.stdout.set_transport(stdout_transport) + + stderr_transport = transport.get_pipe_transport(2) + if stderr_transport is not None: self.stderr = streams.StreamReader(limit=self._limit, loop=self._loop) - stdin = transport.get_pipe_transport(0) - if stdin is not None: - self.stdin = streams.StreamWriter(stdin, + self.stderr.set_transport(stderr_transport) + + stdin_transport = transport.get_pipe_transport(0) + if stdin_transport is not None: + self.stdin = streams.StreamWriter(stdin_transport, protocol=self, reader=None, loop=self._loop) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -4,6 +4,7 @@ import signal import sys import unittest +from unittest import mock from test import support if sys.platform != 'win32': from asyncio import unix_events @@ -161,6 +162,37 @@ self.loop.run_until_complete(proc.communicate(large_data)) self.loop.run_until_complete(proc.wait()) + def test_pause_reading(self): + @asyncio.coroutine + def test_pause_reading(): + limit = 100 + + code = '\n'.join(( + 'import sys', + 'sys.stdout.write("x" * %s)' % (limit * 2 + 1), + 'sys.stdout.flush()', + )) + proc = yield from asyncio.create_subprocess_exec( + sys.executable, '-c', code, + stdin=asyncio.subprocess.PIPE, + stdout=asyncio.subprocess.PIPE, + limit=limit, + loop=self.loop) + stdout_transport = proc._transport.get_pipe_transport(1) + stdout_transport.pause_reading = mock.Mock() + + yield from proc.wait() + + # The child process produced more than limit bytes of output, + # the stream reader transport should pause the protocol to not + # allocate too much memory. 
+ return stdout_transport.pause_reading.called + + # Issue #22685: Ensure that the stream reader pauses the protocol + # when the child process produces too much data + called = self.loop.run_until_complete(test_pause_reading()) + self.assertTrue(called) + if sys.platform != 'win32': # Unix -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 17:25:06 2014 From: python-checkins at python.org (victor.stinner) Date: Tue, 25 Nov 2014 16:25:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_Closes_=2322685=2C_asyncio=3A_Set_the_?= =?utf-8?q?transport_of_stdout_and_stderr?= Message-ID: <20141125162457.126790.90473@psf.io> https://hg.python.org/cpython/rev/7da2288183d1 changeset: 93583:7da2288183d1 parent: 93581:32d08aacffe0 parent: 93582:f75d40c02f0a user: Victor Stinner date: Tue Nov 25 17:21:43 2014 +0100 summary: (Merge 3.4) Closes #22685, asyncio: Set the transport of stdout and stderr StreamReader objects in the SubprocessStreamProtocol. It allows to pause the transport to not buffer too much stdout or stderr data. files: Lib/asyncio/subprocess.py | 17 ++++- Lib/test/test_asyncio/test_subprocess.py | 32 ++++++++++++ 2 files changed, 44 insertions(+), 5 deletions(-) diff --git a/Lib/asyncio/subprocess.py b/Lib/asyncio/subprocess.py --- a/Lib/asyncio/subprocess.py +++ b/Lib/asyncio/subprocess.py @@ -41,15 +41,22 @@ def connection_made(self, transport): self._transport = transport - if transport.get_pipe_transport(1): + + stdout_transport = transport.get_pipe_transport(1) + if stdout_transport is not None: self.stdout = streams.StreamReader(limit=self._limit, loop=self._loop) - if transport.get_pipe_transport(2): + self.stdout.set_transport(stdout_transport) + + stderr_transport = transport.get_pipe_transport(2) + if stderr_transport is not None: self.stderr = streams.StreamReader(limit=self._limit, loop=self._loop) - stdin = transport.get_pipe_transport(0) - if stdin is not None: - self.stdin = streams.StreamWriter(stdin, + self.stderr.set_transport(stderr_transport) + + stdin_transport = transport.get_pipe_transport(0) + if stdin_transport is not None: + self.stdin = streams.StreamWriter(stdin_transport, protocol=self, reader=None, loop=self._loop) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -4,6 +4,7 @@ import signal import sys import unittest +from unittest import mock from test import support if sys.platform != 'win32': from asyncio import unix_events @@ -161,6 +162,37 @@ self.loop.run_until_complete(proc.communicate(large_data)) self.loop.run_until_complete(proc.wait()) + def test_pause_reading(self): + @asyncio.coroutine + def test_pause_reading(): + limit = 100 + + code = '\n'.join(( + 'import sys', + 'sys.stdout.write("x" * %s)' % (limit * 2 + 1), + 'sys.stdout.flush()', + )) + proc = yield from asyncio.create_subprocess_exec( + sys.executable, '-c', code, + stdin=asyncio.subprocess.PIPE, + stdout=asyncio.subprocess.PIPE, + limit=limit, + loop=self.loop) + stdout_transport = proc._transport.get_pipe_transport(1) + stdout_transport.pause_reading = mock.Mock() + + yield from proc.wait() + + # The child process produced more than limit bytes of output, + # the stream reader transport should pause the protocol to not + # allocate too much memory. 
+ return stdout_transport.pause_reading.called + + # Issue #22685: Ensure that the stream reader pauses the protocol + # when the child process produces too much data + called = self.loop.run_until_complete(test_pause_reading()) + self.assertTrue(called) + if sys.platform != 'win32': # Unix -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 17:59:11 2014 From: python-checkins at python.org (berker.peksag) Date: Tue, 25 Nov 2014 16:59:11 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2319676=3A_Tweak_do?= =?utf-8?q?cumentation_a_bit=2E?= Message-ID: <20141125165901.55111.1743@psf.io> https://hg.python.org/cpython/rev/b6fab008d63a changeset: 93584:b6fab008d63a user: Berker Peksag date: Tue Nov 25 18:59:20 2014 +0200 summary: Issue #19676: Tweak documentation a bit. * Updated version info to 3.5 * Fixed a markup error * Added a versionadded directive to namereplace_errors documentation files: Doc/c-api/codec.rst | 4 ++-- Doc/library/codecs.rst | 4 +++- 2 files changed, 5 insertions(+), 3 deletions(-) diff --git a/Doc/c-api/codec.rst b/Doc/c-api/codec.rst --- a/Doc/c-api/codec.rst +++ b/Doc/c-api/codec.rst @@ -118,6 +118,6 @@ .. c:function:: PyObject* PyCodec_NameReplaceErrors(PyObject *exc) - Replace the unicode encode error with `\N{...}` escapes. + Replace the unicode encode error with ``\N{...}`` escapes. - .. versionadded: 3.4 + .. versionadded:: 3.5 diff --git a/Doc/library/codecs.rst b/Doc/library/codecs.rst --- a/Doc/library/codecs.rst +++ b/Doc/library/codecs.rst @@ -239,6 +239,8 @@ Implements the ``namereplace`` error handling (for encoding only): the unencodable character is replaced by a ``\N{...}`` escape sequence. + .. versionadded:: 3.5 + To simplify working with encoded files or stream, the module also defines these utility functions: @@ -394,7 +396,7 @@ .. versionchanged:: 3.4 The ``'surrogatepass'`` error handlers now works with utf-16\* and utf-32\* codecs. -.. versionadded:: 3.4 +.. versionadded:: 3.5 The ``'namereplace'`` error handler. The set of allowed values can be extended via :meth:`register_error`. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 18:45:55 2014 From: python-checkins at python.org (guido.van.rossum) Date: Tue, 25 Nov 2014 17:45:55 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Clarify_that_after_raising_Ru?= =?utf-8?q?ntimeError_a_generator_will_raise_StopIteration=2E?= Message-ID: <20141125174531.84285.36683@psf.io> https://hg.python.org/peps/rev/1522bae42b07 changeset: 5613:1522bae42b07 user: Guido van Rossum date: Tue Nov 25 09:24:47 2014 -0800 summary: Clarify that after raising RuntimeError a generator will raise StopIteration. files: pep-0479.txt | 8 +++++++- 1 files changed, 7 insertions(+), 1 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -57,7 +57,7 @@ This affects the third outcome listed above, without altering any other effects. Furthermore, it only affects this outcome when the -exception raised is StopIteration (or a subclass thereof). +exception raised is ``StopIteration`` (or a subclass thereof). Note that the proposed replacement happens at the point where the exception is about to bubble out of the frame, i.e. after any @@ -66,6 +66,12 @@ not affected (the point being that ``StopIteration`` means that the generator terminated "normally", i.e. it did not raise an exception). 
+A subtle issue is what will happen if the caller, having caught the +``RuntimeError``, calls the generator object's ``__next__()`` method +again. The answer is that it from this point on it will raise +``StopIteration`` -- the behavior is the same as when any other +exception was raised by the generator. + Consequences for existing code ============================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Tue Nov 25 18:45:55 2014 From: python-checkins at python.org (guido.van.rossum) Date: Tue, 25 Nov 2014 17:45:55 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Updates_and_figures_for_PEP_4?= =?utf-8?q?58_and_PEP_480_by_Vladimir_Diaz=2E?= Message-ID: <20141125174532.69787.71995@psf.io> https://hg.python.org/peps/rev/59259922c4f2 changeset: 5614:59259922c4f2 user: Guido van Rossum date: Tue Nov 25 09:45:28 2014 -0800 summary: Updates and figures for PEP 458 and PEP 480 by Vladimir Diaz. files: pep-0458.txt | 58 ++++++++++++++---------------- pep-0458/figure1.png | Bin pep-0458/figure2.png | Bin pep-0458/figure3.png | Bin pep-0480.txt | 4 +- pep-0480/figure1.png | Bin 6 files changed, 30 insertions(+), 32 deletions(-) diff --git a/pep-0458.txt b/pep-0458.txt --- a/pep-0458.txt +++ b/pep-0458.txt @@ -3,7 +3,7 @@ Version: $Revision$ Last-Modified: $Date$ Author: Trishank Karthik Kuppusamy , - Vladimir Diaz , + Vladimir Diaz , Donald Stufft , Justin Cappos BDFL-Delegate: Richard Jones Discussions-To: DistUtils mailing list @@ -44,12 +44,11 @@ documentation`__, which exists for this purpose. Support for project distributions that are signed by developers (maximum security model) is also not discussed in this PEP, but is outlined in the appendix as a possible future -extension and covered in detail in PEP X [VD: Link to PEP once it is -completed]. The PEP X extension focuses on the maximum security model, which -requires more PyPI administrative work (none by clients), but it also proposes -an easy-to-use key management solution for developers, how to interface with a -potential future build farm on PyPI infrastructure, and discusses the -feasibility of end-to-end signing. +extension and covered in detail in PEP 480 [26]_. The PEP 480 extension +focuses on the maximum security model, which requires more PyPI administrative +work (none by clients), but it also proposes an easy-to-use key management +solution for developers, how to interface with a potential future build farm on +PyPI infrastructure, and discusses the feasibility of end-to-end signing. __ https://github.com/theupdateframework/tuf/tree/develop/tuf/client#updaterpy @@ -164,9 +163,8 @@ * Metadata: Metadata are signed files that describe roles, other metadata, and target files. -* Repository: A repository is a resource compromised of named metadata and - target files. Clients request metadata and target files stored on a - repository. +* Repository: A repository is a resource comprised of named metadata and target + files. Clients request metadata and target files stored on a repository. * Consistent snapshot: A set of TUF metadata and PyPI targets that capture the complete state of all projects on PyPI as they existed at some fixed point in @@ -302,7 +300,7 @@ responsibilities without exception. Figure 1 provides a table of the roles used in TUF. -.. image:: figure1.png +.. image:: pep-0458/figure1.png Figure 1: An overview of the TUF roles. @@ -322,7 +320,7 @@ trusted to sign for files available on PyPI. 
The next two sections cover the details of signing repository files and the types of keys used for each role. -.. image:: figure2.png +.. image:: pep-0458/figure2.png Figure 2: An overview of the role metadata available on PyPI. @@ -743,10 +741,9 @@ Finally, a compromise of the PyPI infrastructure MAY introduce malicious updates to *bins* projects because the keys for these roles are online. The -maximum security model discussed in the appendix addresses this issue. PEP X -[VD: Link to PEP once it is completed] also covers the maximum security model -and goes into more detail on generating developer keys and signing uploaded -distributions. +maximum security model discussed in the appendix addresses this issue. PEP 480 +also covers the maximum security model and goes into more detail on generating +developer keys and signing uploaded distributions. In the Event of a Key Compromise @@ -908,10 +905,10 @@ excluded from this PEP. Although both improve PyPI's ability to survive a repository compromise and allow developers to sign their distributions, they have been postponed for review as a potential future extension to PEP 458. PEP -X [VD: Link to PEP once it is completed], which discusses the extension in -detail, is available for review to those developers interested in the -end-to-end signing option. The maximum security model and end-to-end signing -are briefly covered in subsections that follow. +480 [26]_, which discusses the extension in detail, is available for review to +those developers interested in the end-to-end signing option. The maximum +security model and end-to-end signing are briefly covered in subsections that +follow. There are several reasons for not initially supporting the features discussed in this section: @@ -960,7 +957,7 @@ packages in the minimum security model, but not in the maximum model without also compromising a developer's key. -.. image:: figure3.png +.. image:: pep-0458/figure3.png Figure 3: An overview of the metadata layout in the maximum security model. The maximum security model supports continuous delivery and survivable key @@ -975,15 +972,15 @@ clients (they sign the metadata for this part of the process), and developers can sign the distributions that they upload. -PEP X [VD: Link to PEP once it is completed] discusses the tools available to -developers who sign the distributions that they upload to PyPI. To summarize -PEP X, developers generate cryptographic keys and sign metadata in some -automated fashion, where the metadata includes the information required to -verify the authenticity of the distribution. The metadata is then uploaded to -PyPI by the client, where it will be available for download by package managers -such as pip (i.e., package managers that support TUF metadata). The entire -process is transparent to clients (using a package manager that supports TUF) -who download distributions from PyPI. +PEP 480 [26]_ discusses the tools available to developers who sign the +distributions that they upload to PyPI. To summarize PEP 480, developers +generate cryptographic keys and sign metadata in some automated fashion, where +the metadata includes the information required to verify the authenticity of +the distribution. The metadata is then uploaded to PyPI by the client, where +it will be available for download by package managers such as pip (i.e., +package managers that support TUF metadata). The entire process is transparent +to clients (using a package manager that supports TUF) who download +distributions from PyPI. 
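The client-side check that makes this transparent is conceptually simple. As a purely illustrative sketch (this is not TUF's or pip's actual API, and the function and parameter names are made up for the example), the package manager only has to recompute a digest of the downloaded distribution and compare it with the digest recorded in metadata whose signatures it has already verified:

    import hashlib

    def distribution_matches(path, expected_sha256):
        # Hash the downloaded distribution file and compare it with the
        # digest listed in already-verified, signed metadata.
        digest = hashlib.sha256()
        with open(path, "rb") as f:
            for chunk in iter(lambda: f.read(8192), b""):
                digest.update(chunk)
        return digest.hexdigest() == expected_sha256
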
Appendix C: PEP 470 and Projects Hosted Externally @@ -1065,6 +1062,7 @@ .. [23] https://www.openssl.org/ .. [24] https://pypi.python.org/pypi/pycrypto .. [25] http://ed25519.cr.yp.to/ +.. [26] https://www.python.org/dev/peps/pep-0480/ Acknowledgements ================ diff --git a/pep-0458/figure1.png b/pep-0458/figure1.png new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..b08801b5841cd35da8f719549e2c5377793e35f1 GIT binary patch [stripped] diff --git a/pep-0458/figure2.png b/pep-0458/figure2.png new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..cb535f631bcb8277ef9c3e4e4bc4f9a0765b5519 GIT binary patch [stripped] diff --git a/pep-0458/figure3.png b/pep-0458/figure3.png new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..a31edf1702d26556382973306a8f216e7f304418 GIT binary patch [stripped] diff --git a/pep-0480.txt b/pep-0480.txt --- a/pep-0480.txt +++ b/pep-0480.txt @@ -3,7 +3,7 @@ Version: $Revision$ Last-Modified: $Date$ Author: Trishank Karthik Kuppusamy , - Vladimir Diaz , Donald Stufft , + Vladimir Diaz , Donald Stufft , Justin Cappos BDFL-Delegate: Richard Jones Discussions-To: DistUtils mailing list @@ -186,7 +186,7 @@ packages in the minimum security model, but not in the maximum model, without also compromising a developer's key. -.. image:: figure1.png +.. image:: pep-0480/figure1.png Figure 1: An overview of the metadata layout in the maximum security model. The maximum security model supports continuous delivery and survivable key diff --git a/pep-0480/figure1.png b/pep-0480/figure1.png new file mode 100644 index e69de29bb2d1d6434b8b29ae775ad8c2e48c5391..a31edf1702d26556382973306a8f216e7f304418 GIT binary patch [stripped] -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Tue Nov 25 19:07:53 2014 From: python-checkins at python.org (guido.van.rossum) Date: Tue, 25 Nov 2014 18:07:53 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Clarify_what_happens_on_g=2Et?= =?utf-8?q?hrow=28StopIteration=29=2E?= Message-ID: <20141125180739.126774.35289@psf.io> https://hg.python.org/peps/rev/2da36288f80b changeset: 5615:2da36288f80b user: Guido van Rossum date: Tue Nov 25 10:07:35 2014 -0800 summary: Clarify what happens on g.throw(StopIteration). files: pep-0479.txt | 6 ++++++ 1 files changed, 6 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -72,6 +72,12 @@ ``StopIteration`` -- the behavior is the same as when any other exception was raised by the generator. +Another logical consequence of the proposal: if somone uses +``g.throw(StopIteration)`` to throw a ``StopIteration`` exception into +a generator, if the generator doesn't catch it (which it could do +using a ``try/except`` around the ``yield``), it will be transformed +into ``RuntimeError``. 
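A small sketch of the behaviour described in this and the previous clarification, assuming an interpreter where the proposal is in effect (the exact wording of the error message is illustrative):

    >>> def gen():
    ...     yield 1
    ...     raise StopIteration    # escapes the generator's frame
    ...
    >>> g = gen()
    >>> next(g)
    1
    >>> next(g)    # the escaping StopIteration is replaced
    Traceback (most recent call last):
      ...
    RuntimeError: generator raised StopIteration
    >>> next(g)    # from this point on the generator is simply exhausted
    Traceback (most recent call last):
      ...
    StopIteration
    >>> g2 = gen(); next(g2)
    1
    >>> g2.throw(StopIteration)    # not caught around the yield, same result
    Traceback (most recent call last):
      ...
    RuntimeError: generator raised StopIteration
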
+ Consequences for existing code ============================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Tue Nov 25 21:54:58 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 20:54:58 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_remove_incorre?= =?utf-8?q?ct_plural?= Message-ID: <20141125205454.116308.43694@psf.io> https://hg.python.org/cpython/rev/0551b8c66b91 changeset: 93585:0551b8c66b91 branch: 2.7 parent: 93580:28fecaa8a74c user: Benjamin Peterson date: Tue Nov 25 14:54:45 2014 -0600 summary: remove incorrect plural files: Doc/library/re.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/re.rst b/Doc/library/re.rst --- a/Doc/library/re.rst +++ b/Doc/library/re.rst @@ -366,7 +366,7 @@ database. ``\S`` - When the :const:`UNICODE` flags is not specified, matches any non-whitespace + When the :const:`UNICODE` flag is not specified, matches any non-whitespace character; this is equivalent to the set ``[^ \t\n\r\f\v]`` The :const:`LOCALE` flag has no extra effect on non-whitespace match. If :const:`UNICODE` is set, then any character not marked as space in the -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 22:17:21 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 21:17:21 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogZG9uJ3QgZmFpbCB0?= =?utf-8?q?ests_when_www=2Epython=2Eorg_can=27t_be_validated_by_the_system?= Message-ID: <20141125211714.84281.4592@psf.io> https://hg.python.org/cpython/rev/2e4888fa8b60 changeset: 93586:2e4888fa8b60 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 15:16:55 2014 -0600 summary: don't fail tests when www.python.org can't be validated by the system files: Lib/test/test_httplib.py | 4 +--- Lib/test/test_robotparser.py | 5 +++-- Lib/test/test_support.py | 13 +++++++++++++ 3 files changed, 17 insertions(+), 5 deletions(-) diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -551,12 +551,10 @@ resp = h.getresponse() self.assertIn('nginx', resp.getheader('server')) + @test_support.system_must_validate_cert def test_networked_trusted_by_default_cert(self): # Default settings: requires a valid cert from a trusted CA test_support.requires('network') - if test_support.verbose: - import ssl - print(ssl._create_default_https_context().get_ca_certs()) with test_support.transient_internet('www.python.org'): h = httplib.HTTPSConnection('www.python.org', 443) h.request('GET', '/') diff --git a/Lib/test/test_robotparser.py b/Lib/test/test_robotparser.py --- a/Lib/test/test_robotparser.py +++ b/Lib/test/test_robotparser.py @@ -276,14 +276,15 @@ self.assertEqual(parser.can_fetch("*", robots_url), False) @unittest.skipUnless(HAVE_HTTPS, 'need SSL support to download license') + @test_support.system_must_validate_cert def testPythonOrg(self): test_support.requires('network') with test_support.transient_internet('www.python.org'): parser = robotparser.RobotFileParser( - "http://www.python.org/robots.txt") + "https://www.python.org/robots.txt") parser.read() self.assertTrue( - parser.can_fetch("*", "http://www.python.org/robots.txt")) + parser.can_fetch("*", "https://www.python.org/robots.txt")) def test_main(): diff --git a/Lib/test/test_support.py b/Lib/test/test_support.py --- a/Lib/test/test_support.py +++ b/Lib/test/test_support.py @@ -481,6 +481,19 @@ IPV6_ENABLED = 
_is_ipv6_enabled() +def system_must_validate_cert(f): + """Skip the test on TLS certificate validation failures.""" + @functools.wraps(f) + def dec(*args, **kwargs): + try: + f(*args, **kwargs) + except IOError as e: + if e.reason == "CERTIFICATE_VERIFY_FAILED": + raise unittest.SkipTest("system does not contain " + "necessary certificates") + raise + return dec + FUZZ = 1e-6 def fcmp(x, y): # fuzzy comparison function -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 22:44:14 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 21:44:14 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_handle_errors_?= =?utf-8?q?without_a_reason_attribute?= Message-ID: <20141125214413.126768.89938@psf.io> https://hg.python.org/cpython/rev/8ca79131ca65 changeset: 93587:8ca79131ca65 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 15:43:58 2014 -0600 summary: handle errors without a reason attribute files: Lib/test/test_support.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_support.py b/Lib/test/test_support.py --- a/Lib/test/test_support.py +++ b/Lib/test/test_support.py @@ -488,7 +488,7 @@ try: f(*args, **kwargs) except IOError as e: - if e.reason == "CERTIFICATE_VERIFY_FAILED": + if getattr(e, "reason", "") == "CERTIFICATE_VERIFY_FAILED": raise unittest.SkipTest("system does not contain " "necessary certificates") raise -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Tue Nov 25 23:12:45 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 22:12:45 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_use_more_ugly_?= =?utf-8?q?but_hopefully_more_robust_method?= Message-ID: <20141125221242.69779.4318@psf.io> https://hg.python.org/cpython/rev/c34ac8c16af3 changeset: 93588:c34ac8c16af3 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 16:12:32 2014 -0600 summary: use more ugly but hopefully more robust method files: Lib/test/test_support.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_support.py b/Lib/test/test_support.py --- a/Lib/test/test_support.py +++ b/Lib/test/test_support.py @@ -488,7 +488,7 @@ try: f(*args, **kwargs) except IOError as e: - if getattr(e, "reason", "") == "CERTIFICATE_VERIFY_FAILED": + if "CERTIFICATE_VERIFY_FAILED" in str(e): raise unittest.SkipTest("system does not contain " "necessary certificates") raise -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 00:04:40 2014 From: python-checkins at python.org (guido.van.rossum) Date: Tue, 25 Nov 2014 23:04:40 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Move_PEP_480_figure_out_of_su?= =?utf-8?q?bdir_--_that_does_not_work_on_python=2Eorg=2E?= Message-ID: <20141125230439.126764.35826@psf.io> https://hg.python.org/peps/rev/ca6abc65224d changeset: 5616:ca6abc65224d user: Guido van Rossum date: Tue Nov 25 15:04:35 2014 -0800 summary: Move PEP 480 figure out of subdir -- that does not work on python.org. files: pep-0480/figure1.png | 0 pep-0480.txt | 2 +- 2 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0480/figure1.png b/pep-0480-1.png rename from pep-0480/figure1.png rename to pep-0480-1.png diff --git a/pep-0480.txt b/pep-0480.txt --- a/pep-0480.txt +++ b/pep-0480.txt @@ -186,7 +186,7 @@ packages in the minimum security model, but not in the maximum model, without also compromising a developer's key. -.. 
image:: pep-0480/figure1.png +.. image:: pep-0480-1.png Figure 1: An overview of the metadata layout in the maximum security model. The maximum security model supports continuous delivery and survivable key -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 00:37:42 2014 From: python-checkins at python.org (benjamin.peterson) Date: Tue, 25 Nov 2014 23:37:42 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_disable_tests_?= =?utf-8?q?that_always_fail_on_windows_=28=2322943=29?= Message-ID: <20141125233719.84291.97223@psf.io> https://hg.python.org/cpython/rev/e5ed983bc784 changeset: 93589:e5ed983bc784 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 17:37:09 2014 -0600 summary: disable tests that always fail on windows (#22943) files: Lib/bsddb/test/test_queue.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/bsddb/test/test_queue.py b/Lib/bsddb/test/test_queue.py --- a/Lib/bsddb/test/test_queue.py +++ b/Lib/bsddb/test/test_queue.py @@ -10,6 +10,7 @@ #---------------------------------------------------------------------- + at unittest.skip("fails on Windows; see issue 22943") class SimpleQueueTestCase(unittest.TestCase): def setUp(self): self.filename = get_new_database_path() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:06:07 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:06:07 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogZG9uJ3QgZmFpbCB0?= =?utf-8?q?ests_when_www=2Epython=2Eorg_can=27t_be_validated_by_the_system?= Message-ID: <20141126000551.69793.65795@psf.io> https://hg.python.org/cpython/rev/ca7d00b9d425 changeset: 93590:ca7d00b9d425 branch: 3.4 parent: 93582:f75d40c02f0a user: Benjamin Peterson date: Tue Nov 25 15:16:55 2014 -0600 summary: don't fail tests when www.python.org can't be validated by the system files: Lib/test/support/__init__.py | 12 ++++++++++++ Lib/test/test_httplib.py | 1 + 2 files changed, 13 insertions(+), 0 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -691,6 +691,18 @@ IPV6_ENABLED = _is_ipv6_enabled() +def system_must_validate_cert(f): + """Skip the test on TLS certificate validation failures.""" + @functools.wraps(f) + def dec(*args, **kwargs): + try: + f(*args, **kwargs) + except IOError as e: + if e.reason == "CERTIFICATE_VERIFY_FAILED": + raise unittest.SkipTest("system does not contain " + "necessary certificates") + raise + return dec # A constant likely larger than the underlying OS pipe buffer size, to # make writes blocking. 
diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -794,6 +794,7 @@ resp = h.getresponse() self.assertIn('nginx', resp.getheader('server')) + @support.system_must_validate_cert def test_networked_trusted_by_default_cert(self): # Default settings: requires a valid cert from a trusted CA support.requires('network') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:06:06 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:06:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_handle_errors_?= =?utf-8?q?without_a_reason_attribute?= Message-ID: <20141126000552.55123.63398@psf.io> https://hg.python.org/cpython/rev/e635c3ba75c8 changeset: 93591:e635c3ba75c8 branch: 3.4 user: Benjamin Peterson date: Tue Nov 25 15:43:58 2014 -0600 summary: handle errors without a reason attribute files: Lib/test/support/__init__.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -698,7 +698,7 @@ try: f(*args, **kwargs) except IOError as e: - if e.reason == "CERTIFICATE_VERIFY_FAILED": + if "CERTIFICATE_VERIFY_FAILED" in str(e): raise unittest.SkipTest("system does not contain " "necessary certificates") raise -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:06:07 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:06:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141126000552.116332.80719@psf.io> https://hg.python.org/cpython/rev/81b5268efff6 changeset: 93592:81b5268efff6 parent: 93584:b6fab008d63a parent: 93591:e635c3ba75c8 user: Benjamin Peterson date: Tue Nov 25 18:05:40 2014 -0600 summary: merge 3.4 files: Lib/test/support/__init__.py | 12 ++++++++++++ Lib/test/test_httplib.py | 1 + 2 files changed, 13 insertions(+), 0 deletions(-) diff --git a/Lib/test/support/__init__.py b/Lib/test/support/__init__.py --- a/Lib/test/support/__init__.py +++ b/Lib/test/support/__init__.py @@ -691,6 +691,18 @@ IPV6_ENABLED = _is_ipv6_enabled() +def system_must_validate_cert(f): + """Skip the test on TLS certificate validation failures.""" + @functools.wraps(f) + def dec(*args, **kwargs): + try: + f(*args, **kwargs) + except IOError as e: + if "CERTIFICATE_VERIFY_FAILED" in str(e): + raise unittest.SkipTest("system does not contain " + "necessary certificates") + raise + return dec # A constant likely larger than the underlying OS pipe buffer size, to # make writes blocking. 
diff --git a/Lib/test/test_httplib.py b/Lib/test/test_httplib.py --- a/Lib/test/test_httplib.py +++ b/Lib/test/test_httplib.py @@ -1028,6 +1028,7 @@ resp = h.getresponse() self.assertIn('nginx', resp.getheader('server')) + @support.system_must_validate_cert def test_networked_trusted_by_default_cert(self): # Default settings: requires a valid cert from a trusted CA support.requires('network') -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:28:51 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:28:51 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Added_tag_v2?= =?utf-8?q?=2E7=2E9rc1_for_changeset_40eada278702?= Message-ID: <20141126002849.84299.16209@psf.io> https://hg.python.org/cpython/rev/080dba0e66e4 changeset: 93595:080dba0e66e4 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 18:27:39 2014 -0600 summary: Added tag v2.7.9rc1 for changeset 40eada278702 files: .hgtags | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/.hgtags b/.hgtags --- a/.hgtags +++ b/.hgtags @@ -166,3 +166,4 @@ e32e3a9f390212463c22509d0f9aead8051cee63 v2.7.7rc1 f89216059edf77660ef1eb2a98e88352551da1d6 v2.7.7 ee879c0ffa11caaa34bf01537e1c4411dd948552 v2.7.8 +40eada278702349a2b2f334aa9d91fa7090ea1e3 v2.7.9rc1 -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:28:51 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:28:51 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogMi43LjlyYzE=?= Message-ID: <20141126002848.84285.39993@psf.io> https://hg.python.org/cpython/rev/40eada278702 changeset: 93594:40eada278702 branch: 2.7 tag: v2.7.9rc1 user: Benjamin Peterson date: Tue Nov 25 18:27:24 2014 -0600 summary: 2.7.9rc1 files: Include/patchlevel.h | 8 ++++---- Lib/distutils/__init__.py | 2 +- Lib/idlelib/idlever.py | 2 +- Misc/NEWS | 8 ++++---- Misc/RPM/python-2.7.spec | 2 +- README | 2 +- 6 files changed, 12 insertions(+), 12 deletions(-) diff --git a/Include/patchlevel.h b/Include/patchlevel.h --- a/Include/patchlevel.h +++ b/Include/patchlevel.h @@ -22,12 +22,12 @@ /*--start constants--*/ #define PY_MAJOR_VERSION 2 #define PY_MINOR_VERSION 7 -#define PY_MICRO_VERSION 8 -#define PY_RELEASE_LEVEL PY_RELEASE_LEVEL_FINAL -#define PY_RELEASE_SERIAL 0 +#define PY_MICRO_VERSION 9 +#define PY_RELEASE_LEVEL PY_RELEASE_LEVEL_GAMMA +#define PY_RELEASE_SERIAL 1 /* Version as a string */ -#define PY_VERSION "2.7.8+" +#define PY_VERSION "2.7.9rc1" /*--end constants--*/ /* Subversion Revision number of this file (not of the repository). Empty diff --git a/Lib/distutils/__init__.py b/Lib/distutils/__init__.py --- a/Lib/distutils/__init__.py +++ b/Lib/distutils/__init__.py @@ -15,5 +15,5 @@ # Updated automatically by the Python release process. # #--start constants-- -__version__ = "2.7.8" +__version__ = "2.7.9rc1" #--end constants-- diff --git a/Lib/idlelib/idlever.py b/Lib/idlelib/idlever.py --- a/Lib/idlelib/idlever.py +++ b/Lib/idlelib/idlever.py @@ -1,1 +1,1 @@ -IDLE_VERSION = "2.7.8" +IDLE_VERSION = "2.7.9rc1" diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -2,10 +2,10 @@ Python News +++++++++++ -What's New in Python 2.7.9? -========================== - -*Release date: XXXX-XX-XX* +What's New in Python 2.7.9 release candidate 1? 
+=============================================== + +*Release date: 2014-11-25* Core and Builtins ----------------- diff --git a/Misc/RPM/python-2.7.spec b/Misc/RPM/python-2.7.spec --- a/Misc/RPM/python-2.7.spec +++ b/Misc/RPM/python-2.7.spec @@ -39,7 +39,7 @@ %define name python #--start constants-- -%define version 2.7.8 +%define version 2.7.9rc1 %define libvers 2.7 #--end constants-- %define release 1pydotorg diff --git a/README b/README --- a/README +++ b/README @@ -1,4 +1,4 @@ -This is Python version 2.7.8 +This is Python version 2.7.9 ============================ Copyright (c) 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:28:48 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:28:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_update_pydoc-t?= =?utf-8?q?opics?= Message-ID: <20141126002848.116326.21704@psf.io> https://hg.python.org/cpython/rev/9f11ee6aa006 changeset: 93593:9f11ee6aa006 branch: 2.7 parent: 93589:e5ed983bc784 user: Benjamin Peterson date: Tue Nov 25 18:25:06 2014 -0600 summary: update pydoc-topics files: Lib/pydoc_data/topics.py | 159 +++++++++++++------------- 1 files changed, 80 insertions(+), 79 deletions(-) diff --git a/Lib/pydoc_data/topics.py b/Lib/pydoc_data/topics.py --- a/Lib/pydoc_data/topics.py +++ b/Lib/pydoc_data/topics.py @@ -1,79 +1,80 @@ -# Autogenerated by Sphinx on Sun Jun 29 18:55:25 2014 -topics = {'assert': '\nThe ``assert`` statement\n************************\n\nAssert statements are a convenient way to insert debugging assertions\ninto a program:\n\n assert_stmt ::= "assert" expression ["," expression]\n\nThe simple form, ``assert expression``, is equivalent to\n\n if __debug__:\n if not expression: raise AssertionError\n\nThe extended form, ``assert expression1, expression2``, is equivalent\nto\n\n if __debug__:\n if not expression1: raise AssertionError(expression2)\n\nThese equivalences assume that ``__debug__`` and ``AssertionError``\nrefer to the built-in variables with those names. In the current\nimplementation, the built-in variable ``__debug__`` is ``True`` under\nnormal circumstances, ``False`` when optimization is requested\n(command line option -O). The current code generator emits no code\nfor an assert statement when optimization is requested at compile\ntime. Note that it is unnecessary to include the source code for the\nexpression that failed in the error message; it will be displayed as\npart of the stack trace.\n\nAssignments to ``__debug__`` are illegal. 
The value for the built-in\nvariable is determined when the interpreter starts.\n', - 'assignment': '\nAssignment statements\n*********************\n\nAssignment statements are used to (re)bind names to values and to\nmodify attributes or items of mutable objects:\n\n assignment_stmt ::= (target_list "=")+ (expression_list | yield_expression)\n target_list ::= target ("," target)* [","]\n target ::= identifier\n | "(" target_list ")"\n | "[" target_list "]"\n | attributeref\n | subscription\n | slicing\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn assignment statement evaluates the expression list (remember that\nthis can be a single expression or a comma-separated list, the latter\nyielding a tuple) and assigns the single resulting object to each of\nthe target lists, from left to right.\n\nAssignment is defined recursively depending on the form of the target\n(list). When a target is part of a mutable object (an attribute\nreference, subscription or slicing), the mutable object must\nultimately perform the assignment and decide about its validity, and\nmay raise an exception if the assignment is unacceptable. The rules\nobserved by various types and the exceptions raised are given with the\ndefinition of the object types (see section *The standard type\nhierarchy*).\n\nAssignment of an object to a target list is recursively defined as\nfollows.\n\n* If the target list is a single target: The object is assigned to\n that target.\n\n* If the target list is a comma-separated list of targets: The object\n must be an iterable with the same number of items as there are\n targets in the target list, and the items are assigned, from left to\n right, to the corresponding targets.\n\nAssignment of an object to a single target is recursively defined as\nfollows.\n\n* If the target is an identifier (name):\n\n * If the name does not occur in a ``global`` statement in the\n current code block: the name is bound to the object in the current\n local namespace.\n\n * Otherwise: the name is bound to the object in the current global\n namespace.\n\n The name is rebound if it was already bound. This may cause the\n reference count for the object previously bound to the name to reach\n zero, causing the object to be deallocated and its destructor (if it\n has one) to be called.\n\n* If the target is a target list enclosed in parentheses or in square\n brackets: The object must be an iterable with the same number of\n items as there are targets in the target list, and its items are\n assigned, from left to right, to the corresponding targets.\n\n* If the target is an attribute reference: The primary expression in\n the reference is evaluated. It should yield an object with\n assignable attributes; if this is not the case, ``TypeError`` is\n raised. That object is then asked to assign the assigned object to\n the given attribute; if it cannot perform the assignment, it raises\n an exception (usually but not necessarily ``AttributeError``).\n\n Note: If the object is a class instance and the attribute reference\n occurs on both sides of the assignment operator, the RHS expression,\n ``a.x`` can access either an instance attribute or (if no instance\n attribute exists) a class attribute. 
The LHS target ``a.x`` is\n always set as an instance attribute, creating it if necessary.\n Thus, the two occurrences of ``a.x`` do not necessarily refer to the\n same attribute: if the RHS expression refers to a class attribute,\n the LHS creates a new instance attribute as the target of the\n assignment:\n\n class Cls:\n x = 3 # class variable\n inst = Cls()\n inst.x = inst.x + 1 # writes inst.x as 4 leaving Cls.x as 3\n\n This description does not necessarily apply to descriptor\n attributes, such as properties created with ``property()``.\n\n* If the target is a subscription: The primary expression in the\n reference is evaluated. It should yield either a mutable sequence\n object (such as a list) or a mapping object (such as a dictionary).\n Next, the subscript expression is evaluated.\n\n If the primary is a mutable sequence object (such as a list), the\n subscript must yield a plain integer. If it is negative, the\n sequence\'s length is added to it. The resulting value must be a\n nonnegative integer less than the sequence\'s length, and the\n sequence is asked to assign the assigned object to its item with\n that index. If the index is out of range, ``IndexError`` is raised\n (assignment to a subscripted sequence cannot add new items to a\n list).\n\n If the primary is a mapping object (such as a dictionary), the\n subscript must have a type compatible with the mapping\'s key type,\n and the mapping is then asked to create a key/datum pair which maps\n the subscript to the assigned object. This can either replace an\n existing key/value pair with the same key value, or insert a new\n key/value pair (if no key with the same value existed).\n\n* If the target is a slicing: The primary expression in the reference\n is evaluated. It should yield a mutable sequence object (such as a\n list). The assigned object should be a sequence object of the same\n type. Next, the lower and upper bound expressions are evaluated,\n insofar they are present; defaults are zero and the sequence\'s\n length. The bounds should evaluate to (small) integers. If either\n bound is negative, the sequence\'s length is added to it. The\n resulting bounds are clipped to lie between zero and the sequence\'s\n length, inclusive. Finally, the sequence object is asked to replace\n the slice with the items of the assigned sequence. The length of\n the slice may be different from the length of the assigned sequence,\n thus changing the length of the target sequence, if the object\n allows it.\n\n**CPython implementation detail:** In the current implementation, the\nsyntax for targets is taken to be the same as for expressions, and\ninvalid syntax is rejected during the code generation phase, causing\nless detailed error messages.\n\nWARNING: Although the definition of assignment implies that overlaps\nbetween the left-hand side and the right-hand side are \'safe\' (for\nexample ``a, b = b, a`` swaps two variables), overlaps *within* the\ncollection of assigned-to variables are not safe! 
For instance, the\nfollowing program prints ``[0, 2]``:\n\n x = [0, 1]\n i = 0\n i, x[i] = 1, 2\n print x\n\n\nAugmented assignment statements\n===============================\n\nAugmented assignment is the combination, in a single statement, of a\nbinary operation and an assignment statement:\n\n augmented_assignment_stmt ::= augtarget augop (expression_list | yield_expression)\n augtarget ::= identifier | attributeref | subscription | slicing\n augop ::= "+=" | "-=" | "*=" | "/=" | "//=" | "%=" | "**="\n | ">>=" | "<<=" | "&=" | "^=" | "|="\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn augmented assignment evaluates the target (which, unlike normal\nassignment statements, cannot be an unpacking) and the expression\nlist, performs the binary operation specific to the type of assignment\non the two operands, and assigns the result to the original target.\nThe target is only evaluated once.\n\nAn augmented assignment expression like ``x += 1`` can be rewritten as\n``x = x + 1`` to achieve a similar, but not exactly equal effect. In\nthe augmented version, ``x`` is only evaluated once. Also, when\npossible, the actual operation is performed *in-place*, meaning that\nrather than creating a new object and assigning that to the target,\nthe old object is modified instead.\n\nWith the exception of assigning to tuples and multiple targets in a\nsingle statement, the assignment done by augmented assignment\nstatements is handled the same way as normal assignments. Similarly,\nwith the exception of the possible *in-place* behavior, the binary\noperation performed by augmented assignment is the same as the normal\nbinary operations.\n\nFor targets which are attribute references, the same *caveat about\nclass and instance attributes* applies as for regular assignments.\n', - 'atom-identifiers': '\nIdentifiers (Names)\n*******************\n\nAn identifier occurring as an atom is a name. See section\n*Identifiers and keywords* for lexical definition and section *Naming\nand binding* for documentation of naming and binding.\n\nWhen the name is bound to an object, evaluation of the atom yields\nthat object. When a name is not bound, an attempt to evaluate it\nraises a ``NameError`` exception.\n\n**Private name mangling:** When an identifier that textually occurs in\na class definition begins with two or more underscore characters and\ndoes not end in two or more underscores, it is considered a *private\nname* of that class. Private names are transformed to a longer form\nbefore code is generated for them. The transformation inserts the\nclass name, with leading underscores removed and a single underscore\ninserted, in front of the name. For example, the identifier\n``__spam`` occurring in a class named ``Ham`` will be transformed to\n``_Ham__spam``. This transformation is independent of the syntactical\ncontext in which the identifier is used. If the transformed name is\nextremely long (longer than 255 characters), implementation defined\ntruncation may happen. If the class name consists only of underscores,\nno transformation is done.\n', - 'atom-literals': "\nLiterals\n********\n\nPython supports string literals and various numeric literals:\n\n literal ::= stringliteral | integer | longinteger\n | floatnumber | imagnumber\n\nEvaluation of a literal yields an object of the given type (string,\ninteger, long integer, floating point number, complex number) with the\ngiven value. 
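To make the private name mangling described under *Identifiers (Names)* above concrete, here is a small hedged sketch (the ``Ham``/``__spam`` names follow the example in that section; the surrounding script is invented for illustration):

   class Ham:
       def __init__(self):
           self.__spam = 42           # stored under the mangled name _Ham__spam

   h = Ham()
   print h._Ham__spam                 # prints 42
   print hasattr(h, '__spam')         # prints False: outside the class body no mangling occurs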
The value may be approximated in the case of floating\npoint and imaginary (complex) literals. See section *Literals* for\ndetails.\n\nAll literals correspond to immutable data types, and hence the\nobject's identity is less important than its value. Multiple\nevaluations of literals with the same value (either the same\noccurrence in the program text or a different occurrence) may obtain\nthe same object or a different object with the same value.\n", - 'attribute-access': '\nCustomizing attribute access\n****************************\n\nThe following methods can be defined to customize the meaning of\nattribute access (use of, assignment to, or deletion of ``x.name``)\nfor class instances.\n\nobject.__getattr__(self, name)\n\n Called when an attribute lookup has not found the attribute in the\n usual places (i.e. it is not an instance attribute nor is it found\n in the class tree for ``self``). ``name`` is the attribute name.\n This method should return the (computed) attribute value or raise\n an ``AttributeError`` exception.\n\n Note that if the attribute is found through the normal mechanism,\n ``__getattr__()`` is not called. (This is an intentional asymmetry\n between ``__getattr__()`` and ``__setattr__()``.) This is done both\n for efficiency reasons and because otherwise ``__getattr__()``\n would have no way to access other attributes of the instance. Note\n that at least for instance variables, you can fake total control by\n not inserting any values in the instance attribute dictionary (but\n instead inserting them in another object). See the\n ``__getattribute__()`` method below for a way to actually get total\n control in new-style classes.\n\nobject.__setattr__(self, name, value)\n\n Called when an attribute assignment is attempted. This is called\n instead of the normal mechanism (i.e. store the value in the\n instance dictionary). *name* is the attribute name, *value* is the\n value to be assigned to it.\n\n If ``__setattr__()`` wants to assign to an instance attribute, it\n should not simply execute ``self.name = value`` --- this would\n cause a recursive call to itself. Instead, it should insert the\n value in the dictionary of instance attributes, e.g.,\n ``self.__dict__[name] = value``. For new-style classes, rather\n than accessing the instance dictionary, it should call the base\n class method with the same name, for example,\n ``object.__setattr__(self, name, value)``.\n\nobject.__delattr__(self, name)\n\n Like ``__setattr__()`` but for attribute deletion instead of\n assignment. This should only be implemented if ``del obj.name`` is\n meaningful for the object.\n\n\nMore attribute access for new-style classes\n===========================================\n\nThe following methods only apply to new-style classes.\n\nobject.__getattribute__(self, name)\n\n Called unconditionally to implement attribute accesses for\n instances of the class. If the class also defines\n ``__getattr__()``, the latter will not be called unless\n ``__getattribute__()`` either calls it explicitly or raises an\n ``AttributeError``. This method should return the (computed)\n attribute value or raise an ``AttributeError`` exception. 
In order\n to avoid infinite recursion in this method, its implementation\n should always call the base class method with the same name to\n access any attributes it needs, for example,\n ``object.__getattribute__(self, name)``.\n\n Note: This method may still be bypassed when looking up special methods\n as the result of implicit invocation via language syntax or\n built-in functions. See *Special method lookup for new-style\n classes*.\n\n\nImplementing Descriptors\n========================\n\nThe following methods only apply when an instance of the class\ncontaining the method (a so-called *descriptor* class) appears in an\n*owner* class (the descriptor must be in either the owner\'s class\ndictionary or in the class dictionary for one of its parents). In the\nexamples below, "the attribute" refers to the attribute whose name is\nthe key of the property in the owner class\' ``__dict__``.\n\nobject.__get__(self, instance, owner)\n\n Called to get the attribute of the owner class (class attribute\n access) or of an instance of that class (instance attribute\n access). *owner* is always the owner class, while *instance* is the\n instance that the attribute was accessed through, or ``None`` when\n the attribute is accessed through the *owner*. This method should\n return the (computed) attribute value or raise an\n ``AttributeError`` exception.\n\nobject.__set__(self, instance, value)\n\n Called to set the attribute on an instance *instance* of the owner\n class to a new value, *value*.\n\nobject.__delete__(self, instance)\n\n Called to delete the attribute on an instance *instance* of the\n owner class.\n\n\nInvoking Descriptors\n====================\n\nIn general, a descriptor is an object attribute with "binding\nbehavior", one whose attribute access has been overridden by methods\nin the descriptor protocol: ``__get__()``, ``__set__()``, and\n``__delete__()``. If any of those methods are defined for an object,\nit is said to be a descriptor.\n\nThe default behavior for attribute access is to get, set, or delete\nthe attribute from an object\'s dictionary. For instance, ``a.x`` has a\nlookup chain starting with ``a.__dict__[\'x\']``, then\n``type(a).__dict__[\'x\']``, and continuing through the base classes of\n``type(a)`` excluding metaclasses.\n\nHowever, if the looked-up value is an object defining one of the\ndescriptor methods, then Python may override the default behavior and\ninvoke the descriptor method instead. Where this occurs in the\nprecedence chain depends on which descriptor methods were defined and\nhow they were called. 
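As a rough sketch of the descriptor protocol just described (the ``Upper``/``Document`` names are invented for illustration; for simplicity the value is stored on the descriptor itself, so it is shared by all instances):

   class Upper(object):
       def __init__(self):
           self.value = ''
       def __get__(self, instance, owner):
           return self.value
       def __set__(self, instance, value):
           self.value = value.upper()

   class Document(object):            # new-style class, as descriptors require
       title = Upper()

   d = Document()
   d.title = 'hello'                  # routed through Upper.__set__
   print d.title                      # prints HELLO, via Upper.__get__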
Note that descriptors are only invoked for new\nstyle objects or classes (ones that subclass ``object()`` or\n``type()``).\n\nThe starting point for descriptor invocation is a binding, ``a.x``.\nHow the arguments are assembled depends on ``a``:\n\nDirect Call\n The simplest and least common call is when user code directly\n invokes a descriptor method: ``x.__get__(a)``.\n\nInstance Binding\n If binding to a new-style object instance, ``a.x`` is transformed\n into the call: ``type(a).__dict__[\'x\'].__get__(a, type(a))``.\n\nClass Binding\n If binding to a new-style class, ``A.x`` is transformed into the\n call: ``A.__dict__[\'x\'].__get__(None, A)``.\n\nSuper Binding\n If ``a`` is an instance of ``super``, then the binding ``super(B,\n obj).m()`` searches ``obj.__class__.__mro__`` for the base class\n ``A`` immediately preceding ``B`` and then invokes the descriptor\n with the call: ``A.__dict__[\'m\'].__get__(obj, obj.__class__)``.\n\nFor instance bindings, the precedence of descriptor invocation depends\non the which descriptor methods are defined. A descriptor can define\nany combination of ``__get__()``, ``__set__()`` and ``__delete__()``.\nIf it does not define ``__get__()``, then accessing the attribute will\nreturn the descriptor object itself unless there is a value in the\nobject\'s instance dictionary. If the descriptor defines ``__set__()``\nand/or ``__delete__()``, it is a data descriptor; if it defines\nneither, it is a non-data descriptor. Normally, data descriptors\ndefine both ``__get__()`` and ``__set__()``, while non-data\ndescriptors have just the ``__get__()`` method. Data descriptors with\n``__set__()`` and ``__get__()`` defined always override a redefinition\nin an instance dictionary. In contrast, non-data descriptors can be\noverridden by instances.\n\nPython methods (including ``staticmethod()`` and ``classmethod()``)\nare implemented as non-data descriptors. Accordingly, instances can\nredefine and override methods. This allows individual instances to\nacquire behaviors that differ from other instances of the same class.\n\nThe ``property()`` function is implemented as a data descriptor.\nAccordingly, instances cannot override the behavior of a property.\n\n\n__slots__\n=========\n\nBy default, instances of both old and new-style classes have a\ndictionary for attribute storage. This wastes space for objects\nhaving very few instance variables. The space consumption can become\nacute when creating large numbers of instances.\n\nThe default can be overridden by defining *__slots__* in a new-style\nclass definition. The *__slots__* declaration takes a sequence of\ninstance variables and reserves just enough space in each instance to\nhold a value for each variable. Space is saved because *__dict__* is\nnot created for each instance.\n\n__slots__\n\n This class variable can be assigned a string, iterable, or sequence\n of strings with variable names used by instances. If defined in a\n new-style class, *__slots__* reserves space for the declared\n variables and prevents the automatic creation of *__dict__* and\n *__weakref__* for each instance.\n\n New in version 2.2.\n\nNotes on using *__slots__*\n\n* When inheriting from a class without *__slots__*, the *__dict__*\n attribute of that class will always be accessible, so a *__slots__*\n definition in the subclass is meaningless.\n\n* Without a *__dict__* variable, instances cannot be assigned new\n variables not listed in the *__slots__* definition. 
Attempts to\n assign to an unlisted variable name raises ``AttributeError``. If\n dynamic assignment of new variables is desired, then add\n ``\'__dict__\'`` to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding ``\'__dict__\'`` to the\n *__slots__* declaration would not enable the assignment of new\n attributes not specifically listed in the sequence of instance\n variable names.\n\n* Without a *__weakref__* variable for each instance, classes defining\n *__slots__* do not support weak references to its instances. If weak\n reference support is needed, then add ``\'__weakref__\'`` to the\n sequence of strings in the *__slots__* declaration.\n\n Changed in version 2.3: Previously, adding ``\'__weakref__\'`` to the\n *__slots__* declaration would not enable support for weak\n references.\n\n* *__slots__* are implemented at the class level by creating\n descriptors (*Implementing Descriptors*) for each variable name. As\n a result, class attributes cannot be used to set default values for\n instance variables defined by *__slots__*; otherwise, the class\n attribute would overwrite the descriptor assignment.\n\n* The action of a *__slots__* declaration is limited to the class\n where it is defined. As a result, subclasses will have a *__dict__*\n unless they also define *__slots__* (which must only contain names\n of any *additional* slots).\n\n* If a class defines a slot also defined in a base class, the instance\n variable defined by the base class slot is inaccessible (except by\n retrieving its descriptor directly from the base class). This\n renders the meaning of the program undefined. In the future, a\n check may be added to prevent this.\n\n* Nonempty *__slots__* does not work for classes derived from\n "variable-length" built-in types such as ``long``, ``str`` and\n ``tuple``.\n\n* Any non-string iterable may be assigned to *__slots__*. Mappings may\n also be used; however, in the future, special meaning may be\n assigned to the values corresponding to each key.\n\n* *__class__* assignment works only if both classes have the same\n *__slots__*.\n\n Changed in version 2.6: Previously, *__class__* assignment raised an\n error if either new or old class had *__slots__*.\n', - 'attribute-references': '\nAttribute references\n********************\n\nAn attribute reference is a primary followed by a period and a name:\n\n attributeref ::= primary "." identifier\n\nThe primary must evaluate to an object of a type that supports\nattribute references, e.g., a module, list, or an instance. This\nobject is then asked to produce the attribute whose name is the\nidentifier. If this attribute is not available, the exception\n``AttributeError`` is raised. Otherwise, the type and value of the\nobject produced is determined by the object. 
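Returning briefly to *__slots__* above, a minimal sketch of the behaviour it produces (the ``Point`` class is invented for illustration):

   class Point(object):               # new-style class, as __slots__ requires
       __slots__ = ('x', 'y')
       def __init__(self, x, y):
           self.x = x
           self.y = y

   p = Point(1, 2)
   p.x = 10                           # fine: 'x' is a declared slot
   p.z = 3                            # raises AttributeError: no __dict__, 'z' is not a slot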
Multiple evaluations of\nthe same attribute reference may yield different objects.\n', - 'augassign': '\nAugmented assignment statements\n*******************************\n\nAugmented assignment is the combination, in a single statement, of a\nbinary operation and an assignment statement:\n\n augmented_assignment_stmt ::= augtarget augop (expression_list | yield_expression)\n augtarget ::= identifier | attributeref | subscription | slicing\n augop ::= "+=" | "-=" | "*=" | "/=" | "//=" | "%=" | "**="\n | ">>=" | "<<=" | "&=" | "^=" | "|="\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn augmented assignment evaluates the target (which, unlike normal\nassignment statements, cannot be an unpacking) and the expression\nlist, performs the binary operation specific to the type of assignment\non the two operands, and assigns the result to the original target.\nThe target is only evaluated once.\n\nAn augmented assignment expression like ``x += 1`` can be rewritten as\n``x = x + 1`` to achieve a similar, but not exactly equal effect. In\nthe augmented version, ``x`` is only evaluated once. Also, when\npossible, the actual operation is performed *in-place*, meaning that\nrather than creating a new object and assigning that to the target,\nthe old object is modified instead.\n\nWith the exception of assigning to tuples and multiple targets in a\nsingle statement, the assignment done by augmented assignment\nstatements is handled the same way as normal assignments. Similarly,\nwith the exception of the possible *in-place* behavior, the binary\noperation performed by augmented assignment is the same as the normal\nbinary operations.\n\nFor targets which are attribute references, the same *caveat about\nclass and instance attributes* applies as for regular assignments.\n', - 'binary': '\nBinary arithmetic operations\n****************************\n\nThe binary arithmetic operations have the conventional priority\nlevels. Note that some of these operations also apply to certain non-\nnumeric types. Apart from the power operator, there are only two\nlevels, one for multiplicative operators and one for additive\noperators:\n\n m_expr ::= u_expr | m_expr "*" u_expr | m_expr "//" u_expr | m_expr "/" u_expr\n | m_expr "%" u_expr\n a_expr ::= m_expr | a_expr "+" m_expr | a_expr "-" m_expr\n\nThe ``*`` (multiplication) operator yields the product of its\narguments. The arguments must either both be numbers, or one argument\nmust be an integer (plain or long) and the other must be a sequence.\nIn the former case, the numbers are converted to a common type and\nthen multiplied together. In the latter case, sequence repetition is\nperformed; a negative repetition factor yields an empty sequence.\n\nThe ``/`` (division) and ``//`` (floor division) operators yield the\nquotient of their arguments. The numeric arguments are first\nconverted to a common type. Plain or long integer division yields an\ninteger of the same type; the result is that of mathematical division\nwith the \'floor\' function applied to the result. Division by zero\nraises the ``ZeroDivisionError`` exception.\n\nThe ``%`` (modulo) operator yields the remainder from the division of\nthe first argument by the second. The numeric arguments are first\nconverted to a common type. A zero right argument raises the\n``ZeroDivisionError`` exception. The arguments may be floating point\nnumbers, e.g., ``3.14%0.7`` equals ``0.34`` (since ``3.14`` equals\n``4*0.7 + 0.34``.) 
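A short sketch of the *in-place* behaviour described under *Augmented assignment statements* above, using a list (whose ``+=`` is implemented via ``__iadd__``):

   x = [1, 2]
   y = x
   x += [3]             # in-place: the existing list object is extended
   print y              # prints [1, 2, 3] -- y refers to the same, modified list
   x = x + [4]          # creates a new list and rebinds x
   print y              # still prints [1, 2, 3]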
The modulo operator always yields a result with\nthe same sign as its second operand (or zero); the absolute value of\nthe result is strictly smaller than the absolute value of the second\noperand [2].\n\nThe integer division and modulo operators are connected by the\nfollowing identity: ``x == (x/y)*y + (x%y)``. Integer division and\nmodulo are also connected with the built-in function ``divmod()``:\n``divmod(x, y) == (x/y, x%y)``. These identities don\'t hold for\nfloating point numbers; there similar identities hold approximately\nwhere ``x/y`` is replaced by ``floor(x/y)`` or ``floor(x/y) - 1`` [3].\n\nIn addition to performing the modulo operation on numbers, the ``%``\noperator is also overloaded by string and unicode objects to perform\nstring formatting (also known as interpolation). The syntax for string\nformatting is described in the Python Library Reference, section\n*String Formatting Operations*.\n\nDeprecated since version 2.3: The floor division operator, the modulo\noperator, and the ``divmod()`` function are no longer defined for\ncomplex numbers. Instead, convert to a floating point number using\nthe ``abs()`` function if appropriate.\n\nThe ``+`` (addition) operator yields the sum of its arguments. The\narguments must either both be numbers or both sequences of the same\ntype. In the former case, the numbers are converted to a common type\nand then added together. In the latter case, the sequences are\nconcatenated.\n\nThe ``-`` (subtraction) operator yields the difference of its\narguments. The numeric arguments are first converted to a common\ntype.\n', - 'bitwise': '\nBinary bitwise operations\n*************************\n\nEach of the three bitwise operations has a different priority level:\n\n and_expr ::= shift_expr | and_expr "&" shift_expr\n xor_expr ::= and_expr | xor_expr "^" and_expr\n or_expr ::= xor_expr | or_expr "|" xor_expr\n\nThe ``&`` operator yields the bitwise AND of its arguments, which must\nbe plain or long integers. The arguments are converted to a common\ntype.\n\nThe ``^`` operator yields the bitwise XOR (exclusive OR) of its\narguments, which must be plain or long integers. The arguments are\nconverted to a common type.\n\nThe ``|`` operator yields the bitwise (inclusive) OR of its arguments,\nwhich must be plain or long integers. The arguments are converted to\na common type.\n', - 'bltin-code-objects': '\nCode Objects\n************\n\nCode objects are used by the implementation to represent "pseudo-\ncompiled" executable Python code such as a function body. They differ\nfrom function objects because they don\'t contain a reference to their\nglobal execution environment. Code objects are returned by the built-\nin ``compile()`` function and can be extracted from function objects\nthrough their ``func_code`` attribute. See also the ``code`` module.\n\nA code object can be executed or evaluated by passing it (instead of a\nsource string) to the ``exec`` statement or the built-in ``eval()``\nfunction.\n\nSee *The standard type hierarchy* for more information.\n', - 'bltin-ellipsis-object': '\nThe Ellipsis Object\n*******************\n\nThis object is used by extended slice notation (see *Slicings*). It\nsupports no special operations. There is exactly one ellipsis object,\nnamed ``Ellipsis`` (a built-in name).\n\nIt is written as ``Ellipsis``. 
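A quick interactive sketch of the code-object workflow described under *Code Objects* above (``'<string>'`` is just the conventional filename placeholder passed to ``compile()``):

   >>> code = compile('3 * 14', '<string>', 'eval')
   >>> eval(code)
   42
   >>> exec compile("print 'hi'", '<string>', 'exec')
   hi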
When in a subscript, it can also be\nwritten as ``...``, for example ``seq[...]``.\n', - 'bltin-null-object': "\nThe Null Object\n***************\n\nThis object is returned by functions that don't explicitly return a\nvalue. It supports no special operations. There is exactly one null\nobject, named ``None`` (a built-in name).\n\nIt is written as ``None``.\n", - 'bltin-type-objects': "\nType Objects\n************\n\nType objects represent the various object types. An object's type is\naccessed by the built-in function ``type()``. There are no special\noperations on types. The standard module ``types`` defines names for\nall standard built-in types.\n\nTypes are written like this: ``<type 'int'>``.\n", - 'booleans': '\nBoolean operations\n******************\n\n or_test ::= and_test | or_test "or" and_test\n and_test ::= not_test | and_test "and" not_test\n not_test ::= comparison | "not" not_test\n\nIn the context of Boolean operations, and also when expressions are\nused by control flow statements, the following values are interpreted\nas false: ``False``, ``None``, numeric zero of all types, and empty\nstrings and containers (including strings, tuples, lists,\ndictionaries, sets and frozensets). All other values are interpreted\nas true. (See the ``__nonzero__()`` special method for a way to\nchange this.)\n\nThe operator ``not`` yields ``True`` if its argument is false,\n``False`` otherwise.\n\nThe expression ``x and y`` first evaluates *x*; if *x* is false, its\nvalue is returned; otherwise, *y* is evaluated and the resulting value\nis returned.\n\nThe expression ``x or y`` first evaluates *x*; if *x* is true, its\nvalue is returned; otherwise, *y* is evaluated and the resulting value\nis returned.\n\n(Note that neither ``and`` nor ``or`` restrict the value and type they\nreturn to ``False`` and ``True``, but rather return the last evaluated\nargument. This is sometimes useful, e.g., if ``s`` is a string that\nshould be replaced by a default value if it is empty, the expression\n``s or \'foo\'`` yields the desired value. 
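For example, a brief interactive sketch of this short-circuit behaviour:

   >>> s = ''
   >>> s or 'foo'                 # s is empty (false), so 'foo' is returned
   'foo'
   >>> s = 'bar'
   >>> s or 'foo'                 # s is true, so s itself is returned
   'bar'
   >>> 0 and 'never evaluated'    # the right operand is not evaluated at all
   0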
Because ``not`` has to\ninvent a value anyway, it does not bother to return a value of the\nsame type as its argument, so e.g., ``not \'foo\'`` yields ``False``,\nnot ``\'\'``.)\n', - 'break': '\nThe ``break`` statement\n***********************\n\n break_stmt ::= "break"\n\n``break`` may only occur syntactically nested in a ``for`` or\n``while`` loop, but not nested in a function or class definition\nwithin that loop.\n\nIt terminates the nearest enclosing loop, skipping the optional\n``else`` clause if the loop has one.\n\nIf a ``for`` loop is terminated by ``break``, the loop control target\nkeeps its current value.\n\nWhen ``break`` passes control out of a ``try`` statement with a\n``finally`` clause, that ``finally`` clause is executed before really\nleaving the loop.\n', - 'callable-types': '\nEmulating callable objects\n**************************\n\nobject.__call__(self[, args...])\n\n Called when the instance is "called" as a function; if this method\n is defined, ``x(arg1, arg2, ...)`` is a shorthand for\n ``x.__call__(arg1, arg2, ...)``.\n', - 'calls': '\nCalls\n*****\n\nA call calls a callable object (e.g., a *function*) with a possibly\nempty series of *arguments*:\n\n call ::= primary "(" [argument_list [","]\n | expression genexpr_for] ")"\n argument_list ::= positional_arguments ["," keyword_arguments]\n ["," "*" expression] ["," keyword_arguments]\n ["," "**" expression]\n | keyword_arguments ["," "*" expression]\n ["," "**" expression]\n | "*" expression ["," "*" expression] ["," "**" expression]\n | "**" expression\n positional_arguments ::= expression ("," expression)*\n keyword_arguments ::= keyword_item ("," keyword_item)*\n keyword_item ::= identifier "=" expression\n\nA trailing comma may be present after the positional and keyword\narguments but does not affect the semantics.\n\nThe primary must evaluate to a callable object (user-defined\nfunctions, built-in functions, methods of built-in objects, class\nobjects, methods of class instances, and certain class instances\nthemselves are callable; extensions may define additional callable\nobject types). All argument expressions are evaluated before the call\nis attempted. Please refer to section *Function definitions* for the\nsyntax of formal *parameter* lists.\n\nIf keyword arguments are present, they are first converted to\npositional arguments, as follows. First, a list of unfilled slots is\ncreated for the formal parameters. If there are N positional\narguments, they are placed in the first N slots. Next, for each\nkeyword argument, the identifier is used to determine the\ncorresponding slot (if the identifier is the same as the first formal\nparameter name, the first slot is used, and so on). If the slot is\nalready filled, a ``TypeError`` exception is raised. Otherwise, the\nvalue of the argument is placed in the slot, filling it (even if the\nexpression is ``None``, it fills the slot). When all arguments have\nbeen processed, the slots that are still unfilled are filled with the\ncorresponding default value from the function definition. (Default\nvalues are calculated, once, when the function is defined; thus, a\nmutable object such as a list or dictionary used as default value will\nbe shared by all calls that don\'t specify an argument value for the\ncorresponding slot; this should usually be avoided.) If there are any\nunfilled slots for which no default value is specified, a\n``TypeError`` exception is raised. 
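A minimal sketch of the ``__call__()`` hook described under *Emulating callable objects* above (the ``Adder`` class is invented for illustration):

   class Adder:
       def __init__(self, n):
           self.n = n
       def __call__(self, x):
           return self.n + x

   add3 = Adder(3)
   print add3(4)            # prints 7; equivalent to add3.__call__(4)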
Otherwise, the list of filled\nslots is used as the argument list for the call.\n\n**CPython implementation detail:** An implementation may provide\nbuilt-in functions whose positional parameters do not have names, even\nif they are \'named\' for the purpose of documentation, and which\ntherefore cannot be supplied by keyword. In CPython, this is the case\nfor functions implemented in C that use ``PyArg_ParseTuple()`` to\nparse their arguments.\n\nIf there are more positional arguments than there are formal parameter\nslots, a ``TypeError`` exception is raised, unless a formal parameter\nusing the syntax ``*identifier`` is present; in this case, that formal\nparameter receives a tuple containing the excess positional arguments\n(or an empty tuple if there were no excess positional arguments).\n\nIf any keyword argument does not correspond to a formal parameter\nname, a ``TypeError`` exception is raised, unless a formal parameter\nusing the syntax ``**identifier`` is present; in this case, that\nformal parameter receives a dictionary containing the excess keyword\narguments (using the keywords as keys and the argument values as\ncorresponding values), or a (new) empty dictionary if there were no\nexcess keyword arguments.\n\nIf the syntax ``*expression`` appears in the function call,\n``expression`` must evaluate to an iterable. Elements from this\niterable are treated as if they were additional positional arguments;\nif there are positional arguments *x1*, ..., *xN*, and ``expression``\nevaluates to a sequence *y1*, ..., *yM*, this is equivalent to a call\nwith M+N positional arguments *x1*, ..., *xN*, *y1*, ..., *yM*.\n\nA consequence of this is that although the ``*expression`` syntax may\nappear *after* some keyword arguments, it is processed *before* the\nkeyword arguments (and the ``**expression`` argument, if any -- see\nbelow). So:\n\n >>> def f(a, b):\n ... print a, b\n ...\n >>> f(b=1, *(2,))\n 2 1\n >>> f(a=1, *(2,))\n Traceback (most recent call last):\n File "", line 1, in ?\n TypeError: f() got multiple values for keyword argument \'a\'\n >>> f(1, *(2,))\n 1 2\n\nIt is unusual for both keyword arguments and the ``*expression``\nsyntax to be used in the same call, so in practice this confusion does\nnot arise.\n\nIf the syntax ``**expression`` appears in the function call,\n``expression`` must evaluate to a mapping, the contents of which are\ntreated as additional keyword arguments. In the case of a keyword\nappearing in both ``expression`` and as an explicit keyword argument,\na ``TypeError`` exception is raised.\n\nFormal parameters using the syntax ``*identifier`` or ``**identifier``\ncannot be used as positional argument slots or as keyword argument\nnames. Formal parameters using the syntax ``(sublist)`` cannot be\nused as keyword argument names; the outermost sublist corresponds to a\nsingle unnamed argument slot, and the argument value is assigned to\nthe sublist using the usual tuple assignment rules after all other\nparameter processing is done.\n\nA call always returns some value, possibly ``None``, unless it raises\nan exception. How this value is computed depends on the type of the\ncallable object.\n\nIf it is---\n\na user-defined function:\n The code block for the function is executed, passing it the\n argument list. The first thing the code block will do is bind the\n formal parameters to the arguments; this is described in section\n *Function definitions*. 
When the code block executes a ``return``\n statement, this specifies the return value of the function call.\n\na built-in function or method:\n The result is up to the interpreter; see *Built-in Functions* for\n the descriptions of built-in functions and methods.\n\na class object:\n A new instance of that class is returned.\n\na class instance method:\n The corresponding user-defined function is called, with an argument\n list that is one longer than the argument list of the call: the\n instance becomes the first argument.\n\na class instance:\n The class must define a ``__call__()`` method; the effect is then\n the same as if that method was called.\n', - 'class': '\nClass definitions\n*****************\n\nA class definition defines a class object (see section *The standard\ntype hierarchy*):\n\n classdef ::= "class" classname [inheritance] ":" suite\n inheritance ::= "(" [expression_list] ")"\n classname ::= identifier\n\nA class definition is an executable statement. It first evaluates the\ninheritance list, if present. Each item in the inheritance list\nshould evaluate to a class object or class type which allows\nsubclassing. The class\'s suite is then executed in a new execution\nframe (see section *Naming and binding*), using a newly created local\nnamespace and the original global namespace. (Usually, the suite\ncontains only function definitions.) When the class\'s suite finishes\nexecution, its execution frame is discarded but its local namespace is\nsaved. [4] A class object is then created using the inheritance list\nfor the base classes and the saved local namespace for the attribute\ndictionary. The class name is bound to this class object in the\noriginal local namespace.\n\n**Programmer\'s note:** Variables defined in the class definition are\nclass variables; they are shared by all instances. To create instance\nvariables, they can be set in a method with ``self.name = value``.\nBoth class and instance variables are accessible through the notation\n"``self.name``", and an instance variable hides a class variable with\nthe same name when accessed in this way. Class variables can be used\nas defaults for instance variables, but using mutable values there can\nlead to unexpected results. For *new-style class*es, descriptors can\nbe used to create instance variables with different implementation\ndetails.\n\nClass definitions, like function definitions, may be wrapped by one or\nmore *decorator* expressions. The evaluation rules for the decorator\nexpressions are the same as for functions. The result must be a class\nobject, which is then bound to the class name.\n\n-[ Footnotes ]-\n\n[1] The exception is propagated to the invocation stack unless there\n is a ``finally`` clause which happens to raise another exception.\n That new exception causes the old one to be lost.\n\n[2] Currently, control "flows off the end" except in the case of an\n exception or the execution of a ``return``, ``continue``, or\n ``break`` statement.\n\n[3] A string literal appearing as the first statement in the function\n body is transformed into the function\'s ``__doc__`` attribute and\n therefore the function\'s *docstring*.\n\n[4] A string literal appearing as the first statement in the class\n body is transformed into the namespace\'s ``__doc__`` item and\n therefore the class\'s *docstring*.\n', - 'comparisons': '\nComparisons\n***********\n\nUnlike C, all comparison operations in Python have the same priority,\nwhich is lower than that of any arithmetic, shifting or bitwise\noperation. 
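To illustrate the programmer's note above about mutable class variables being shared by all instances, a small sketch (the ``Bag`` class is invented for illustration):

   class Bag:
       items = []                    # class variable: one list shared by every instance
       def add(self, thing):
           self.items.append(thing)  # mutates the shared list

   a = Bag()
   b = Bag()
   a.add('pear')
   print b.items                     # prints ['pear'] -- the change is visible through b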
Also unlike C, expressions like ``a < b < c`` have the\ninterpretation that is conventional in mathematics:\n\n comparison ::= or_expr ( comp_operator or_expr )*\n comp_operator ::= "<" | ">" | "==" | ">=" | "<=" | "<>" | "!="\n | "is" ["not"] | ["not"] "in"\n\nComparisons yield boolean values: ``True`` or ``False``.\n\nComparisons can be chained arbitrarily, e.g., ``x < y <= z`` is\nequivalent to ``x < y and y <= z``, except that ``y`` is evaluated\nonly once (but in both cases ``z`` is not evaluated at all when ``x <\ny`` is found to be false).\n\nFormally, if *a*, *b*, *c*, ..., *y*, *z* are expressions and *op1*,\n*op2*, ..., *opN* are comparison operators, then ``a op1 b op2 c ... y\nopN z`` is equivalent to ``a op1 b and b op2 c and ... y opN z``,\nexcept that each expression is evaluated at most once.\n\nNote that ``a op1 b op2 c`` doesn\'t imply any kind of comparison\nbetween *a* and *c*, so that, e.g., ``x < y > z`` is perfectly legal\n(though perhaps not pretty).\n\nThe forms ``<>`` and ``!=`` are equivalent; for consistency with C,\n``!=`` is preferred; where ``!=`` is mentioned below ``<>`` is also\naccepted. The ``<>`` spelling is considered obsolescent.\n\nThe operators ``<``, ``>``, ``==``, ``>=``, ``<=``, and ``!=`` compare\nthe values of two objects. The objects need not have the same type.\nIf both are numbers, they are converted to a common type. Otherwise,\nobjects of different types *always* compare unequal, and are ordered\nconsistently but arbitrarily. You can control comparison behavior of\nobjects of non-built-in types by defining a ``__cmp__`` method or rich\ncomparison methods like ``__gt__``, described in section *Special\nmethod names*.\n\n(This unusual definition of comparison was used to simplify the\ndefinition of operations like sorting and the ``in`` and ``not in``\noperators. In the future, the comparison rules for objects of\ndifferent types are likely to change.)\n\nComparison of objects of the same type depends on the type:\n\n* Numbers are compared arithmetically.\n\n* Strings are compared lexicographically using the numeric equivalents\n (the result of the built-in function ``ord()``) of their characters.\n Unicode and 8-bit strings are fully interoperable in this behavior.\n [4]\n\n* Tuples and lists are compared lexicographically using comparison of\n corresponding elements. This means that to compare equal, each\n element must compare equal and the two sequences must be of the same\n type and have the same length.\n\n If not equal, the sequences are ordered the same as their first\n differing elements. For example, ``cmp([1,2,x], [1,2,y])`` returns\n the same as ``cmp(x,y)``. If the corresponding element does not\n exist, the shorter sequence is ordered first (for example, ``[1,2] <\n [1,2,3]``).\n\n* Mappings (dictionaries) compare equal if and only if their sorted\n (key, value) lists compare equal. [5] Outcomes other than equality\n are resolved consistently, but are not otherwise defined. [6]\n\n* Most other objects of built-in types compare unequal unless they are\n the same object; the choice whether one object is considered smaller\n or larger than another one is made arbitrarily but consistently\n within one execution of a program.\n\nThe operators ``in`` and ``not in`` test for collection membership.\n``x in s`` evaluates to true if *x* is a member of the collection *s*,\nand false otherwise. ``x not in s`` returns the negation of ``x in\ns``. 
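A short interactive sketch of the chaining rules described above:

   >>> x = 2
   >>> 1 < x < 3            # equivalent to (1 < x) and (x < 3), with x evaluated once
   True
   >>> 1 < x > 0            # legal, though perhaps not pretty
   True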
The collection membership test has traditionally been bound to\nsequences; an object is a member of a collection if the collection is\na sequence and contains an element equal to that object. However, it\nmake sense for many other object types to support membership tests\nwithout being a sequence. In particular, dictionaries (for keys) and\nsets support membership testing.\n\nFor the list and tuple types, ``x in y`` is true if and only if there\nexists an index *i* such that ``x == y[i]`` is true.\n\nFor the Unicode and string types, ``x in y`` is true if and only if\n*x* is a substring of *y*. An equivalent test is ``y.find(x) != -1``.\nNote, *x* and *y* need not be the same type; consequently, ``u\'ab\' in\n\'abc\'`` will return ``True``. Empty strings are always considered to\nbe a substring of any other string, so ``"" in "abc"`` will return\n``True``.\n\nChanged in version 2.3: Previously, *x* was required to be a string of\nlength ``1``.\n\nFor user-defined classes which define the ``__contains__()`` method,\n``x in y`` is true if and only if ``y.__contains__(x)`` is true.\n\nFor user-defined classes which do not define ``__contains__()`` but do\ndefine ``__iter__()``, ``x in y`` is true if some value ``z`` with ``x\n== z`` is produced while iterating over ``y``. If an exception is\nraised during the iteration, it is as if ``in`` raised that exception.\n\nLastly, the old-style iteration protocol is tried: if a class defines\n``__getitem__()``, ``x in y`` is true if and only if there is a non-\nnegative integer index *i* such that ``x == y[i]``, and all lower\ninteger indices do not raise ``IndexError`` exception. (If any other\nexception is raised, it is as if ``in`` raised that exception).\n\nThe operator ``not in`` is defined to have the inverse true value of\n``in``.\n\nThe operators ``is`` and ``is not`` test for object identity: ``x is\ny`` is true if and only if *x* and *y* are the same object. ``x is\nnot y`` yields the inverse truth value. [7]\n', - 'compound': '\nCompound statements\n*******************\n\nCompound statements contain (groups of) other statements; they affect\nor control the execution of those other statements in some way. In\ngeneral, compound statements span multiple lines, although in simple\nincarnations a whole compound statement may be contained in one line.\n\nThe ``if``, ``while`` and ``for`` statements implement traditional\ncontrol flow constructs. ``try`` specifies exception handlers and/or\ncleanup code for a group of statements. Function and class\ndefinitions are also syntactically compound statements.\n\nCompound statements consist of one or more \'clauses.\' A clause\nconsists of a header and a \'suite.\' The clause headers of a\nparticular compound statement are all at the same indentation level.\nEach clause header begins with a uniquely identifying keyword and ends\nwith a colon. A suite is a group of statements controlled by a\nclause. A suite can be one or more semicolon-separated simple\nstatements on the same line as the header, following the header\'s\ncolon, or it can be one or more indented statements on subsequent\nlines. 
Only the latter form of suite can contain nested compound\nstatements; the following is illegal, mostly because it wouldn\'t be\nclear to which ``if`` clause a following ``else`` clause would belong:\n\n if test1: if test2: print x\n\nAlso note that the semicolon binds tighter than the colon in this\ncontext, so that in the following example, either all or none of the\n``print`` statements are executed:\n\n if x < y < z: print x; print y; print z\n\nSummarizing:\n\n compound_stmt ::= if_stmt\n | while_stmt\n | for_stmt\n | try_stmt\n | with_stmt\n | funcdef\n | classdef\n | decorated\n suite ::= stmt_list NEWLINE | NEWLINE INDENT statement+ DEDENT\n statement ::= stmt_list NEWLINE | compound_stmt\n stmt_list ::= simple_stmt (";" simple_stmt)* [";"]\n\nNote that statements always end in a ``NEWLINE`` possibly followed by\na ``DEDENT``. Also note that optional continuation clauses always\nbegin with a keyword that cannot start a statement, thus there are no\nambiguities (the \'dangling ``else``\' problem is solved in Python by\nrequiring nested ``if`` statements to be indented).\n\nThe formatting of the grammar rules in the following sections places\neach clause on a separate line for clarity.\n\n\nThe ``if`` statement\n====================\n\nThe ``if`` statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the ``if`` statement is executed or evaluated).\nIf all expressions are false, the suite of the ``else`` clause, if\npresent, is executed.\n\n\nThe ``while`` statement\n=======================\n\nThe ``while`` statement is used for repeated execution as long as an\nexpression is true:\n\n while_stmt ::= "while" expression ":" suite\n ["else" ":" suite]\n\nThis repeatedly tests the expression and, if it is true, executes the\nfirst suite; if the expression is false (which may be the first time\nit is tested) the suite of the ``else`` clause, if present, is\nexecuted and the loop terminates.\n\nA ``break`` statement executed in the first suite terminates the loop\nwithout executing the ``else`` clause\'s suite. A ``continue``\nstatement executed in the first suite skips the rest of the suite and\ngoes back to testing the expression.\n\n\nThe ``for`` statement\n=====================\n\nThe ``for`` statement is used to iterate over the elements of a\nsequence (such as a string, tuple or list) or other iterable object:\n\n for_stmt ::= "for" target_list "in" expression_list ":" suite\n ["else" ":" suite]\n\nThe expression list is evaluated once; it should yield an iterable\nobject. An iterator is created for the result of the\n``expression_list``. The suite is then executed once for each item\nprovided by the iterator, in the order of ascending indices. Each\nitem in turn is assigned to the target list using the standard rules\nfor assignments, and then the suite is executed. When the items are\nexhausted (which is immediately when the sequence is empty), the suite\nin the ``else`` clause, if present, is executed, and the loop\nterminates.\n\nA ``break`` statement executed in the first suite terminates the loop\nwithout executing the ``else`` clause\'s suite. 
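A small sketch of how ``break`` interacts with a loop's ``else`` clause (the prime-finding loop is a conventional illustration, not part of the reference text):

   for n in range(2, 8):
       for divisor in range(2, n):
           if n % divisor == 0:
               print n, '=', divisor, '*', n // divisor
               break
       else:                         # runs only if the inner loop did not break
           print n, 'is prime'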
A ``continue``\nstatement executed in the first suite skips the rest of the suite and\ncontinues with the next item, or with the ``else`` clause if there was\nno next item.\n\nThe suite may assign to the variable(s) in the target list; this does\nnot affect the next item assigned to it.\n\nThe target list is not deleted when the loop is finished, but if the\nsequence is empty, it will not have been assigned to at all by the\nloop. Hint: the built-in function ``range()`` returns a sequence of\nintegers suitable to emulate the effect of Pascal\'s ``for i := a to b\ndo``; e.g., ``range(3)`` returns the list ``[0, 1, 2]``.\n\nNote: There is a subtlety when the sequence is being modified by the loop\n (this can only occur for mutable sequences, i.e. lists). An internal\n counter is used to keep track of which item is used next, and this\n is incremented on each iteration. When this counter has reached the\n length of the sequence the loop terminates. This means that if the\n suite deletes the current (or a previous) item from the sequence,\n the next item will be skipped (since it gets the index of the\n current item which has already been treated). Likewise, if the\n suite inserts an item in the sequence before the current item, the\n current item will be treated again the next time through the loop.\n This can lead to nasty bugs that can be avoided by making a\n temporary copy using a slice of the whole sequence, e.g.,\n\n for x in a[:]:\n if x < 0: a.remove(x)\n\n\nThe ``try`` statement\n=====================\n\nThe ``try`` statement specifies exception handlers and/or cleanup code\nfor a group of statements:\n\n try_stmt ::= try1_stmt | try2_stmt\n try1_stmt ::= "try" ":" suite\n ("except" [expression [("as" | ",") target]] ":" suite)+\n ["else" ":" suite]\n ["finally" ":" suite]\n try2_stmt ::= "try" ":" suite\n "finally" ":" suite\n\nChanged in version 2.5: In previous versions of Python,\n``try``...``except``...``finally`` did not work. ``try``...``except``\nhad to be nested in ``try``...``finally``.\n\nThe ``except`` clause(s) specify one or more exception handlers. When\nno exception occurs in the ``try`` clause, no exception handler is\nexecuted. When an exception occurs in the ``try`` suite, a search for\nan exception handler is started. This search inspects the except\nclauses in turn until one is found that matches the exception. An\nexpression-less except clause, if present, must be last; it matches\nany exception. For an except clause with an expression, that\nexpression is evaluated, and the clause matches the exception if the\nresulting object is "compatible" with the exception. An object is\ncompatible with an exception if it is the class or a base class of the\nexception object, or a tuple containing an item compatible with the\nexception.\n\nIf no except clause matches the exception, the search for an exception\nhandler continues in the surrounding code and on the invocation stack.\n[1]\n\nIf the evaluation of an expression in the header of an except clause\nraises an exception, the original search for a handler is canceled and\na search starts for the new exception in the surrounding code and on\nthe call stack (it is treated as if the entire ``try`` statement\nraised the exception).\n\nWhen a matching except clause is found, the exception is assigned to\nthe target specified in that except clause, if present, and the except\nclause\'s suite is executed. All except clauses must have an\nexecutable block. 
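A brief sketch showing ``except``, ``else`` and ``finally`` clauses working together (the ``divide()`` function is invented for illustration):

   def divide(a, b):
       try:
           result = a / b
       except ZeroDivisionError:
           print 'division by zero!'
       else:
           print 'result is', result
       finally:
           print 'executing finally clause'

   divide(4, 2)     # prints the result, then the finally clause runs
   divide(4, 0)     # the handler runs, then the finally clause runs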
When the end of this block is reached, execution\ncontinues normally after the entire try statement. (This means that\nif two nested handlers exist for the same exception, and the exception\noccurs in the try clause of the inner handler, the outer handler will\nnot handle the exception.)\n\nBefore an except clause\'s suite is executed, details about the\nexception are assigned to three variables in the ``sys`` module:\n``sys.exc_type`` receives the object identifying the exception;\n``sys.exc_value`` receives the exception\'s parameter;\n``sys.exc_traceback`` receives a traceback object (see section *The\nstandard type hierarchy*) identifying the point in the program where\nthe exception occurred. These details are also available through the\n``sys.exc_info()`` function, which returns a tuple ``(exc_type,\nexc_value, exc_traceback)``. Use of the corresponding variables is\ndeprecated in favor of this function, since their use is unsafe in a\nthreaded program. As of Python 1.5, the variables are restored to\ntheir previous values (before the call) when returning from a function\nthat handled an exception.\n\nThe optional ``else`` clause is executed if and when control flows off\nthe end of the ``try`` clause. [2] Exceptions in the ``else`` clause\nare not handled by the preceding ``except`` clauses.\n\nIf ``finally`` is present, it specifies a \'cleanup\' handler. The\n``try`` clause is executed, including any ``except`` and ``else``\nclauses. If an exception occurs in any of the clauses and is not\nhandled, the exception is temporarily saved. The ``finally`` clause is\nexecuted. If there is a saved exception, it is re-raised at the end\nof the ``finally`` clause. If the ``finally`` clause raises another\nexception or executes a ``return`` or ``break`` statement, the saved\nexception is discarded:\n\n >>> def f():\n ... try:\n ... 1/0\n ... finally:\n ... return 42\n ...\n >>> f()\n 42\n\nThe exception information is not available to the program during\nexecution of the ``finally`` clause.\n\nWhen a ``return``, ``break`` or ``continue`` statement is executed in\nthe ``try`` suite of a ``try``...``finally`` statement, the\n``finally`` clause is also executed \'on the way out.\' A ``continue``\nstatement is illegal in the ``finally`` clause. (The reason is a\nproblem with the current implementation --- this restriction may be\nlifted in the future).\n\nThe return value of a function is determined by the last ``return``\nstatement executed. Since the ``finally`` clause always executes, a\n``return`` statement executed in the ``finally`` clause will always be\nthe last one executed:\n\n >>> def foo():\n ... try:\n ... return \'try\'\n ... finally:\n ... return \'finally\'\n ...\n >>> foo()\n \'finally\'\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information on using the ``raise`` statement to\ngenerate exceptions may be found in section *The raise statement*.\n\n\nThe ``with`` statement\n======================\n\nNew in version 2.5.\n\nThe ``with`` statement is used to wrap the execution of a block with\nmethods defined by a context manager (see section *With Statement\nContext Managers*). This allows common\n``try``...``except``...``finally`` usage patterns to be encapsulated\nfor convenient reuse.\n\n with_stmt ::= "with" with_item ("," with_item)* ":" suite\n with_item ::= expression ["as" target]\n\nThe execution of the ``with`` statement with one "item" proceeds as\nfollows:\n\n1. 
The context expression (the expression given in the ``with_item``)\n is evaluated to obtain a context manager.\n\n2. The context manager\'s ``__exit__()`` is loaded for later use.\n\n3. The context manager\'s ``__enter__()`` method is invoked.\n\n4. If a target was included in the ``with`` statement, the return\n value from ``__enter__()`` is assigned to it.\n\n Note: The ``with`` statement guarantees that if the ``__enter__()``\n method returns without an error, then ``__exit__()`` will always\n be called. Thus, if an error occurs during the assignment to the\n target list, it will be treated the same as an error occurring\n within the suite would be. See step 6 below.\n\n5. The suite is executed.\n\n6. The context manager\'s ``__exit__()`` method is invoked. If an\n exception caused the suite to be exited, its type, value, and\n traceback are passed as arguments to ``__exit__()``. Otherwise,\n three ``None`` arguments are supplied.\n\n If the suite was exited due to an exception, and the return value\n from the ``__exit__()`` method was false, the exception is\n reraised. If the return value was true, the exception is\n suppressed, and execution continues with the statement following\n the ``with`` statement.\n\n If the suite was exited for any reason other than an exception, the\n return value from ``__exit__()`` is ignored, and execution proceeds\n at the normal location for the kind of exit that was taken.\n\nWith more than one item, the context managers are processed as if\nmultiple ``with`` statements were nested:\n\n with A() as a, B() as b:\n suite\n\nis equivalent to\n\n with A() as a:\n with B() as b:\n suite\n\nNote: In Python 2.5, the ``with`` statement is only allowed when the\n ``with_statement`` feature has been enabled. It is always enabled\n in Python 2.6.\n\nChanged in version 2.7: Support for multiple context expressions.\n\nSee also:\n\n **PEP 0343** - The "with" statement\n The specification, background, and examples for the Python\n ``with`` statement.\n\n\nFunction definitions\n====================\n\nA function definition defines a user-defined function object (see\nsection *The standard type hierarchy*):\n\n decorated ::= decorators (classdef | funcdef)\n decorators ::= decorator+\n decorator ::= "@" dotted_name ["(" [argument_list [","]] ")"] NEWLINE\n funcdef ::= "def" funcname "(" [parameter_list] ")" ":" suite\n dotted_name ::= identifier ("." identifier)*\n parameter_list ::= (defparameter ",")*\n ( "*" identifier ["," "**" identifier]\n | "**" identifier\n | defparameter [","] )\n defparameter ::= parameter ["=" expression]\n sublist ::= parameter ("," parameter)* [","]\n parameter ::= identifier | "(" sublist ")"\n funcname ::= identifier\n\nA function definition is an executable statement. Its execution binds\nthe function name in the current local namespace to a function object\n(a wrapper around the executable code for the function). This\nfunction object contains a reference to the current global namespace\nas the global namespace to be used when the function is called.\n\nThe function definition does not execute the function body; this gets\nexecuted only when the function is called. [3]\n\nA function definition may be wrapped by one or more *decorator*\nexpressions. Decorator expressions are evaluated when the function is\ndefined, in the scope that contains the function definition. The\nresult must be a callable, which is invoked with the function object\nas the only argument. 
The returned value is bound to the function name\ninstead of the function object. Multiple decorators are applied in\nnested fashion. For example, the following code:\n\n @f1(arg)\n @f2\n def func(): pass\n\nis equivalent to:\n\n def func(): pass\n func = f1(arg)(f2(func))\n\nWhen one or more top-level *parameters* have the form *parameter*\n``=`` *expression*, the function is said to have "default parameter\nvalues." For a parameter with a default value, the corresponding\n*argument* may be omitted from a call, in which case the parameter\'s\ndefault value is substituted. If a parameter has a default value, all\nfollowing parameters must also have a default value --- this is a\nsyntactic restriction that is not expressed by the grammar.\n\n**Default parameter values are evaluated when the function definition\nis executed.** This means that the expression is evaluated once, when\nthe function is defined, and that the same "pre-computed" value is\nused for each call. This is especially important to understand when a\ndefault parameter is a mutable object, such as a list or a dictionary:\nif the function modifies the object (e.g. by appending an item to a\nlist), the default value is in effect modified. This is generally not\nwhat was intended. A way around this is to use ``None`` as the\ndefault, and explicitly test for it in the body of the function, e.g.:\n\n def whats_on_the_telly(penguin=None):\n if penguin is None:\n penguin = []\n penguin.append("property of the zoo")\n return penguin\n\nFunction call semantics are described in more detail in section\n*Calls*. A function call always assigns values to all parameters\nmentioned in the parameter list, either from position arguments, from\nkeyword arguments, or from default values. If the form\n"``*identifier``" is present, it is initialized to a tuple receiving\nany excess positional parameters, defaulting to the empty tuple. If\nthe form "``**identifier``" is present, it is initialized to a new\ndictionary receiving any excess keyword arguments, defaulting to a new\nempty dictionary.\n\nIt is also possible to create anonymous functions (functions not bound\nto a name), for immediate use in expressions. This uses lambda\nexpressions, described in section *Lambdas*. Note that the lambda\nexpression is merely a shorthand for a simplified function definition;\na function defined in a "``def``" statement can be passed around or\nassigned to another name just like a function defined by a lambda\nexpression. The "``def``" form is actually more powerful since it\nallows the execution of multiple statements.\n\n**Programmer\'s note:** Functions are first-class objects. A "``def``"\nform executed inside a function definition defines a local function\nthat can be returned or passed around. Free variables used in the\nnested function can access the local variables of the function\ncontaining the def. See section *Naming and binding* for details.\n\n\nClass definitions\n=================\n\nA class definition defines a class object (see section *The standard\ntype hierarchy*):\n\n classdef ::= "class" classname [inheritance] ":" suite\n inheritance ::= "(" [expression_list] ")"\n classname ::= identifier\n\nA class definition is an executable statement. It first evaluates the\ninheritance list, if present. Each item in the inheritance list\nshould evaluate to a class object or class type which allows\nsubclassing. 
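A small sketch of the ``*identifier`` and ``**identifier`` parameter forms described above (the ``report()`` function and its arguments are invented for illustration):

   def report(first, *rest, **options):
       print first              # 1
       print rest               # (2, 3) -- excess positional arguments, as a tuple
       print options            # {'flag': True} -- excess keyword arguments, as a dict

   report(1, 2, 3, flag=True)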
The class\'s suite is then executed in a new execution\nframe (see section *Naming and binding*), using a newly created local\nnamespace and the original global namespace. (Usually, the suite\ncontains only function definitions.) When the class\'s suite finishes\nexecution, its execution frame is discarded but its local namespace is\nsaved. [4] A class object is then created using the inheritance list\nfor the base classes and the saved local namespace for the attribute\ndictionary. The class name is bound to this class object in the\noriginal local namespace.\n\n**Programmer\'s note:** Variables defined in the class definition are\nclass variables; they are shared by all instances. To create instance\nvariables, they can be set in a method with ``self.name = value``.\nBoth class and instance variables are accessible through the notation\n"``self.name``", and an instance variable hides a class variable with\nthe same name when accessed in this way. Class variables can be used\nas defaults for instance variables, but using mutable values there can\nlead to unexpected results. For *new-style class*es, descriptors can\nbe used to create instance variables with different implementation\ndetails.\n\nClass definitions, like function definitions, may be wrapped by one or\nmore *decorator* expressions. The evaluation rules for the decorator\nexpressions are the same as for functions. The result must be a class\nobject, which is then bound to the class name.\n\n-[ Footnotes ]-\n\n[1] The exception is propagated to the invocation stack unless there\n is a ``finally`` clause which happens to raise another exception.\n That new exception causes the old one to be lost.\n\n[2] Currently, control "flows off the end" except in the case of an\n exception or the execution of a ``return``, ``continue``, or\n ``break`` statement.\n\n[3] A string literal appearing as the first statement in the function\n body is transformed into the function\'s ``__doc__`` attribute and\n therefore the function\'s *docstring*.\n\n[4] A string literal appearing as the first statement in the class\n body is transformed into the namespace\'s ``__doc__`` item and\n therefore the class\'s *docstring*.\n', - 'context-managers': '\nWith Statement Context Managers\n*******************************\n\nNew in version 2.5.\n\nA *context manager* is an object that defines the runtime context to\nbe established when executing a ``with`` statement. The context\nmanager handles the entry into, and the exit from, the desired runtime\ncontext for the execution of the block of code. Context managers are\nnormally invoked using the ``with`` statement (described in section\n*The with statement*), but can also be used by directly invoking their\nmethods.\n\nTypical uses of context managers include saving and restoring various\nkinds of global state, locking and unlocking resources, closing opened\nfiles, etc.\n\nFor more information on context managers, see *Context Manager Types*.\n\nobject.__enter__(self)\n\n Enter the runtime context related to this object. The ``with``\n statement will bind this method\'s return value to the target(s)\n specified in the ``as`` clause of the statement, if any.\n\nobject.__exit__(self, exc_type, exc_value, traceback)\n\n Exit the runtime context related to this object. The parameters\n describe the exception that caused the context to be exited. 
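A minimal sketch of this ``__enter__()``/``__exit__()`` protocol, using an
illustrative class (the name ``Tracer`` and the printed messages are not part
of the specification):

    class Tracer(object):
        # Illustrative context manager that reports entry and exit.
        def __enter__(self):
            print "entering the runtime context"
            return self                   # bound to the target after 'as', if any
        def __exit__(self, exc_type, exc_value, traceback):
            print "exiting; exception type:", exc_type
            return False                  # a false value: do not suppress the exception

    with Tracer() as t:
        print "inside the block"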
If the\n context was exited without an exception, all three arguments will\n be ``None``.\n\n If an exception is supplied, and the method wishes to suppress the\n exception (i.e., prevent it from being propagated), it should\n return a true value. Otherwise, the exception will be processed\n normally upon exit from this method.\n\n Note that ``__exit__()`` methods should not reraise the passed-in\n exception; this is the caller\'s responsibility.\n\nSee also:\n\n **PEP 0343** - The "with" statement\n The specification, background, and examples for the Python\n ``with`` statement.\n', - 'continue': '\nThe ``continue`` statement\n**************************\n\n continue_stmt ::= "continue"\n\n``continue`` may only occur syntactically nested in a ``for`` or\n``while`` loop, but not nested in a function or class definition or\n``finally`` clause within that loop. It continues with the next cycle\nof the nearest enclosing loop.\n\nWhen ``continue`` passes control out of a ``try`` statement with a\n``finally`` clause, that ``finally`` clause is executed before really\nstarting the next loop cycle.\n', - 'conversions': '\nArithmetic conversions\n**********************\n\nWhen a description of an arithmetic operator below uses the phrase\n"the numeric arguments are converted to a common type," the arguments\nare coerced using the coercion rules listed at *Coercion rules*. If\nboth arguments are standard numeric types, the following coercions are\napplied:\n\n* If either argument is a complex number, the other is converted to\n complex;\n\n* otherwise, if either argument is a floating point number, the other\n is converted to floating point;\n\n* otherwise, if either argument is a long integer, the other is\n converted to long integer;\n\n* otherwise, both must be plain integers and no conversion is\n necessary.\n\nSome additional rules apply for certain operators (e.g., a string left\nargument to the \'%\' operator). Extensions can define their own\ncoercions.\n', - 'customization': '\nBasic customization\n*******************\n\nobject.__new__(cls[, ...])\n\n Called to create a new instance of class *cls*. ``__new__()`` is a\n static method (special-cased so you need not declare it as such)\n that takes the class of which an instance was requested as its\n first argument. The remaining arguments are those passed to the\n object constructor expression (the call to the class). The return\n value of ``__new__()`` should be the new object instance (usually\n an instance of *cls*).\n\n Typical implementations create a new instance of the class by\n invoking the superclass\'s ``__new__()`` method using\n ``super(currentclass, cls).__new__(cls[, ...])`` with appropriate\n arguments and then modifying the newly-created instance as\n necessary before returning it.\n\n If ``__new__()`` returns an instance of *cls*, then the new\n instance\'s ``__init__()`` method will be invoked like\n ``__init__(self[, ...])``, where *self* is the new instance and the\n remaining arguments are the same as were passed to ``__new__()``.\n\n If ``__new__()`` does not return an instance of *cls*, then the new\n instance\'s ``__init__()`` method will not be invoked.\n\n ``__new__()`` is intended mainly to allow subclasses of immutable\n types (like int, str, or tuple) to customize instance creation. It\n is also commonly overridden in custom metaclasses in order to\n customize class creation.\n\nobject.__init__(self[, ...])\n\n Called when the instance is created. 
The arguments are those\n passed to the class constructor expression. If a base class has an\n ``__init__()`` method, the derived class\'s ``__init__()`` method,\n if any, must explicitly call it to ensure proper initialization of\n the base class part of the instance; for example:\n ``BaseClass.__init__(self, [args...])``. As a special constraint\n on constructors, no value may be returned; doing so will cause a\n ``TypeError`` to be raised at runtime.\n\nobject.__del__(self)\n\n Called when the instance is about to be destroyed. This is also\n called a destructor. If a base class has a ``__del__()`` method,\n the derived class\'s ``__del__()`` method, if any, must explicitly\n call it to ensure proper deletion of the base class part of the\n instance. Note that it is possible (though not recommended!) for\n the ``__del__()`` method to postpone destruction of the instance by\n creating a new reference to it. It may then be called at a later\n time when this new reference is deleted. It is not guaranteed that\n ``__del__()`` methods are called for objects that still exist when\n the interpreter exits.\n\n Note: ``del x`` doesn\'t directly call ``x.__del__()`` --- the former\n decrements the reference count for ``x`` by one, and the latter\n is only called when ``x``\'s reference count reaches zero. Some\n common situations that may prevent the reference count of an\n object from going to zero include: circular references between\n objects (e.g., a doubly-linked list or a tree data structure with\n parent and child pointers); a reference to the object on the\n stack frame of a function that caught an exception (the traceback\n stored in ``sys.exc_traceback`` keeps the stack frame alive); or\n a reference to the object on the stack frame that raised an\n unhandled exception in interactive mode (the traceback stored in\n ``sys.last_traceback`` keeps the stack frame alive). The first\n situation can only be remedied by explicitly breaking the cycles;\n the latter two situations can be resolved by storing ``None`` in\n ``sys.exc_traceback`` or ``sys.last_traceback``. Circular\n references which are garbage are detected when the option cycle\n detector is enabled (it\'s on by default), but can only be cleaned\n up if there are no Python-level ``__del__()`` methods involved.\n Refer to the documentation for the ``gc`` module for more\n information about how ``__del__()`` methods are handled by the\n cycle detector, particularly the description of the ``garbage``\n value.\n\n Warning: Due to the precarious circumstances under which ``__del__()``\n methods are invoked, exceptions that occur during their execution\n are ignored, and a warning is printed to ``sys.stderr`` instead.\n Also, when ``__del__()`` is invoked in response to a module being\n deleted (e.g., when execution of the program is done), other\n globals referenced by the ``__del__()`` method may already have\n been deleted or in the process of being torn down (e.g. the\n import machinery shutting down). For this reason, ``__del__()``\n methods should do the absolute minimum needed to maintain\n external invariants. 
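As a sketch of a ``__del__()`` that keeps to that minimum, releasing a single
external resource and nothing more (the class and the file path are purely
illustrative):

    class TempHandle(object):
        def __init__(self, path):
            self._fp = open(path, "w")    # external resource owned by the instance
        def __del__(self):
            try:
                self._fp.close()          # minimal, idempotent cleanup only
            except Exception:
                pass                      # never let __del__ propagate an error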
Starting with version 1.5, Python\n guarantees that globals whose name begins with a single\n underscore are deleted from their module before other globals are\n deleted; if no other references to such globals exist, this may\n help in assuring that imported modules are still available at the\n time when the ``__del__()`` method is called.\n\n See also the *-R* command-line option.\n\nobject.__repr__(self)\n\n Called by the ``repr()`` built-in function and by string\n conversions (reverse quotes) to compute the "official" string\n representation of an object. If at all possible, this should look\n like a valid Python expression that could be used to recreate an\n object with the same value (given an appropriate environment). If\n this is not possible, a string of the form ``<...some useful\n description...>`` should be returned. The return value must be a\n string object. If a class defines ``__repr__()`` but not\n ``__str__()``, then ``__repr__()`` is also used when an "informal"\n string representation of instances of that class is required.\n\n This is typically used for debugging, so it is important that the\n representation is information-rich and unambiguous.\n\nobject.__str__(self)\n\n Called by the ``str()`` built-in function and by the ``print``\n statement to compute the "informal" string representation of an\n object. This differs from ``__repr__()`` in that it does not have\n to be a valid Python expression: a more convenient or concise\n representation may be used instead. The return value must be a\n string object.\n\nobject.__lt__(self, other)\nobject.__le__(self, other)\nobject.__eq__(self, other)\nobject.__ne__(self, other)\nobject.__gt__(self, other)\nobject.__ge__(self, other)\n\n New in version 2.1.\n\n These are the so-called "rich comparison" methods, and are called\n for comparison operators in preference to ``__cmp__()`` below. The\n correspondence between operator symbols and method names is as\n follows: ``xy`` call ``x.__ne__(y)``, ``x>y`` calls ``x.__gt__(y)``, and\n ``x>=y`` calls ``x.__ge__(y)``.\n\n A rich comparison method may return the singleton\n ``NotImplemented`` if it does not implement the operation for a\n given pair of arguments. By convention, ``False`` and ``True`` are\n returned for a successful comparison. However, these methods can\n return any value, so if the comparison operator is used in a\n Boolean context (e.g., in the condition of an ``if`` statement),\n Python will call ``bool()`` on the value to determine if the result\n is true or false.\n\n There are no implied relationships among the comparison operators.\n The truth of ``x==y`` does not imply that ``x!=y`` is false.\n Accordingly, when defining ``__eq__()``, one should also define\n ``__ne__()`` so that the operators will behave as expected. 
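A small sketch of defining ``__eq__()`` together with ``__ne__()`` in the way
recommended above (the ``Pair`` class is purely illustrative):

    class Pair(object):
        def __init__(self, x, y):
            self.x, self.y = x, y
        def __eq__(self, other):
            if not isinstance(other, Pair):
                return NotImplemented     # let the other operand's method be tried
            return self.x == other.x and self.y == other.y
        def __ne__(self, other):
            result = self.__eq__(other)
            return result if result is NotImplemented else not result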
See\n the paragraph on ``__hash__()`` for some important notes on\n creating *hashable* objects which support custom comparison\n operations and are usable as dictionary keys.\n\n There are no swapped-argument versions of these methods (to be used\n when the left argument does not support the operation but the right\n argument does); rather, ``__lt__()`` and ``__gt__()`` are each\n other\'s reflection, ``__le__()`` and ``__ge__()`` are each other\'s\n reflection, and ``__eq__()`` and ``__ne__()`` are their own\n reflection.\n\n Arguments to rich comparison methods are never coerced.\n\n To automatically generate ordering operations from a single root\n operation, see ``functools.total_ordering()``.\n\nobject.__cmp__(self, other)\n\n Called by comparison operations if rich comparison (see above) is\n not defined. Should return a negative integer if ``self < other``,\n zero if ``self == other``, a positive integer if ``self > other``.\n If no ``__cmp__()``, ``__eq__()`` or ``__ne__()`` operation is\n defined, class instances are compared by object identity\n ("address"). See also the description of ``__hash__()`` for some\n important notes on creating *hashable* objects which support custom\n comparison operations and are usable as dictionary keys. (Note: the\n restriction that exceptions are not propagated by ``__cmp__()`` has\n been removed since Python 1.5.)\n\nobject.__rcmp__(self, other)\n\n Changed in version 2.1: No longer supported.\n\nobject.__hash__(self)\n\n Called by built-in function ``hash()`` and for operations on\n members of hashed collections including ``set``, ``frozenset``, and\n ``dict``. ``__hash__()`` should return an integer. The only\n required property is that objects which compare equal have the same\n hash value; it is advised to somehow mix together (e.g. using\n exclusive or) the hash values for the components of the object that\n also play a part in comparison of objects.\n\n If a class does not define a ``__cmp__()`` or ``__eq__()`` method\n it should not define a ``__hash__()`` operation either; if it\n defines ``__cmp__()`` or ``__eq__()`` but not ``__hash__()``, its\n instances will not be usable in hashed collections. If a class\n defines mutable objects and implements a ``__cmp__()`` or\n ``__eq__()`` method, it should not implement ``__hash__()``, since\n hashable collection implementations require that a object\'s hash\n value is immutable (if the object\'s hash value changes, it will be\n in the wrong hash bucket).\n\n User-defined classes have ``__cmp__()`` and ``__hash__()`` methods\n by default; with them, all objects compare unequal (except with\n themselves) and ``x.__hash__()`` returns a result derived from\n ``id(x)``.\n\n Classes which inherit a ``__hash__()`` method from a parent class\n but change the meaning of ``__cmp__()`` or ``__eq__()`` such that\n the hash value returned is no longer appropriate (e.g. 
by switching\n to a value-based concept of equality instead of the default\n identity based equality) can explicitly flag themselves as being\n unhashable by setting ``__hash__ = None`` in the class definition.\n Doing so means that not only will instances of the class raise an\n appropriate ``TypeError`` when a program attempts to retrieve their\n hash value, but they will also be correctly identified as\n unhashable when checking ``isinstance(obj, collections.Hashable)``\n (unlike classes which define their own ``__hash__()`` to explicitly\n raise ``TypeError``).\n\n Changed in version 2.5: ``__hash__()`` may now also return a long\n integer object; the 32-bit integer is then derived from the hash of\n that object.\n\n Changed in version 2.6: ``__hash__`` may now be set to ``None`` to\n explicitly flag instances of a class as unhashable.\n\nobject.__nonzero__(self)\n\n Called to implement truth value testing and the built-in operation\n ``bool()``; should return ``False`` or ``True``, or their integer\n equivalents ``0`` or ``1``. When this method is not defined,\n ``__len__()`` is called, if it is defined, and the object is\n considered true if its result is nonzero. If a class defines\n neither ``__len__()`` nor ``__nonzero__()``, all its instances are\n considered true.\n\nobject.__unicode__(self)\n\n Called to implement ``unicode()`` built-in; should return a Unicode\n object. When this method is not defined, string conversion is\n attempted, and the result of string conversion is converted to\n Unicode using the system default encoding.\n', - 'debugger': '\n``pdb`` --- The Python Debugger\n*******************************\n\nThe module ``pdb`` defines an interactive source code debugger for\nPython programs. It supports setting (conditional) breakpoints and\nsingle stepping at the source line level, inspection of stack frames,\nsource code listing, and evaluation of arbitrary Python code in the\ncontext of any stack frame. It also supports post-mortem debugging\nand can be called under program control.\n\nThe debugger is extensible --- it is actually defined as the class\n``Pdb``. This is currently undocumented but easily understood by\nreading the source. The extension interface uses the modules ``bdb``\nand ``cmd``.\n\nThe debugger\'s prompt is ``(Pdb)``. Typical usage to run a program\nunder control of the debugger is:\n\n >>> import pdb\n >>> import mymodule\n >>> pdb.run(\'mymodule.test()\')\n > (0)?()\n (Pdb) continue\n > (1)?()\n (Pdb) continue\n NameError: \'spam\'\n > (1)?()\n (Pdb)\n\n``pdb.py`` can also be invoked as a script to debug other scripts.\nFor example:\n\n python -m pdb myscript.py\n\nWhen invoked as a script, pdb will automatically enter post-mortem\ndebugging if the program being debugged exits abnormally. After post-\nmortem debugging (or after normal exit of the program), pdb will\nrestart the program. Automatic restarting preserves pdb\'s state (such\nas breakpoints) and in most cases is more useful than quitting the\ndebugger upon program\'s exit.\n\nNew in version 2.4: Restarting post-mortem behavior added.\n\nThe typical usage to break into the debugger from a running program is\nto insert\n\n import pdb; pdb.set_trace()\n\nat the location you want to break into the debugger. 
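For instance, a script might be instrumented as follows; the function and the
argument values are only illustrative:

    def average(values):
        import pdb; pdb.set_trace()       # execution pauses here at the (Pdb) prompt
        return sum(values) / len(values)

    print average([2, 4, 6])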
You can then\nstep through the code following this statement, and continue running\nwithout the debugger using the ``c`` command.\n\nThe typical usage to inspect a crashed program is:\n\n >>> import pdb\n >>> import mymodule\n >>> mymodule.test()\n Traceback (most recent call last):\n File "", line 1, in ?\n File "./mymodule.py", line 4, in test\n test2()\n File "./mymodule.py", line 3, in test2\n print spam\n NameError: spam\n >>> pdb.pm()\n > ./mymodule.py(3)test2()\n -> print spam\n (Pdb)\n\nThe module defines the following functions; each enters the debugger\nin a slightly different way:\n\npdb.run(statement[, globals[, locals]])\n\n Execute the *statement* (given as a string) under debugger control.\n The debugger prompt appears before any code is executed; you can\n set breakpoints and type ``continue``, or you can step through the\n statement using ``step`` or ``next`` (all these commands are\n explained below). The optional *globals* and *locals* arguments\n specify the environment in which the code is executed; by default\n the dictionary of the module ``__main__`` is used. (See the\n explanation of the ``exec`` statement or the ``eval()`` built-in\n function.)\n\npdb.runeval(expression[, globals[, locals]])\n\n Evaluate the *expression* (given as a string) under debugger\n control. When ``runeval()`` returns, it returns the value of the\n expression. Otherwise this function is similar to ``run()``.\n\npdb.runcall(function[, argument, ...])\n\n Call the *function* (a function or method object, not a string)\n with the given arguments. When ``runcall()`` returns, it returns\n whatever the function call returned. The debugger prompt appears\n as soon as the function is entered.\n\npdb.set_trace()\n\n Enter the debugger at the calling stack frame. This is useful to\n hard-code a breakpoint at a given point in a program, even if the\n code is not otherwise being debugged (e.g. when an assertion\n fails).\n\npdb.post_mortem([traceback])\n\n Enter post-mortem debugging of the given *traceback* object. If no\n *traceback* is given, it uses the one of the exception that is\n currently being handled (an exception must be being handled if the\n default is to be used).\n\npdb.pm()\n\n Enter post-mortem debugging of the traceback found in\n ``sys.last_traceback``.\n\nThe ``run*`` functions and ``set_trace()`` are aliases for\ninstantiating the ``Pdb`` class and calling the method of the same\nname. If you want to access further features, you have to do this\nyourself:\n\nclass class pdb.Pdb(completekey=\'tab\', stdin=None, stdout=None, skip=None)\n\n ``Pdb`` is the debugger class.\n\n The *completekey*, *stdin* and *stdout* arguments are passed to the\n underlying ``cmd.Cmd`` class; see the description there.\n\n The *skip* argument, if given, must be an iterable of glob-style\n module name patterns. The debugger will not step into frames that\n originate in a module that matches one of these patterns. [1]\n\n Example call to enable tracing with *skip*:\n\n import pdb; pdb.Pdb(skip=[\'django.*\']).set_trace()\n\n New in version 2.7: The *skip* argument.\n\n run(statement[, globals[, locals]])\n runeval(expression[, globals[, locals]])\n runcall(function[, argument, ...])\n set_trace()\n\n See the documentation for the functions explained above.\n', - 'del': '\nThe ``del`` statement\n*********************\n\n del_stmt ::= "del" target_list\n\nDeletion is recursively defined very similar to the way assignment is\ndefined. 
Rather than spelling it out in full details, here are some\nhints.\n\nDeletion of a target list recursively deletes each target, from left\nto right.\n\nDeletion of a name removes the binding of that name from the local or\nglobal namespace, depending on whether the name occurs in a ``global``\nstatement in the same code block. If the name is unbound, a\n``NameError`` exception will be raised.\n\nIt is illegal to delete a name from the local namespace if it occurs\nas a free variable in a nested block.\n\nDeletion of attribute references, subscriptions and slicings is passed\nto the primary object involved; deletion of a slicing is in general\nequivalent to assignment of an empty slice of the right type (but even\nthis is determined by the sliced object).\n', - 'dict': '\nDictionary displays\n*******************\n\nA dictionary display is a possibly empty series of key/datum pairs\nenclosed in curly braces:\n\n dict_display ::= "{" [key_datum_list | dict_comprehension] "}"\n key_datum_list ::= key_datum ("," key_datum)* [","]\n key_datum ::= expression ":" expression\n dict_comprehension ::= expression ":" expression comp_for\n\nA dictionary display yields a new dictionary object.\n\nIf a comma-separated sequence of key/datum pairs is given, they are\nevaluated from left to right to define the entries of the dictionary:\neach key object is used as a key into the dictionary to store the\ncorresponding datum. This means that you can specify the same key\nmultiple times in the key/datum list, and the final dictionary\'s value\nfor that key will be the last one given.\n\nA dict comprehension, in contrast to list and set comprehensions,\nneeds two expressions separated with a colon followed by the usual\n"for" and "if" clauses. When the comprehension is run, the resulting\nkey and value elements are inserted in the new dictionary in the order\nthey are produced.\n\nRestrictions on the types of the key values are listed earlier in\nsection *The standard type hierarchy*. (To summarize, the key type\nshould be *hashable*, which excludes all mutable objects.) Clashes\nbetween duplicate keys are not detected; the last datum (textually\nrightmost in the display) stored for a given key value prevails.\n', - 'dynamic-features': '\nInteraction with dynamic features\n*********************************\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. An error will be reported at compile time.\n\nIf the wild card form of import --- ``import *`` --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a ``SyntaxError``.\n\nIf ``exec`` is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n``SyntaxError`` unless the exec explicitly specifies the local\nnamespace for the ``exec``. (In other words, ``exec obj`` would be\nillegal, but ``exec obj in ns`` would be legal.)\n\nThe ``eval()``, ``execfile()``, and ``input()`` functions and the\n``exec`` statement do not have access to the full environment for\nresolving names. Names may be resolved in the local and global\nnamespaces of the caller. Free variables are not resolved in the\nnearest enclosing namespace, but in the global namespace. 
[1] The\n``exec`` statement and the ``eval()`` and ``execfile()`` functions\nhave optional arguments to override the global and local namespace.\nIf only one namespace is specified, it is used for both.\n', - 'else': '\nThe ``if`` statement\n********************\n\nThe ``if`` statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the ``if`` statement is executed or evaluated).\nIf all expressions are false, the suite of the ``else`` clause, if\npresent, is executed.\n', - 'exceptions': '\nExceptions\n**********\n\nExceptions are a means of breaking out of the normal flow of control\nof a code block in order to handle errors or other exceptional\nconditions. An exception is *raised* at the point where the error is\ndetected; it may be *handled* by the surrounding code block or by any\ncode block that directly or indirectly invoked the code block where\nthe error occurred.\n\nThe Python interpreter raises an exception when it detects a run-time\nerror (such as division by zero). A Python program can also\nexplicitly raise an exception with the ``raise`` statement. Exception\nhandlers are specified with the ``try`` ... ``except`` statement. The\n``finally`` clause of such a statement can be used to specify cleanup\ncode which does not handle the exception, but is executed whether an\nexception occurred or not in the preceding code.\n\nPython uses the "termination" model of error handling: an exception\nhandler can find out what happened and continue execution at an outer\nlevel, but it cannot repair the cause of the error and retry the\nfailing operation (except by re-entering the offending piece of code\nfrom the top).\n\nWhen an exception is not handled at all, the interpreter terminates\nexecution of the program, or returns to its interactive main loop. In\neither case, it prints a stack backtrace, except when the exception is\n``SystemExit``.\n\nExceptions are identified by class instances. The ``except`` clause\nis selected depending on the class of the instance: it must reference\nthe class of the instance or a base class thereof. The instance can\nbe received by the handler and can carry additional information about\nthe exceptional condition.\n\nExceptions can also be identified by strings, in which case the\n``except`` clause is selected by object identity. An arbitrary value\ncan be raised along with the identifying string which can be passed to\nthe handler.\n\nNote: Messages to exceptions are not part of the Python API. Their\n contents may change from one version of Python to the next without\n warning and should not be relied on by code which will run under\n multiple versions of the interpreter.\n\nSee also the description of the ``try`` statement in section *The try\nstatement* and ``raise`` statement in section *The raise statement*.\n\n-[ Footnotes ]-\n\n[1] This limitation occurs because the code that is executed by these\n operations is not available at the time the module is compiled.\n', - 'exec': '\nThe ``exec`` statement\n**********************\n\n exec_stmt ::= "exec" or_expr ["in" expression ["," expression]]\n\nThis statement supports dynamic execution of Python code. 
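For example, using the Python 2 statement form described below (the code
string and the namespace dictionary are arbitrary):

    code = "x = 6 * 7"            # a string parsed as a suite of statements
    namespace = {}
    exec code in namespace        # the tuple form exec(code, namespace) is equivalent
    print namespace['x']          # prints 42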
The first\nexpression should evaluate to either a Unicode string, a *Latin-1*\nencoded string, an open file object, a code object, or a tuple. If it\nis a string, the string is parsed as a suite of Python statements\nwhich is then executed (unless a syntax error occurs). [1] If it is an\nopen file, the file is parsed until EOF and executed. If it is a code\nobject, it is simply executed. For the interpretation of a tuple, see\nbelow. In all cases, the code that\'s executed is expected to be valid\nas file input (see section *File input*). Be aware that the\n``return`` and ``yield`` statements may not be used outside of\nfunction definitions even within the context of code passed to the\n``exec`` statement.\n\nIn all cases, if the optional parts are omitted, the code is executed\nin the current scope. If only the first expression after ``in`` is\nspecified, it should be a dictionary, which will be used for both the\nglobal and the local variables. If two expressions are given, they\nare used for the global and local variables, respectively. If\nprovided, *locals* can be any mapping object. Remember that at module\nlevel, globals and locals are the same dictionary. If two separate\nobjects are given as *globals* and *locals*, the code will be executed\nas if it were embedded in a class definition.\n\nThe first expression may also be a tuple of length 2 or 3. In this\ncase, the optional parts must be omitted. The form ``exec(expr,\nglobals)`` is equivalent to ``exec expr in globals``, while the form\n``exec(expr, globals, locals)`` is equivalent to ``exec expr in\nglobals, locals``. The tuple form of ``exec`` provides compatibility\nwith Python 3, where ``exec`` is a function rather than a statement.\n\nChanged in version 2.4: Formerly, *locals* was required to be a\ndictionary.\n\nAs a side effect, an implementation may insert additional keys into\nthe dictionaries given besides those corresponding to variable names\nset by the executed code. For example, the current implementation may\nadd a reference to the dictionary of the built-in module\n``__builtin__`` under the key ``__builtins__`` (!).\n\n**Programmer\'s hints:** dynamic evaluation of expressions is supported\nby the built-in function ``eval()``. The built-in functions\n``globals()`` and ``locals()`` return the current global and local\ndictionary, respectively, which may be useful to pass around for use\nby ``exec``.\n\n-[ Footnotes ]-\n\n[1] Note that the parser only accepts the Unix-style end of line\n convention. If you are reading the code from a file, make sure to\n use *universal newlines* mode to convert Windows or Mac-style\n newlines.\n', - 'execmodel': '\nExecution model\n***************\n\n\nNaming and binding\n==================\n\n*Names* refer to objects. Names are introduced by name binding\noperations. Each occurrence of a name in the program text refers to\nthe *binding* of that name established in the innermost function block\ncontaining the use.\n\nA *block* is a piece of Python program text that is executed as a\nunit. The following are blocks: a module, a function body, and a class\ndefinition. Each command typed interactively is a block. A script\nfile (a file given as standard input to the interpreter or specified\non the interpreter command line the first argument) is a code block.\nA script command (a command specified on the interpreter command line\nwith the \'**-c**\' option) is a code block. The file read by the\nbuilt-in function ``execfile()`` is a code block. 
The string argument\npassed to the built-in function ``eval()`` and to the ``exec``\nstatement is a code block. The expression read and evaluated by the\nbuilt-in function ``input()`` is a code block.\n\nA code block is executed in an *execution frame*. A frame contains\nsome administrative information (used for debugging) and determines\nwhere and how execution continues after the code block\'s execution has\ncompleted.\n\nA *scope* defines the visibility of a name within a block. If a local\nvariable is defined in a block, its scope includes that block. If the\ndefinition occurs in a function block, the scope extends to any blocks\ncontained within the defining one, unless a contained block introduces\na different binding for the name. The scope of names defined in a\nclass block is limited to the class block; it does not extend to the\ncode blocks of methods -- this includes generator expressions since\nthey are implemented using a function scope. This means that the\nfollowing will fail:\n\n class A:\n a = 42\n b = list(a + i for i in range(10))\n\nWhen a name is used in a code block, it is resolved using the nearest\nenclosing scope. The set of all such scopes visible to a code block\nis called the block\'s *environment*.\n\nIf a name is bound in a block, it is a local variable of that block.\nIf a name is bound at the module level, it is a global variable. (The\nvariables of the module code block are local and global.) If a\nvariable is used in a code block but not defined there, it is a *free\nvariable*.\n\nWhen a name is not found at all, a ``NameError`` exception is raised.\nIf the name refers to a local variable that has not been bound, a\n``UnboundLocalError`` exception is raised. ``UnboundLocalError`` is a\nsubclass of ``NameError``.\n\nThe following constructs bind names: formal parameters to functions,\n``import`` statements, class and function definitions (these bind the\nclass or function name in the defining block), and targets that are\nidentifiers if occurring in an assignment, ``for`` loop header, in the\nsecond position of an ``except`` clause header or after ``as`` in a\n``with`` statement. The ``import`` statement of the form ``from ...\nimport *`` binds all names defined in the imported module, except\nthose beginning with an underscore. This form may only be used at the\nmodule level.\n\nA target occurring in a ``del`` statement is also considered bound for\nthis purpose (though the actual semantics are to unbind the name). It\nis illegal to unbind a name that is referenced by an enclosing scope;\nthe compiler will report a ``SyntaxError``.\n\nEach assignment or import statement occurs within a block defined by a\nclass or function definition or at the module level (the top-level\ncode block).\n\nIf a name binding operation occurs anywhere within a code block, all\nuses of the name within the block are treated as references to the\ncurrent block. This can lead to errors when a name is used within a\nblock before it is bound. This rule is subtle. Python lacks\ndeclarations and allows name binding operations to occur anywhere\nwithin a code block. The local variables of a code block can be\ndetermined by scanning the entire text of the block for name binding\noperations.\n\nIf the global statement occurs within a block, all uses of the name\nspecified in the statement refer to the binding of that name in the\ntop-level namespace. Names are resolved in the top-level namespace by\nsearching the global namespace, i.e. 
the namespace of the module\ncontaining the code block, and the builtins namespace, the namespace\nof the module ``__builtin__``. The global namespace is searched\nfirst. If the name is not found there, the builtins namespace is\nsearched. The global statement must precede all uses of the name.\n\nThe builtins namespace associated with the execution of a code block\nis actually found by looking up the name ``__builtins__`` in its\nglobal namespace; this should be a dictionary or a module (in the\nlatter case the module\'s dictionary is used). By default, when in the\n``__main__`` module, ``__builtins__`` is the built-in module\n``__builtin__`` (note: no \'s\'); when in any other module,\n``__builtins__`` is an alias for the dictionary of the ``__builtin__``\nmodule itself. ``__builtins__`` can be set to a user-created\ndictionary to create a weak form of restricted execution.\n\n**CPython implementation detail:** Users should not touch\n``__builtins__``; it is strictly an implementation detail. Users\nwanting to override values in the builtins namespace should ``import``\nthe ``__builtin__`` (no \'s\') module and modify its attributes\nappropriately.\n\nThe namespace for a module is automatically created the first time a\nmodule is imported. The main module for a script is always called\n``__main__``.\n\nThe ``global`` statement has the same scope as a name binding\noperation in the same block. If the nearest enclosing scope for a\nfree variable contains a global statement, the free variable is\ntreated as a global.\n\nA class definition is an executable statement that may use and define\nnames. These references follow the normal rules for name resolution.\nThe namespace of the class definition becomes the attribute dictionary\nof the class. Names defined at the class scope are not visible in\nmethods.\n\n\nInteraction with dynamic features\n---------------------------------\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. An error will be reported at compile time.\n\nIf the wild card form of import --- ``import *`` --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a ``SyntaxError``.\n\nIf ``exec`` is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n``SyntaxError`` unless the exec explicitly specifies the local\nnamespace for the ``exec``. (In other words, ``exec obj`` would be\nillegal, but ``exec obj in ns`` would be legal.)\n\nThe ``eval()``, ``execfile()``, and ``input()`` functions and the\n``exec`` statement do not have access to the full environment for\nresolving names. Names may be resolved in the local and global\nnamespaces of the caller. Free variables are not resolved in the\nnearest enclosing namespace, but in the global namespace. [1] The\n``exec`` statement and the ``eval()`` and ``execfile()`` functions\nhave optional arguments to override the global and local namespace.\nIf only one namespace is specified, it is used for both.\n\n\nExceptions\n==========\n\nExceptions are a means of breaking out of the normal flow of control\nof a code block in order to handle errors or other exceptional\nconditions. 
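As a brief illustration of raising and handling an exception (the particular
error is arbitrary):

    try:
        result = 1 / 0                    # the error is detected and raised here
    except ZeroDivisionError as exc:      # the handler receives the instance
        print "handled:", exc
    finally:
        print "cleanup runs whether or not an exception occurred"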
An exception is *raised* at the point where the error is\ndetected; it may be *handled* by the surrounding code block or by any\ncode block that directly or indirectly invoked the code block where\nthe error occurred.\n\nThe Python interpreter raises an exception when it detects a run-time\nerror (such as division by zero). A Python program can also\nexplicitly raise an exception with the ``raise`` statement. Exception\nhandlers are specified with the ``try`` ... ``except`` statement. The\n``finally`` clause of such a statement can be used to specify cleanup\ncode which does not handle the exception, but is executed whether an\nexception occurred or not in the preceding code.\n\nPython uses the "termination" model of error handling: an exception\nhandler can find out what happened and continue execution at an outer\nlevel, but it cannot repair the cause of the error and retry the\nfailing operation (except by re-entering the offending piece of code\nfrom the top).\n\nWhen an exception is not handled at all, the interpreter terminates\nexecution of the program, or returns to its interactive main loop. In\neither case, it prints a stack backtrace, except when the exception is\n``SystemExit``.\n\nExceptions are identified by class instances. The ``except`` clause\nis selected depending on the class of the instance: it must reference\nthe class of the instance or a base class thereof. The instance can\nbe received by the handler and can carry additional information about\nthe exceptional condition.\n\nExceptions can also be identified by strings, in which case the\n``except`` clause is selected by object identity. An arbitrary value\ncan be raised along with the identifying string which can be passed to\nthe handler.\n\nNote: Messages to exceptions are not part of the Python API. Their\n contents may change from one version of Python to the next without\n warning and should not be relied on by code which will run under\n multiple versions of the interpreter.\n\nSee also the description of the ``try`` statement in section *The try\nstatement* and ``raise`` statement in section *The raise statement*.\n\n-[ Footnotes ]-\n\n[1] This limitation occurs because the code that is executed by these\n operations is not available at the time the module is compiled.\n', - 'exprlists': '\nExpression lists\n****************\n\n expression_list ::= expression ( "," expression )* [","]\n\nAn expression list containing at least one comma yields a tuple. The\nlength of the tuple is the number of expressions in the list. The\nexpressions are evaluated from left to right.\n\nThe trailing comma is required only to create a single tuple (a.k.a. a\n*singleton*); it is optional in all other cases. A single expression\nwithout a trailing comma doesn\'t create a tuple, but rather yields the\nvalue of that expression. (To create an empty tuple, use an empty pair\nof parentheses: ``()``.)\n', - 'floating': '\nFloating point literals\n***********************\n\nFloating point literals are described by the following lexical\ndefinitions:\n\n floatnumber ::= pointfloat | exponentfloat\n pointfloat ::= [intpart] fraction | intpart "."\n exponentfloat ::= (intpart | pointfloat) exponent\n intpart ::= digit+\n fraction ::= "." digit+\n exponent ::= ("e" | "E") ["+" | "-"] digit+\n\nNote that the integer and exponent parts of floating point numbers can\nlook like octal integers, but are interpreted using radix 10. For\nexample, ``077e010`` is legal, and denotes the same number as\n``77e10``. 
The allowed range of floating point literals is\nimplementation-dependent. Some examples of floating point literals:\n\n 3.14 10. .001 1e100 3.14e-10 0e0\n\nNote that numeric literals do not include a sign; a phrase like ``-1``\nis actually an expression composed of the unary operator ``-`` and the\nliteral ``1``.\n', - 'for': '\nThe ``for`` statement\n*********************\n\nThe ``for`` statement is used to iterate over the elements of a\nsequence (such as a string, tuple or list) or other iterable object:\n\n for_stmt ::= "for" target_list "in" expression_list ":" suite\n ["else" ":" suite]\n\nThe expression list is evaluated once; it should yield an iterable\nobject. An iterator is created for the result of the\n``expression_list``. The suite is then executed once for each item\nprovided by the iterator, in the order of ascending indices. Each\nitem in turn is assigned to the target list using the standard rules\nfor assignments, and then the suite is executed. When the items are\nexhausted (which is immediately when the sequence is empty), the suite\nin the ``else`` clause, if present, is executed, and the loop\nterminates.\n\nA ``break`` statement executed in the first suite terminates the loop\nwithout executing the ``else`` clause\'s suite. A ``continue``\nstatement executed in the first suite skips the rest of the suite and\ncontinues with the next item, or with the ``else`` clause if there was\nno next item.\n\nThe suite may assign to the variable(s) in the target list; this does\nnot affect the next item assigned to it.\n\nThe target list is not deleted when the loop is finished, but if the\nsequence is empty, it will not have been assigned to at all by the\nloop. Hint: the built-in function ``range()`` returns a sequence of\nintegers suitable to emulate the effect of Pascal\'s ``for i := a to b\ndo``; e.g., ``range(3)`` returns the list ``[0, 1, 2]``.\n\nNote: There is a subtlety when the sequence is being modified by the loop\n (this can only occur for mutable sequences, i.e. lists). An internal\n counter is used to keep track of which item is used next, and this\n is incremented on each iteration. When this counter has reached the\n length of the sequence the loop terminates. This means that if the\n suite deletes the current (or a previous) item from the sequence,\n the next item will be skipped (since it gets the index of the\n current item which has already been treated). Likewise, if the\n suite inserts an item in the sequence before the current item, the\n current item will be treated again the next time through the loop.\n This can lead to nasty bugs that can be avoided by making a\n temporary copy using a slice of the whole sequence, e.g.,\n\n for x in a[:]:\n if x < 0: a.remove(x)\n', - 'formatstrings': '\nFormat String Syntax\n********************\n\nThe ``str.format()`` method and the ``Formatter`` class share the same\nsyntax for format strings (although in the case of ``Formatter``,\nsubclasses can define their own format string syntax).\n\nFormat strings contain "replacement fields" surrounded by curly braces\n``{}``. Anything that is not contained in braces is considered literal\ntext, which is copied unchanged to the output. If you need to include\na brace character in the literal text, it can be escaped by doubling:\n``{{`` and ``}}``.\n\nThe grammar for a replacement field is as follows:\n\n replacement_field ::= "{" [field_name] ["!" conversion] [":" format_spec] "}"\n field_name ::= arg_name ("." 
attribute_name | "[" element_index "]")*\n arg_name ::= [identifier | integer]\n attribute_name ::= identifier\n element_index ::= integer | index_string\n index_string ::= +\n conversion ::= "r" | "s"\n format_spec ::= \n\nIn less formal terms, the replacement field can start with a\n*field_name* that specifies the object whose value is to be formatted\nand inserted into the output instead of the replacement field. The\n*field_name* is optionally followed by a *conversion* field, which is\npreceded by an exclamation point ``\'!\'``, and a *format_spec*, which\nis preceded by a colon ``\':\'``. These specify a non-default format\nfor the replacement value.\n\nSee also the *Format Specification Mini-Language* section.\n\nThe *field_name* itself begins with an *arg_name* that is either a\nnumber or a keyword. If it\'s a number, it refers to a positional\nargument, and if it\'s a keyword, it refers to a named keyword\nargument. If the numerical arg_names in a format string are 0, 1, 2,\n... in sequence, they can all be omitted (not just some) and the\nnumbers 0, 1, 2, ... will be automatically inserted in that order.\nBecause *arg_name* is not quote-delimited, it is not possible to\nspecify arbitrary dictionary keys (e.g., the strings ``\'10\'`` or\n``\':-]\'``) within a format string. The *arg_name* can be followed by\nany number of index or attribute expressions. An expression of the\nform ``\'.name\'`` selects the named attribute using ``getattr()``,\nwhile an expression of the form ``\'[index]\'`` does an index lookup\nusing ``__getitem__()``.\n\nChanged in version 2.7: The positional argument specifiers can be\nomitted, so ``\'{} {}\'`` is equivalent to ``\'{0} {1}\'``.\n\nSome simple format string examples:\n\n "First, thou shalt count to {0}" # References first positional argument\n "Bring me a {}" # Implicitly references the first positional argument\n "From {} to {}" # Same as "From {0} to {1}"\n "My quest is {name}" # References keyword argument \'name\'\n "Weight in tons {0.weight}" # \'weight\' attribute of first positional arg\n "Units destroyed: {players[0]}" # First element of keyword argument \'players\'.\n\nThe *conversion* field causes a type coercion before formatting.\nNormally, the job of formatting a value is done by the\n``__format__()`` method of the value itself. However, in some cases\nit is desirable to force a type to be formatted as a string,\noverriding its own definition of formatting. By converting the value\nto a string before calling ``__format__()``, the normal formatting\nlogic is bypassed.\n\nTwo conversion flags are currently supported: ``\'!s\'`` which calls\n``str()`` on the value, and ``\'!r\'`` which calls ``repr()``.\n\nSome examples:\n\n "Harold\'s a clever {0!s}" # Calls str() on the argument first\n "Bring out the holy {name!r}" # Calls repr() on the argument first\n\nThe *format_spec* field contains a specification of how the value\nshould be presented, including such details as field width, alignment,\npadding, decimal precision and so on. Each value type can define its\nown "formatting mini-language" or interpretation of the *format_spec*.\n\nMost built-in types support a common formatting mini-language, which\nis described in the next section.\n\nA *format_spec* field can also include nested replacement fields\nwithin it. These nested replacement fields can contain only a field\nname; conversion flags and format specifications are not allowed. 
The\nreplacement fields within the format_spec are substituted before the\n*format_spec* string is interpreted. This allows the formatting of a\nvalue to be dynamically specified.\n\nSee the *Format examples* section for some examples.\n\n\nFormat Specification Mini-Language\n==================================\n\n"Format specifications" are used within replacement fields contained\nwithin a format string to define how individual values are presented\n(see *Format String Syntax*). They can also be passed directly to the\nbuilt-in ``format()`` function. Each formattable type may define how\nthe format specification is to be interpreted.\n\nMost built-in types implement the following options for format\nspecifications, although some of the formatting options are only\nsupported by the numeric types.\n\nA general convention is that an empty format string (``""``) produces\nthe same result as if you had called ``str()`` on the value. A non-\nempty format string typically modifies the result.\n\nThe general form of a *standard format specifier* is:\n\n format_spec ::= [[fill]align][sign][#][0][width][,][.precision][type]\n fill ::= \n align ::= "<" | ">" | "=" | "^"\n sign ::= "+" | "-" | " "\n width ::= integer\n precision ::= integer\n type ::= "b" | "c" | "d" | "e" | "E" | "f" | "F" | "g" | "G" | "n" | "o" | "s" | "x" | "X" | "%"\n\nIf a valid *align* value is specified, it can be preceded by a *fill*\ncharacter that can be any character and defaults to a space if\nomitted. Note that it is not possible to use ``{`` and ``}`` as *fill*\nchar while using the ``str.format()`` method; this limitation however\ndoesn\'t affect the ``format()`` function.\n\nThe meaning of the various alignment options is as follows:\n\n +-----------+------------------------------------------------------------+\n | Option | Meaning |\n +===========+============================================================+\n | ``\'<\'`` | Forces the field to be left-aligned within the available |\n | | space (this is the default for most objects). |\n +-----------+------------------------------------------------------------+\n | ``\'>\'`` | Forces the field to be right-aligned within the available |\n | | space (this is the default for numbers). |\n +-----------+------------------------------------------------------------+\n | ``\'=\'`` | Forces the padding to be placed after the sign (if any) |\n | | but before the digits. This is used for printing fields |\n | | in the form \'+000000120\'. This alignment option is only |\n | | valid for numeric types. |\n +-----------+------------------------------------------------------------+\n | ``\'^\'`` | Forces the field to be centered within the available |\n | | space. |\n +-----------+------------------------------------------------------------+\n\nNote that unless a minimum field width is defined, the field width\nwill always be the same size as the data to fill it, so that the\nalignment option has no meaning in this case.\n\nThe *sign* option is only valid for number types, and can be one of\nthe following:\n\n +-----------+------------------------------------------------------------+\n | Option | Meaning |\n +===========+============================================================+\n | ``\'+\'`` | indicates that a sign should be used for both positive as |\n | | well as negative numbers. |\n +-----------+------------------------------------------------------------+\n | ``\'-\'`` | indicates that a sign should be used only for negative |\n | | numbers (this is the default behavior). 
|\n +-----------+------------------------------------------------------------+\n | space | indicates that a leading space should be used on positive |\n | | numbers, and a minus sign on negative numbers. |\n +-----------+------------------------------------------------------------+\n\nThe ``\'#\'`` option is only valid for integers, and only for binary,\noctal, or hexadecimal output. If present, it specifies that the\noutput will be prefixed by ``\'0b\'``, ``\'0o\'``, or ``\'0x\'``,\nrespectively.\n\nThe ``\',\'`` option signals the use of a comma for a thousands\nseparator. For a locale aware separator, use the ``\'n\'`` integer\npresentation type instead.\n\nChanged in version 2.7: Added the ``\',\'`` option (see also **PEP\n378**).\n\n*width* is a decimal integer defining the minimum field width. If not\nspecified, then the field width will be determined by the content.\n\nPreceding the *width* field by a zero (``\'0\'``) character enables\nsign-aware zero-padding for numeric types. This is equivalent to a\n*fill* character of ``\'0\'`` with an *alignment* type of ``\'=\'``.\n\nThe *precision* is a decimal number indicating how many digits should\nbe displayed after the decimal point for a floating point value\nformatted with ``\'f\'`` and ``\'F\'``, or before and after the decimal\npoint for a floating point value formatted with ``\'g\'`` or ``\'G\'``.\nFor non-number types the field indicates the maximum field size - in\nother words, how many characters will be used from the field content.\nThe *precision* is not allowed for integer values.\n\nFinally, the *type* determines how the data should be presented.\n\nThe available string presentation types are:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | ``\'s\'`` | String format. This is the default type for strings and |\n | | may be omitted. |\n +-----------+------------------------------------------------------------+\n | None | The same as ``\'s\'``. |\n +-----------+------------------------------------------------------------+\n\nThe available integer presentation types are:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | ``\'b\'`` | Binary format. Outputs the number in base 2. |\n +-----------+------------------------------------------------------------+\n | ``\'c\'`` | Character. Converts the integer to the corresponding |\n | | unicode character before printing. |\n +-----------+------------------------------------------------------------+\n | ``\'d\'`` | Decimal Integer. Outputs the number in base 10. |\n +-----------+------------------------------------------------------------+\n | ``\'o\'`` | Octal format. Outputs the number in base 8. |\n +-----------+------------------------------------------------------------+\n | ``\'x\'`` | Hex format. Outputs the number in base 16, using lower- |\n | | case letters for the digits above 9. |\n +-----------+------------------------------------------------------------+\n | ``\'X\'`` | Hex format. Outputs the number in base 16, using upper- |\n | | case letters for the digits above 9. |\n +-----------+------------------------------------------------------------+\n | ``\'n\'`` | Number. 
This is the same as ``\'d\'``, except that it uses |\n | | the current locale setting to insert the appropriate |\n | | number separator characters. |\n +-----------+------------------------------------------------------------+\n | None | The same as ``\'d\'``. |\n +-----------+------------------------------------------------------------+\n\nIn addition to the above presentation types, integers can be formatted\nwith the floating point presentation types listed below (except\n``\'n\'`` and None). When doing so, ``float()`` is used to convert the\ninteger to a floating point number before formatting.\n\nThe available presentation types for floating point and decimal values\nare:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | ``\'e\'`` | Exponent notation. Prints the number in scientific |\n | | notation using the letter \'e\' to indicate the exponent. |\n | | The default precision is ``6``. |\n +-----------+------------------------------------------------------------+\n | ``\'E\'`` | Exponent notation. Same as ``\'e\'`` except it uses an upper |\n | | case \'E\' as the separator character. |\n +-----------+------------------------------------------------------------+\n | ``\'f\'`` | Fixed point. Displays the number as a fixed-point number. |\n | | The default precision is ``6``. |\n +-----------+------------------------------------------------------------+\n | ``\'F\'`` | Fixed point. Same as ``\'f\'``. |\n +-----------+------------------------------------------------------------+\n | ``\'g\'`` | General format. For a given precision ``p >= 1``, this |\n | | rounds the number to ``p`` significant digits and then |\n | | formats the result in either fixed-point format or in |\n | | scientific notation, depending on its magnitude. The |\n | | precise rules are as follows: suppose that the result |\n | | formatted with presentation type ``\'e\'`` and precision |\n | | ``p-1`` would have exponent ``exp``. Then if ``-4 <= exp |\n | | < p``, the number is formatted with presentation type |\n | | ``\'f\'`` and precision ``p-1-exp``. Otherwise, the number |\n | | is formatted with presentation type ``\'e\'`` and precision |\n | | ``p-1``. In both cases insignificant trailing zeros are |\n | | removed from the significand, and the decimal point is |\n | | also removed if there are no remaining digits following |\n | | it. Positive and negative infinity, positive and negative |\n | | zero, and nans, are formatted as ``inf``, ``-inf``, ``0``, |\n | | ``-0`` and ``nan`` respectively, regardless of the |\n | | precision. A precision of ``0`` is treated as equivalent |\n | | to a precision of ``1``. The default precision is ``6``. |\n +-----------+------------------------------------------------------------+\n | ``\'G\'`` | General format. Same as ``\'g\'`` except switches to ``\'E\'`` |\n | | if the number gets too large. The representations of |\n | | infinity and NaN are uppercased, too. |\n +-----------+------------------------------------------------------------+\n | ``\'n\'`` | Number. This is the same as ``\'g\'``, except that it uses |\n | | the current locale setting to insert the appropriate |\n | | number separator characters. |\n +-----------+------------------------------------------------------------+\n | ``\'%\'`` | Percentage. Multiplies the number by 100 and displays in |\n | | fixed (``\'f\'``) format, followed by a percent sign. 
|\n +-----------+------------------------------------------------------------+\n | None | The same as ``\'g\'``. |\n +-----------+------------------------------------------------------------+\n\n\nFormat examples\n===============\n\nThis section contains examples of the new format syntax and comparison\nwith the old ``%``-formatting.\n\nIn most of the cases the syntax is similar to the old\n``%``-formatting, with the addition of the ``{}`` and with ``:`` used\ninstead of ``%``. For example, ``\'%03.2f\'`` can be translated to\n``\'{:03.2f}\'``.\n\nThe new format syntax also supports new and different options, shown\nin the follow examples.\n\nAccessing arguments by position:\n\n >>> \'{0}, {1}, {2}\'.format(\'a\', \'b\', \'c\')\n \'a, b, c\'\n >>> \'{}, {}, {}\'.format(\'a\', \'b\', \'c\') # 2.7+ only\n \'a, b, c\'\n >>> \'{2}, {1}, {0}\'.format(\'a\', \'b\', \'c\')\n \'c, b, a\'\n >>> \'{2}, {1}, {0}\'.format(*\'abc\') # unpacking argument sequence\n \'c, b, a\'\n >>> \'{0}{1}{0}\'.format(\'abra\', \'cad\') # arguments\' indices can be repeated\n \'abracadabra\'\n\nAccessing arguments by name:\n\n >>> \'Coordinates: {latitude}, {longitude}\'.format(latitude=\'37.24N\', longitude=\'-115.81W\')\n \'Coordinates: 37.24N, -115.81W\'\n >>> coord = {\'latitude\': \'37.24N\', \'longitude\': \'-115.81W\'}\n >>> \'Coordinates: {latitude}, {longitude}\'.format(**coord)\n \'Coordinates: 37.24N, -115.81W\'\n\nAccessing arguments\' attributes:\n\n >>> c = 3-5j\n >>> (\'The complex number {0} is formed from the real part {0.real} \'\n ... \'and the imaginary part {0.imag}.\').format(c)\n \'The complex number (3-5j) is formed from the real part 3.0 and the imaginary part -5.0.\'\n >>> class Point(object):\n ... def __init__(self, x, y):\n ... self.x, self.y = x, y\n ... def __str__(self):\n ... 
return \'Point({self.x}, {self.y})\'.format(self=self)\n ...\n >>> str(Point(4, 2))\n \'Point(4, 2)\'\n\nAccessing arguments\' items:\n\n >>> coord = (3, 5)\n >>> \'X: {0[0]}; Y: {0[1]}\'.format(coord)\n \'X: 3; Y: 5\'\n\nReplacing ``%s`` and ``%r``:\n\n >>> "repr() shows quotes: {!r}; str() doesn\'t: {!s}".format(\'test1\', \'test2\')\n "repr() shows quotes: \'test1\'; str() doesn\'t: test2"\n\nAligning the text and specifying a width:\n\n >>> \'{:<30}\'.format(\'left aligned\')\n \'left aligned \'\n >>> \'{:>30}\'.format(\'right aligned\')\n \' right aligned\'\n >>> \'{:^30}\'.format(\'centered\')\n \' centered \'\n >>> \'{:*^30}\'.format(\'centered\') # use \'*\' as a fill char\n \'***********centered***********\'\n\nReplacing ``%+f``, ``%-f``, and ``% f`` and specifying a sign:\n\n >>> \'{:+f}; {:+f}\'.format(3.14, -3.14) # show it always\n \'+3.140000; -3.140000\'\n >>> \'{: f}; {: f}\'.format(3.14, -3.14) # show a space for positive numbers\n \' 3.140000; -3.140000\'\n >>> \'{:-f}; {:-f}\'.format(3.14, -3.14) # show only the minus -- same as \'{:f}; {:f}\'\n \'3.140000; -3.140000\'\n\nReplacing ``%x`` and ``%o`` and converting the value to different\nbases:\n\n >>> # format also supports binary numbers\n >>> "int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}".format(42)\n \'int: 42; hex: 2a; oct: 52; bin: 101010\'\n >>> # with 0x, 0o, or 0b as prefix:\n >>> "int: {0:d}; hex: {0:#x}; oct: {0:#o}; bin: {0:#b}".format(42)\n \'int: 42; hex: 0x2a; oct: 0o52; bin: 0b101010\'\n\nUsing the comma as a thousands separator:\n\n >>> \'{:,}\'.format(1234567890)\n \'1,234,567,890\'\n\nExpressing a percentage:\n\n >>> points = 19.5\n >>> total = 22\n >>> \'Correct answers: {:.2%}\'.format(points/total)\n \'Correct answers: 88.64%\'\n\nUsing type-specific formatting:\n\n >>> import datetime\n >>> d = datetime.datetime(2010, 7, 4, 12, 15, 58)\n >>> \'{:%Y-%m-%d %H:%M:%S}\'.format(d)\n \'2010-07-04 12:15:58\'\n\nNesting arguments and more complex examples:\n\n >>> for align, text in zip(\'<^>\', [\'left\', \'center\', \'right\']):\n ... \'{0:{fill}{align}16}\'.format(text, fill=align, align=align)\n ...\n \'left<<<<<<<<<<<<\'\n \'^^^^^center^^^^^\'\n \'>>>>>>>>>>>right\'\n >>>\n >>> octets = [192, 168, 0, 1]\n >>> \'{:02X}{:02X}{:02X}{:02X}\'.format(*octets)\n \'C0A80001\'\n >>> int(_, 16)\n 3232235521\n >>>\n >>> width = 5\n >>> for num in range(5,12):\n ... for base in \'dXob\':\n ... print \'{0:{width}{base}}\'.format(num, base=base, width=width),\n ... print\n ...\n 5 5 5 101\n 6 6 6 110\n 7 7 7 111\n 8 8 10 1000\n 9 9 11 1001\n 10 A 12 1010\n 11 B 13 1011\n', - 'function': '\nFunction definitions\n********************\n\nA function definition defines a user-defined function object (see\nsection *The standard type hierarchy*):\n\n decorated ::= decorators (classdef | funcdef)\n decorators ::= decorator+\n decorator ::= "@" dotted_name ["(" [argument_list [","]] ")"] NEWLINE\n funcdef ::= "def" funcname "(" [parameter_list] ")" ":" suite\n dotted_name ::= identifier ("." identifier)*\n parameter_list ::= (defparameter ",")*\n ( "*" identifier ["," "**" identifier]\n | "**" identifier\n | defparameter [","] )\n defparameter ::= parameter ["=" expression]\n sublist ::= parameter ("," parameter)* [","]\n parameter ::= identifier | "(" sublist ")"\n funcname ::= identifier\n\nA function definition is an executable statement. Its execution binds\nthe function name in the current local namespace to a function object\n(a wrapper around the executable code for the function). 
This\nfunction object contains a reference to the current global namespace\nas the global namespace to be used when the function is called.\n\nThe function definition does not execute the function body; this gets\nexecuted only when the function is called. [3]\n\nA function definition may be wrapped by one or more *decorator*\nexpressions. Decorator expressions are evaluated when the function is\ndefined, in the scope that contains the function definition. The\nresult must be a callable, which is invoked with the function object\nas the only argument. The returned value is bound to the function name\ninstead of the function object. Multiple decorators are applied in\nnested fashion. For example, the following code:\n\n @f1(arg)\n @f2\n def func(): pass\n\nis equivalent to:\n\n def func(): pass\n func = f1(arg)(f2(func))\n\nWhen one or more top-level *parameters* have the form *parameter*\n``=`` *expression*, the function is said to have "default parameter\nvalues." For a parameter with a default value, the corresponding\n*argument* may be omitted from a call, in which case the parameter\'s\ndefault value is substituted. If a parameter has a default value, all\nfollowing parameters must also have a default value --- this is a\nsyntactic restriction that is not expressed by the grammar.\n\n**Default parameter values are evaluated when the function definition\nis executed.** This means that the expression is evaluated once, when\nthe function is defined, and that the same "pre-computed" value is\nused for each call. This is especially important to understand when a\ndefault parameter is a mutable object, such as a list or a dictionary:\nif the function modifies the object (e.g. by appending an item to a\nlist), the default value is in effect modified. This is generally not\nwhat was intended. A way around this is to use ``None`` as the\ndefault, and explicitly test for it in the body of the function, e.g.:\n\n def whats_on_the_telly(penguin=None):\n if penguin is None:\n penguin = []\n penguin.append("property of the zoo")\n return penguin\n\nFunction call semantics are described in more detail in section\n*Calls*. A function call always assigns values to all parameters\nmentioned in the parameter list, either from position arguments, from\nkeyword arguments, or from default values. If the form\n"``*identifier``" is present, it is initialized to a tuple receiving\nany excess positional parameters, defaulting to the empty tuple. If\nthe form "``**identifier``" is present, it is initialized to a new\ndictionary receiving any excess keyword arguments, defaulting to a new\nempty dictionary.\n\nIt is also possible to create anonymous functions (functions not bound\nto a name), for immediate use in expressions. This uses lambda\nexpressions, described in section *Lambdas*. Note that the lambda\nexpression is merely a shorthand for a simplified function definition;\na function defined in a "``def``" statement can be passed around or\nassigned to another name just like a function defined by a lambda\nexpression. The "``def``" form is actually more powerful since it\nallows the execution of multiple statements.\n\n**Programmer\'s note:** Functions are first-class objects. A "``def``"\nform executed inside a function definition defines a local function\nthat can be returned or passed around. Free variables used in the\nnested function can access the local variables of the function\ncontaining the def. 
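As a brief illustrative sketch of the excess-argument forms described above (``report`` is a made-up name, not part of the language):

   >>> def report(first, *rest, **options):
   ...     return first, rest, options
   ...
   >>> report(1, 2, 3, verbose=True)
   (1, (2, 3), {'verbose': True})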
See section *Naming and binding* for details.\n', - 'global': '\nThe ``global`` statement\n************************\n\n global_stmt ::= "global" identifier ("," identifier)*\n\nThe ``global`` statement is a declaration which holds for the entire\ncurrent code block. It means that the listed identifiers are to be\ninterpreted as globals. It would be impossible to assign to a global\nvariable without ``global``, although free variables may refer to\nglobals without being declared global.\n\nNames listed in a ``global`` statement must not be used in the same\ncode block textually preceding that ``global`` statement.\n\nNames listed in a ``global`` statement must not be defined as formal\nparameters or in a ``for`` loop control target, ``class`` definition,\nfunction definition, or ``import`` statement.\n\n**CPython implementation detail:** The current implementation does not\nenforce the latter two restrictions, but programs should not abuse\nthis freedom, as future implementations may enforce them or silently\nchange the meaning of the program.\n\n**Programmer\'s note:** the ``global`` is a directive to the parser.\nIt applies only to code parsed at the same time as the ``global``\nstatement. In particular, a ``global`` statement contained in an\n``exec`` statement does not affect the code block *containing* the\n``exec`` statement, and code contained in an ``exec`` statement is\nunaffected by ``global`` statements in the code containing the\n``exec`` statement. The same applies to the ``eval()``,\n``execfile()`` and ``compile()`` functions.\n', - 'id-classes': '\nReserved classes of identifiers\n*******************************\n\nCertain classes of identifiers (besides keywords) have special\nmeanings. These classes are identified by the patterns of leading and\ntrailing underscore characters:\n\n``_*``\n Not imported by ``from module import *``. The special identifier\n ``_`` is used in the interactive interpreter to store the result of\n the last evaluation; it is stored in the ``__builtin__`` module.\n When not in interactive mode, ``_`` has no special meaning and is\n not defined. See section *The import statement*.\n\n Note: The name ``_`` is often used in conjunction with\n internationalization; refer to the documentation for the\n ``gettext`` module for more information on this convention.\n\n``__*__``\n System-defined names. These names are defined by the interpreter\n and its implementation (including the standard library). Current\n system names are discussed in the *Special method names* section\n and elsewhere. More will likely be defined in future versions of\n Python. *Any* use of ``__*__`` names, in any context, that does\n not follow explicitly documented use, is subject to breakage\n without warning.\n\n``__*``\n Class-private names. Names in this category, when used within the\n context of a class definition, are re-written to use a mangled form\n to help avoid name clashes between "private" attributes of base and\n derived classes. See section *Identifiers (Names)*.\n', - 'identifiers': '\nIdentifiers and keywords\n************************\n\nIdentifiers (also referred to as *names*) are described by the\nfollowing lexical definitions:\n\n identifier ::= (letter|"_") (letter | digit | "_")*\n letter ::= lowercase | uppercase\n lowercase ::= "a"..."z"\n uppercase ::= "A"..."Z"\n digit ::= "0"..."9"\n\nIdentifiers are unlimited in length. 
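As an aside, the ``global`` statement described earlier can be sketched interactively as follows (``counter`` and ``bump`` are illustrative names only):

   >>> counter = 0
   >>> def bump():
   ...     global counter
   ...     counter = counter + 1
   ...
   >>> bump(); bump()
   >>> counter
   2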
Case is significant.\n\n\nKeywords\n========\n\nThe following identifiers are used as reserved words, or *keywords* of\nthe language, and cannot be used as ordinary identifiers. They must\nbe spelled exactly as written here:\n\n and del from not while\n as elif global or with\n assert else if pass yield\n break except import print\n class exec in raise\n continue finally is return\n def for lambda try\n\nChanged in version 2.4: ``None`` became a constant and is now\nrecognized by the compiler as a name for the built-in object ``None``.\nAlthough it is not a keyword, you cannot assign a different object to\nit.\n\nChanged in version 2.5: Using ``as`` and ``with`` as identifiers\ntriggers a warning. To use them as keywords, enable the\n``with_statement`` future feature .\n\nChanged in version 2.6: ``as`` and ``with`` are full keywords.\n\n\nReserved classes of identifiers\n===============================\n\nCertain classes of identifiers (besides keywords) have special\nmeanings. These classes are identified by the patterns of leading and\ntrailing underscore characters:\n\n``_*``\n Not imported by ``from module import *``. The special identifier\n ``_`` is used in the interactive interpreter to store the result of\n the last evaluation; it is stored in the ``__builtin__`` module.\n When not in interactive mode, ``_`` has no special meaning and is\n not defined. See section *The import statement*.\n\n Note: The name ``_`` is often used in conjunction with\n internationalization; refer to the documentation for the\n ``gettext`` module for more information on this convention.\n\n``__*__``\n System-defined names. These names are defined by the interpreter\n and its implementation (including the standard library). Current\n system names are discussed in the *Special method names* section\n and elsewhere. More will likely be defined in future versions of\n Python. *Any* use of ``__*__`` names, in any context, that does\n not follow explicitly documented use, is subject to breakage\n without warning.\n\n``__*``\n Class-private names. Names in this category, when used within the\n context of a class definition, are re-written to use a mangled form\n to help avoid name clashes between "private" attributes of base and\n derived classes. See section *Identifiers (Names)*.\n', - 'if': '\nThe ``if`` statement\n********************\n\nThe ``if`` statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the ``if`` statement is executed or evaluated).\nIf all expressions are false, the suite of the ``else`` clause, if\npresent, is executed.\n', - 'imaginary': '\nImaginary literals\n******************\n\nImaginary literals are described by the following lexical definitions:\n\n imagnumber ::= (floatnumber | intpart) ("j" | "J")\n\nAn imaginary literal yields a complex number with a real part of 0.0.\nComplex numbers are represented as a pair of floating point numbers\nand have the same restrictions on their range. To create a complex\nnumber with a nonzero real part, add a floating point number to it,\ne.g., ``(3+4j)``. 
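For instance, a short interactive sketch of forming a complex value this way and inspecting it:

   >>> z = 3 + 4j
   >>> z.real, z.imag
   (3.0, 4.0)
   >>> abs(z)
   5.0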
Some examples of imaginary literals:\n\n 3.14j 10.j 10j .001j 1e100j 3.14e-10j\n', - 'import': '\nThe ``import`` statement\n************************\n\n import_stmt ::= "import" module ["as" name] ( "," module ["as" name] )*\n | "from" relative_module "import" identifier ["as" name]\n ( "," identifier ["as" name] )*\n | "from" relative_module "import" "(" identifier ["as" name]\n ( "," identifier ["as" name] )* [","] ")"\n | "from" module "import" "*"\n module ::= (identifier ".")* identifier\n relative_module ::= "."* module | "."+\n name ::= identifier\n\nImport statements are executed in two steps: (1) find a module, and\ninitialize it if necessary; (2) define a name or names in the local\nnamespace (of the scope where the ``import`` statement occurs). The\nstatement comes in two forms differing on whether it uses the ``from``\nkeyword. The first form (without ``from``) repeats these steps for\neach identifier in the list. The form with ``from`` performs step (1)\nonce, and then performs step (2) repeatedly.\n\nTo understand how step (1) occurs, one must first understand how\nPython handles hierarchical naming of modules. To help organize\nmodules and provide a hierarchy in naming, Python has a concept of\npackages. A package can contain other packages and modules while\nmodules cannot contain other modules or packages. From a file system\nperspective, packages are directories and modules are files. The\noriginal specification for packages is still available to read,\nalthough minor details have changed since the writing of that\ndocument.\n\nOnce the name of the module is known (unless otherwise specified, the\nterm "module" will refer to both packages and modules), searching for\nthe module or package can begin. The first place checked is\n``sys.modules``, the cache of all modules that have been imported\npreviously. If the module is found there then it is used in step (2)\nof import.\n\nIf the module is not found in the cache, then ``sys.meta_path`` is\nsearched (the specification for ``sys.meta_path`` can be found in\n**PEP 302**). The object is a list of *finder* objects which are\nqueried in order as to whether they know how to load the module by\ncalling their ``find_module()`` method with the name of the module. If\nthe module happens to be contained within a package (as denoted by the\nexistence of a dot in the name), then a second argument to\n``find_module()`` is given as the value of the ``__path__`` attribute\nfrom the parent package (everything up to the last dot in the name of\nthe module being imported). If a finder can find the module it returns\na *loader* (discussed later) or returns ``None``.\n\nIf none of the finders on ``sys.meta_path`` are able to find the\nmodule then some implicitly defined finders are queried.\nImplementations of Python vary in what implicit meta path finders are\ndefined. The one they all do define, though, is one that handles\n``sys.path_hooks``, ``sys.path_importer_cache``, and ``sys.path``.\n\nThe implicit finder searches for the requested module in the "paths"\nspecified in one of two places ("paths" do not have to be file system\npaths). If the module being imported is supposed to be contained\nwithin a package then the second argument passed to ``find_module()``,\n``__path__`` on the parent package, is used as the source of paths. If\nthe module is not contained in a package then ``sys.path`` is used as\nthe source of paths.\n\nOnce the source of paths is chosen it is iterated over to find a\nfinder that can handle that path. 
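A minimal sketch of the ``sys.meta_path`` finder protocol described above; ``NoisyFinder`` is a hypothetical class, and returning ``None`` from ``find_module()`` simply defers to the rest of the import machinery:

   import sys

   class NoisyFinder(object):
       """Hypothetical PEP 302 finder: report each lookup, load nothing."""
       def find_module(self, fullname, path=None):
           sys.stderr.write('import machinery asked about %r\n' % fullname)
           return None    # None means "keep searching with the other finders"

   sys.meta_path.insert(0, NoisyFinder())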
The dict at\n``sys.path_importer_cache`` caches finders for paths and is checked\nfor a finder. If the path does not have a finder cached then\n``sys.path_hooks`` is searched by calling each object in the list with\na single argument of the path, returning a finder or raises\n``ImportError``. If a finder is returned then it is cached in\n``sys.path_importer_cache`` and then used for that path entry. If no\nfinder can be found but the path exists then a value of ``None`` is\nstored in ``sys.path_importer_cache`` to signify that an implicit,\nfile-based finder that handles modules stored as individual files\nshould be used for that path. If the path does not exist then a finder\nwhich always returns ``None`` is placed in the cache for the path.\n\nIf no finder can find the module then ``ImportError`` is raised.\nOtherwise some finder returned a loader whose ``load_module()`` method\nis called with the name of the module to load (see **PEP 302** for the\noriginal definition of loaders). A loader has several responsibilities\nto perform on a module it loads. First, if the module already exists\nin ``sys.modules`` (a possibility if the loader is called outside of\nthe import machinery) then it is to use that module for initialization\nand not a new module. But if the module does not exist in\n``sys.modules`` then it is to be added to that dict before\ninitialization begins. If an error occurs during loading of the module\nand it was added to ``sys.modules`` it is to be removed from the dict.\nIf an error occurs but the module was already in ``sys.modules`` it is\nleft in the dict.\n\nThe loader must set several attributes on the module. ``__name__`` is\nto be set to the name of the module. ``__file__`` is to be the "path"\nto the file unless the module is built-in (and thus listed in\n``sys.builtin_module_names``) in which case the attribute is not set.\nIf what is being imported is a package then ``__path__`` is to be set\nto a list of paths to be searched when looking for modules and\npackages contained within the package being imported. ``__package__``\nis optional but should be set to the name of package that contains the\nmodule or package (the empty string is used for module not contained\nin a package). ``__loader__`` is also optional but should be set to\nthe loader object that is loading the module.\n\nIf an error occurs during loading then the loader raises\n``ImportError`` if some other exception is not already being\npropagated. Otherwise the loader returns the module that was loaded\nand initialized.\n\nWhen step (1) finishes without raising an exception, step (2) can\nbegin.\n\nThe first form of ``import`` statement binds the module name in the\nlocal namespace to the module object, and then goes on to import the\nnext identifier, if any. If the module name is followed by ``as``,\nthe name following ``as`` is used as the local name for the module.\n\nThe ``from`` form does not bind the module name: it goes through the\nlist of identifiers, looks each one of them up in the module found in\nstep (1), and binds the name in the local namespace to the object thus\nfound. As with the first form of ``import``, an alternate local name\ncan be supplied by specifying "``as`` localname". If a name is not\nfound, ``ImportError`` is raised. 
If the list of identifiers is\nreplaced by a star (``\'*\'``), all public names defined in the module\nare bound in the local namespace of the ``import`` statement..\n\nThe *public names* defined by a module are determined by checking the\nmodule\'s namespace for a variable named ``__all__``; if defined, it\nmust be a sequence of strings which are names defined or imported by\nthat module. The names given in ``__all__`` are all considered public\nand are required to exist. If ``__all__`` is not defined, the set of\npublic names includes all names found in the module\'s namespace which\ndo not begin with an underscore character (``\'_\'``). ``__all__``\nshould contain the entire public API. It is intended to avoid\naccidentally exporting items that are not part of the API (such as\nlibrary modules which were imported and used within the module).\n\nThe ``from`` form with ``*`` may only occur in a module scope. If the\nwild card form of import --- ``import *`` --- is used in a function\nand the function contains or is a nested block with free variables,\nthe compiler will raise a ``SyntaxError``.\n\nWhen specifying what module to import you do not have to specify the\nabsolute name of the module. When a module or package is contained\nwithin another package it is possible to make a relative import within\nthe same top package without having to mention the package name. By\nusing leading dots in the specified module or package after ``from``\nyou can specify how high to traverse up the current package hierarchy\nwithout specifying exact names. One leading dot means the current\npackage where the module making the import exists. Two dots means up\none package level. Three dots is up two levels, etc. So if you execute\n``from . import mod`` from a module in the ``pkg`` package then you\nwill end up importing ``pkg.mod``. If you execute ``from ..subpkg2\nimport mod`` from within ``pkg.subpkg1`` you will import\n``pkg.subpkg2.mod``. The specification for relative imports is\ncontained within **PEP 328**.\n\n``importlib.import_module()`` is provided to support applications that\ndetermine which modules need to be loaded dynamically.\n\n\nFuture statements\n=================\n\nA *future statement* is a directive to the compiler that a particular\nmodule should be compiled using syntax or semantics that will be\navailable in a specified future release of Python. The future\nstatement is intended to ease migration to future versions of Python\nthat introduce incompatible changes to the language. It allows use of\nthe new features on a per-module basis before the release in which the\nfeature becomes standard.\n\n future_statement ::= "from" "__future__" "import" feature ["as" name]\n ("," feature ["as" name])*\n | "from" "__future__" "import" "(" feature ["as" name]\n ("," feature ["as" name])* [","] ")"\n feature ::= identifier\n name ::= identifier\n\nA future statement must appear near the top of the module. The only\nlines that can appear before a future statement are:\n\n* the module docstring (if any),\n\n* comments,\n\n* blank lines, and\n\n* other future statements.\n\nThe features recognized by Python 2.6 are ``unicode_literals``,\n``print_function``, ``absolute_import``, ``division``, ``generators``,\n``nested_scopes`` and ``with_statement``. 
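For example, enabling the ``division`` feature listed above changes the meaning of ``/`` for the rest of an interactive session (a brief sketch):

   >>> from __future__ import division
   >>> 1 / 2
   0.5
   >>> 1 // 2
   0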
``generators``,\n``with_statement``, ``nested_scopes`` are redundant in Python version\n2.6 and above because they are always enabled.\n\nA future statement is recognized and treated specially at compile\ntime: Changes to the semantics of core constructs are often\nimplemented by generating different code. It may even be the case\nthat a new feature introduces new incompatible syntax (such as a new\nreserved word), in which case the compiler may need to parse the\nmodule differently. Such decisions cannot be pushed off until\nruntime.\n\nFor any given release, the compiler knows which feature names have\nbeen defined, and raises a compile-time error if a future statement\ncontains a feature not known to it.\n\nThe direct runtime semantics are the same as for any import statement:\nthere is a standard module ``__future__``, described later, and it\nwill be imported in the usual way at the time the future statement is\nexecuted.\n\nThe interesting runtime semantics depend on the specific feature\nenabled by the future statement.\n\nNote that there is nothing special about the statement:\n\n import __future__ [as name]\n\nThat is not a future statement; it\'s an ordinary import statement with\nno special semantics or syntax restrictions.\n\nCode compiled by an ``exec`` statement or calls to the built-in\nfunctions ``compile()`` and ``execfile()`` that occur in a module\n``M`` containing a future statement will, by default, use the new\nsyntax or semantics associated with the future statement. This can,\nstarting with Python 2.2 be controlled by optional arguments to\n``compile()`` --- see the documentation of that function for details.\n\nA future statement typed at an interactive interpreter prompt will\ntake effect for the rest of the interpreter session. If an\ninterpreter is started with the *-i* option, is passed a script name\nto execute, and the script includes a future statement, it will be in\neffect in the interactive session started after the script is\nexecuted.\n\nSee also:\n\n **PEP 236** - Back to the __future__\n The original proposal for the __future__ mechanism.\n', - 'in': '\nComparisons\n***********\n\nUnlike C, all comparison operations in Python have the same priority,\nwhich is lower than that of any arithmetic, shifting or bitwise\noperation. Also unlike C, expressions like ``a < b < c`` have the\ninterpretation that is conventional in mathematics:\n\n comparison ::= or_expr ( comp_operator or_expr )*\n comp_operator ::= "<" | ">" | "==" | ">=" | "<=" | "<>" | "!="\n | "is" ["not"] | ["not"] "in"\n\nComparisons yield boolean values: ``True`` or ``False``.\n\nComparisons can be chained arbitrarily, e.g., ``x < y <= z`` is\nequivalent to ``x < y and y <= z``, except that ``y`` is evaluated\nonly once (but in both cases ``z`` is not evaluated at all when ``x <\ny`` is found to be false).\n\nFormally, if *a*, *b*, *c*, ..., *y*, *z* are expressions and *op1*,\n*op2*, ..., *opN* are comparison operators, then ``a op1 b op2 c ... y\nopN z`` is equivalent to ``a op1 b and b op2 c and ... y opN z``,\nexcept that each expression is evaluated at most once.\n\nNote that ``a op1 b op2 c`` doesn\'t imply any kind of comparison\nbetween *a* and *c*, so that, e.g., ``x < y > z`` is perfectly legal\n(though perhaps not pretty).\n\nThe forms ``<>`` and ``!=`` are equivalent; for consistency with C,\n``!=`` is preferred; where ``!=`` is mentioned below ``<>`` is also\naccepted. 
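A couple of interactive examples of the chaining behaviour described above:

   >>> x = 5
   >>> 1 < x < 10          # same as (1 < x) and (x < 10), with x evaluated once
   True
   >>> 1 < x > 10          # legal, though perhaps not pretty
   False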
The ``<>`` spelling is considered obsolescent.\n\nThe operators ``<``, ``>``, ``==``, ``>=``, ``<=``, and ``!=`` compare\nthe values of two objects. The objects need not have the same type.\nIf both are numbers, they are converted to a common type. Otherwise,\nobjects of different types *always* compare unequal, and are ordered\nconsistently but arbitrarily. You can control comparison behavior of\nobjects of non-built-in types by defining a ``__cmp__`` method or rich\ncomparison methods like ``__gt__``, described in section *Special\nmethod names*.\n\n(This unusual definition of comparison was used to simplify the\ndefinition of operations like sorting and the ``in`` and ``not in``\noperators. In the future, the comparison rules for objects of\ndifferent types are likely to change.)\n\nComparison of objects of the same type depends on the type:\n\n* Numbers are compared arithmetically.\n\n* Strings are compared lexicographically using the numeric equivalents\n (the result of the built-in function ``ord()``) of their characters.\n Unicode and 8-bit strings are fully interoperable in this behavior.\n [4]\n\n* Tuples and lists are compared lexicographically using comparison of\n corresponding elements. This means that to compare equal, each\n element must compare equal and the two sequences must be of the same\n type and have the same length.\n\n If not equal, the sequences are ordered the same as their first\n differing elements. For example, ``cmp([1,2,x], [1,2,y])`` returns\n the same as ``cmp(x,y)``. If the corresponding element does not\n exist, the shorter sequence is ordered first (for example, ``[1,2] <\n [1,2,3]``).\n\n* Mappings (dictionaries) compare equal if and only if their sorted\n (key, value) lists compare equal. [5] Outcomes other than equality\n are resolved consistently, but are not otherwise defined. [6]\n\n* Most other objects of built-in types compare unequal unless they are\n the same object; the choice whether one object is considered smaller\n or larger than another one is made arbitrarily but consistently\n within one execution of a program.\n\nThe operators ``in`` and ``not in`` test for collection membership.\n``x in s`` evaluates to true if *x* is a member of the collection *s*,\nand false otherwise. ``x not in s`` returns the negation of ``x in\ns``. The collection membership test has traditionally been bound to\nsequences; an object is a member of a collection if the collection is\na sequence and contains an element equal to that object. However, it\nmake sense for many other object types to support membership tests\nwithout being a sequence. In particular, dictionaries (for keys) and\nsets support membership testing.\n\nFor the list and tuple types, ``x in y`` is true if and only if there\nexists an index *i* such that ``x == y[i]`` is true.\n\nFor the Unicode and string types, ``x in y`` is true if and only if\n*x* is a substring of *y*. An equivalent test is ``y.find(x) != -1``.\nNote, *x* and *y* need not be the same type; consequently, ``u\'ab\' in\n\'abc\'`` will return ``True``. 
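A few membership tests of the kinds just described:

   >>> 'ab' in 'abc'
   True
   >>> u'ab' in 'abc'                    # unicode and str interoperate here
   True
   >>> 3 in [1, 2, 3]
   True
   >>> 'spam' in {'spam': 1, 'eggs': 2}  # dictionaries test their keys
   True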
Empty strings are always considered to\nbe a substring of any other string, so ``"" in "abc"`` will return\n``True``.\n\nChanged in version 2.3: Previously, *x* was required to be a string of\nlength ``1``.\n\nFor user-defined classes which define the ``__contains__()`` method,\n``x in y`` is true if and only if ``y.__contains__(x)`` is true.\n\nFor user-defined classes which do not define ``__contains__()`` but do\ndefine ``__iter__()``, ``x in y`` is true if some value ``z`` with ``x\n== z`` is produced while iterating over ``y``. If an exception is\nraised during the iteration, it is as if ``in`` raised that exception.\n\nLastly, the old-style iteration protocol is tried: if a class defines\n``__getitem__()``, ``x in y`` is true if and only if there is a non-\nnegative integer index *i* such that ``x == y[i]``, and all lower\ninteger indices do not raise ``IndexError`` exception. (If any other\nexception is raised, it is as if ``in`` raised that exception).\n\nThe operator ``not in`` is defined to have the inverse true value of\n``in``.\n\nThe operators ``is`` and ``is not`` test for object identity: ``x is\ny`` is true if and only if *x* and *y* are the same object. ``x is\nnot y`` yields the inverse truth value. [7]\n', - 'integers': '\nInteger and long integer literals\n*********************************\n\nInteger and long integer literals are described by the following\nlexical definitions:\n\n longinteger ::= integer ("l" | "L")\n integer ::= decimalinteger | octinteger | hexinteger | bininteger\n decimalinteger ::= nonzerodigit digit* | "0"\n octinteger ::= "0" ("o" | "O") octdigit+ | "0" octdigit+\n hexinteger ::= "0" ("x" | "X") hexdigit+\n bininteger ::= "0" ("b" | "B") bindigit+\n nonzerodigit ::= "1"..."9"\n octdigit ::= "0"..."7"\n bindigit ::= "0" | "1"\n hexdigit ::= digit | "a"..."f" | "A"..."F"\n\nAlthough both lower case ``\'l\'`` and upper case ``\'L\'`` are allowed as\nsuffix for long integers, it is strongly recommended to always use\n``\'L\'``, since the letter ``\'l\'`` looks too much like the digit\n``\'1\'``.\n\nPlain integer literals that are above the largest representable plain\ninteger (e.g., 2147483647 when using 32-bit arithmetic) are accepted\nas if they were long integers instead. [1] There is no limit for long\ninteger literals apart from what can be stored in available memory.\n\nSome examples of plain integer literals (first row) and long integer\nliterals (second and third rows):\n\n 7 2147483647 0177\n 3L 79228162514264337593543950336L 0377L 0x100000000L\n 79228162514264337593543950336 0xdeadbeef\n', - 'lambda': '\nLambdas\n*******\n\n lambda_expr ::= "lambda" [parameter_list]: expression\n old_lambda_expr ::= "lambda" [parameter_list]: old_expression\n\nLambda expressions (sometimes called lambda forms) have the same\nsyntactic position as expressions. They are a shorthand to create\nanonymous functions; the expression ``lambda arguments: expression``\nyields a function object. 
The unnamed object behaves like a function\nobject defined with\n\n def name(arguments):\n return expression\n\nSee section *Function definitions* for the syntax of parameter lists.\nNote that functions created with lambda expressions cannot contain\nstatements.\n', - 'lists': '\nList displays\n*************\n\nA list display is a possibly empty series of expressions enclosed in\nsquare brackets:\n\n list_display ::= "[" [expression_list | list_comprehension] "]"\n list_comprehension ::= expression list_for\n list_for ::= "for" target_list "in" old_expression_list [list_iter]\n old_expression_list ::= old_expression [("," old_expression)+ [","]]\n old_expression ::= or_test | old_lambda_expr\n list_iter ::= list_for | list_if\n list_if ::= "if" old_expression [list_iter]\n\nA list display yields a new list object. Its contents are specified\nby providing either a list of expressions or a list comprehension.\nWhen a comma-separated list of expressions is supplied, its elements\nare evaluated from left to right and placed into the list object in\nthat order. When a list comprehension is supplied, it consists of a\nsingle expression followed by at least one ``for`` clause and zero or\nmore ``for`` or ``if`` clauses. In this case, the elements of the new\nlist are those that would be produced by considering each of the\n``for`` or ``if`` clauses a block, nesting from left to right, and\nevaluating the expression to produce a list element each time the\ninnermost block is reached [1].\n', - 'naming': "\nNaming and binding\n******************\n\n*Names* refer to objects. Names are introduced by name binding\noperations. Each occurrence of a name in the program text refers to\nthe *binding* of that name established in the innermost function block\ncontaining the use.\n\nA *block* is a piece of Python program text that is executed as a\nunit. The following are blocks: a module, a function body, and a class\ndefinition. Each command typed interactively is a block. A script\nfile (a file given as standard input to the interpreter or specified\non the interpreter command line the first argument) is a code block.\nA script command (a command specified on the interpreter command line\nwith the '**-c**' option) is a code block. The file read by the\nbuilt-in function ``execfile()`` is a code block. The string argument\npassed to the built-in function ``eval()`` and to the ``exec``\nstatement is a code block. The expression read and evaluated by the\nbuilt-in function ``input()`` is a code block.\n\nA code block is executed in an *execution frame*. A frame contains\nsome administrative information (used for debugging) and determines\nwhere and how execution continues after the code block's execution has\ncompleted.\n\nA *scope* defines the visibility of a name within a block. If a local\nvariable is defined in a block, its scope includes that block. If the\ndefinition occurs in a function block, the scope extends to any blocks\ncontained within the defining one, unless a contained block introduces\na different binding for the name. The scope of names defined in a\nclass block is limited to the class block; it does not extend to the\ncode blocks of methods -- this includes generator expressions since\nthey are implemented using a function scope. This means that the\nfollowing will fail:\n\n class A:\n a = 42\n b = list(a + i for i in range(10))\n\nWhen a name is used in a code block, it is resolved using the nearest\nenclosing scope. 
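As an aside, the list comprehension form described above can be sketched as follows:

   >>> [x*x for x in range(10) if x % 2 == 0]
   [0, 4, 16, 36, 64]
   >>> [(x, y) for x in [1, 2] for y in 'ab']
   [(1, 'a'), (1, 'b'), (2, 'a'), (2, 'b')]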
The set of all such scopes visible to a code block\nis called the block's *environment*.\n\nIf a name is bound in a block, it is a local variable of that block.\nIf a name is bound at the module level, it is a global variable. (The\nvariables of the module code block are local and global.) If a\nvariable is used in a code block but not defined there, it is a *free\nvariable*.\n\nWhen a name is not found at all, a ``NameError`` exception is raised.\nIf the name refers to a local variable that has not been bound, a\n``UnboundLocalError`` exception is raised. ``UnboundLocalError`` is a\nsubclass of ``NameError``.\n\nThe following constructs bind names: formal parameters to functions,\n``import`` statements, class and function definitions (these bind the\nclass or function name in the defining block), and targets that are\nidentifiers if occurring in an assignment, ``for`` loop header, in the\nsecond position of an ``except`` clause header or after ``as`` in a\n``with`` statement. The ``import`` statement of the form ``from ...\nimport *`` binds all names defined in the imported module, except\nthose beginning with an underscore. This form may only be used at the\nmodule level.\n\nA target occurring in a ``del`` statement is also considered bound for\nthis purpose (though the actual semantics are to unbind the name). It\nis illegal to unbind a name that is referenced by an enclosing scope;\nthe compiler will report a ``SyntaxError``.\n\nEach assignment or import statement occurs within a block defined by a\nclass or function definition or at the module level (the top-level\ncode block).\n\nIf a name binding operation occurs anywhere within a code block, all\nuses of the name within the block are treated as references to the\ncurrent block. This can lead to errors when a name is used within a\nblock before it is bound. This rule is subtle. Python lacks\ndeclarations and allows name binding operations to occur anywhere\nwithin a code block. The local variables of a code block can be\ndetermined by scanning the entire text of the block for name binding\noperations.\n\nIf the global statement occurs within a block, all uses of the name\nspecified in the statement refer to the binding of that name in the\ntop-level namespace. Names are resolved in the top-level namespace by\nsearching the global namespace, i.e. the namespace of the module\ncontaining the code block, and the builtins namespace, the namespace\nof the module ``__builtin__``. The global namespace is searched\nfirst. If the name is not found there, the builtins namespace is\nsearched. The global statement must precede all uses of the name.\n\nThe builtins namespace associated with the execution of a code block\nis actually found by looking up the name ``__builtins__`` in its\nglobal namespace; this should be a dictionary or a module (in the\nlatter case the module's dictionary is used). By default, when in the\n``__main__`` module, ``__builtins__`` is the built-in module\n``__builtin__`` (note: no 's'); when in any other module,\n``__builtins__`` is an alias for the dictionary of the ``__builtin__``\nmodule itself. ``__builtins__`` can be set to a user-created\ndictionary to create a weak form of restricted execution.\n\n**CPython implementation detail:** Users should not touch\n``__builtins__``; it is strictly an implementation detail. 
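As an aside, the rule above that a name bound anywhere in a block is local throughout that block can be seen interactively (a hypothetical sketch; the traceback is abbreviated):

   >>> def f():
   ...     print x       # x is bound later in this block, so it is local here
   ...     x = 1
   ...
   >>> f()
   Traceback (most recent call last):
     ...
   UnboundLocalError: local variable 'x' referenced before assignment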
Users\nwanting to override values in the builtins namespace should ``import``\nthe ``__builtin__`` (no 's') module and modify its attributes\nappropriately.\n\nThe namespace for a module is automatically created the first time a\nmodule is imported. The main module for a script is always called\n``__main__``.\n\nThe ``global`` statement has the same scope as a name binding\noperation in the same block. If the nearest enclosing scope for a\nfree variable contains a global statement, the free variable is\ntreated as a global.\n\nA class definition is an executable statement that may use and define\nnames. These references follow the normal rules for name resolution.\nThe namespace of the class definition becomes the attribute dictionary\nof the class. Names defined at the class scope are not visible in\nmethods.\n\n\nInteraction with dynamic features\n=================================\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. An error will be reported at compile time.\n\nIf the wild card form of import --- ``import *`` --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a ``SyntaxError``.\n\nIf ``exec`` is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n``SyntaxError`` unless the exec explicitly specifies the local\nnamespace for the ``exec``. (In other words, ``exec obj`` would be\nillegal, but ``exec obj in ns`` would be legal.)\n\nThe ``eval()``, ``execfile()``, and ``input()`` functions and the\n``exec`` statement do not have access to the full environment for\nresolving names. Names may be resolved in the local and global\nnamespaces of the caller. Free variables are not resolved in the\nnearest enclosing namespace, but in the global namespace. [1] The\n``exec`` statement and the ``eval()`` and ``execfile()`` functions\nhave optional arguments to override the global and local namespace.\nIf only one namespace is specified, it is used for both.\n", - 'numbers': "\nNumeric literals\n****************\n\nThere are four types of numeric literals: plain integers, long\nintegers, floating point numbers, and imaginary numbers. There are no\ncomplex literals (complex numbers can be formed by adding a real\nnumber and an imaginary number).\n\nNote that numeric literals do not include a sign; a phrase like ``-1``\nis actually an expression composed of the unary operator '``-``' and\nthe literal ``1``.\n", - 'numeric-types': '\nEmulating numeric types\n***********************\n\nThe following methods can be defined to emulate numeric objects.\nMethods corresponding to operations that are not supported by the\nparticular kind of number implemented (e.g., bitwise operations for\nnon-integral numbers) should be left undefined.\n\nobject.__add__(self, other)\nobject.__sub__(self, other)\nobject.__mul__(self, other)\nobject.__floordiv__(self, other)\nobject.__mod__(self, other)\nobject.__divmod__(self, other)\nobject.__pow__(self, other[, modulo])\nobject.__lshift__(self, other)\nobject.__rshift__(self, other)\nobject.__and__(self, other)\nobject.__xor__(self, other)\nobject.__or__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations (``+``, ``-``, ``*``, ``//``, ``%``, ``divmod()``,\n ``pow()``, ``**``, ``<<``, ``>>``, ``&``, ``^``, ``|``). 
For\n instance, to evaluate the expression ``x + y``, where *x* is an\n instance of a class that has an ``__add__()`` method,\n ``x.__add__(y)`` is called. The ``__divmod__()`` method should be\n the equivalent to using ``__floordiv__()`` and ``__mod__()``; it\n should not be related to ``__truediv__()`` (described below). Note\n that ``__pow__()`` should be defined to accept an optional third\n argument if the ternary version of the built-in ``pow()`` function\n is to be supported.\n\n If one of those methods does not support the operation with the\n supplied arguments, it should return ``NotImplemented``.\n\nobject.__div__(self, other)\nobject.__truediv__(self, other)\n\n The division operator (``/``) is implemented by these methods. The\n ``__truediv__()`` method is used when ``__future__.division`` is in\n effect, otherwise ``__div__()`` is used. If only one of these two\n methods is defined, the object will not support division in the\n alternate context; ``TypeError`` will be raised instead.\n\nobject.__radd__(self, other)\nobject.__rsub__(self, other)\nobject.__rmul__(self, other)\nobject.__rdiv__(self, other)\nobject.__rtruediv__(self, other)\nobject.__rfloordiv__(self, other)\nobject.__rmod__(self, other)\nobject.__rdivmod__(self, other)\nobject.__rpow__(self, other)\nobject.__rlshift__(self, other)\nobject.__rrshift__(self, other)\nobject.__rand__(self, other)\nobject.__rxor__(self, other)\nobject.__ror__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations (``+``, ``-``, ``*``, ``/``, ``%``, ``divmod()``,\n ``pow()``, ``**``, ``<<``, ``>>``, ``&``, ``^``, ``|``) with\n reflected (swapped) operands. These functions are only called if\n the left operand does not support the corresponding operation and\n the operands are of different types. [2] For instance, to evaluate\n the expression ``x - y``, where *y* is an instance of a class that\n has an ``__rsub__()`` method, ``y.__rsub__(x)`` is called if\n ``x.__sub__(y)`` returns *NotImplemented*.\n\n Note that ternary ``pow()`` will not try calling ``__rpow__()``\n (the coercion rules would become too complicated).\n\n Note: If the right operand\'s type is a subclass of the left operand\'s\n type and that subclass provides the reflected method for the\n operation, this method will be called before the left operand\'s\n non-reflected method. This behavior allows subclasses to\n override their ancestors\' operations.\n\nobject.__iadd__(self, other)\nobject.__isub__(self, other)\nobject.__imul__(self, other)\nobject.__idiv__(self, other)\nobject.__itruediv__(self, other)\nobject.__ifloordiv__(self, other)\nobject.__imod__(self, other)\nobject.__ipow__(self, other[, modulo])\nobject.__ilshift__(self, other)\nobject.__irshift__(self, other)\nobject.__iand__(self, other)\nobject.__ixor__(self, other)\nobject.__ior__(self, other)\n\n These methods are called to implement the augmented arithmetic\n assignments (``+=``, ``-=``, ``*=``, ``/=``, ``//=``, ``%=``,\n ``**=``, ``<<=``, ``>>=``, ``&=``, ``^=``, ``|=``). These methods\n should attempt to do the operation in-place (modifying *self*) and\n return the result (which could be, but does not have to be,\n *self*). If a specific method is not defined, the augmented\n assignment falls back to the normal methods. For instance, to\n execute the statement ``x += y``, where *x* is an instance of a\n class that has an ``__iadd__()`` method, ``x.__iadd__(y)`` is\n called. 
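A compact sketch of how these methods cooperate; ``Length`` is a hypothetical class, and returning ``NotImplemented`` hands the operation to the other operand's reflected method as described above:

   class Length(object):
       """Hypothetical numeric-like type."""
       def __init__(self, metres):
           self.metres = metres
       def __add__(self, other):
           if isinstance(other, Length):
               return Length(self.metres + other.metres)
           return NotImplemented    # let the other operand try its reflected method
       __radd__ = __add__           # addition is symmetric here
       def __repr__(self):
           return 'Length(%r)' % self.metres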
If *x* is an instance of a class that does not define a\n ``__iadd__()`` method, ``x.__add__(y)`` and ``y.__radd__(x)`` are\n considered, as with the evaluation of ``x + y``.\n\nobject.__neg__(self)\nobject.__pos__(self)\nobject.__abs__(self)\nobject.__invert__(self)\n\n Called to implement the unary arithmetic operations (``-``, ``+``,\n ``abs()`` and ``~``).\n\nobject.__complex__(self)\nobject.__int__(self)\nobject.__long__(self)\nobject.__float__(self)\n\n Called to implement the built-in functions ``complex()``,\n ``int()``, ``long()``, and ``float()``. Should return a value of\n the appropriate type.\n\nobject.__oct__(self)\nobject.__hex__(self)\n\n Called to implement the built-in functions ``oct()`` and ``hex()``.\n Should return a string value.\n\nobject.__index__(self)\n\n Called to implement ``operator.index()``. Also called whenever\n Python needs an integer object (such as in slicing). Must return\n an integer (int or long).\n\n New in version 2.5.\n\nobject.__coerce__(self, other)\n\n Called to implement "mixed-mode" numeric arithmetic. Should either\n return a 2-tuple containing *self* and *other* converted to a\n common numeric type, or ``None`` if conversion is impossible. When\n the common type would be the type of ``other``, it is sufficient to\n return ``None``, since the interpreter will also ask the other\n object to attempt a coercion (but sometimes, if the implementation\n of the other type cannot be changed, it is useful to do the\n conversion to the other type here). A return value of\n ``NotImplemented`` is equivalent to returning ``None``.\n', - 'objects': '\nObjects, values and types\n*************************\n\n*Objects* are Python\'s abstraction for data. All data in a Python\nprogram is represented by objects or by relations between objects. (In\na sense, and in conformance to Von Neumann\'s model of a "stored\nprogram computer," code is also represented by objects.)\n\nEvery object has an identity, a type and a value. An object\'s\n*identity* never changes once it has been created; you may think of it\nas the object\'s address in memory. The \'``is``\' operator compares the\nidentity of two objects; the ``id()`` function returns an integer\nrepresenting its identity (currently implemented as its address). An\nobject\'s *type* is also unchangeable. [1] An object\'s type determines\nthe operations that the object supports (e.g., "does it have a\nlength?") and also defines the possible values for objects of that\ntype. The ``type()`` function returns an object\'s type (which is an\nobject itself). The *value* of some objects can change. Objects\nwhose value can change are said to be *mutable*; objects whose value\nis unchangeable once they are created are called *immutable*. (The\nvalue of an immutable container object that contains a reference to a\nmutable object can change when the latter\'s value is changed; however\nthe container is still considered immutable, because the collection of\nobjects it contains cannot be changed. So, immutability is not\nstrictly the same as having an unchangeable value, it is more subtle.)\nAn object\'s mutability is determined by its type; for instance,\nnumbers, strings and tuples are immutable, while dictionaries and\nlists are mutable.\n\nObjects are never explicitly destroyed; however, when they become\nunreachable they may be garbage-collected. 
An implementation is\nallowed to postpone garbage collection or omit it altogether --- it is\na matter of implementation quality how garbage collection is\nimplemented, as long as no objects are collected that are still\nreachable.\n\n**CPython implementation detail:** CPython currently uses a reference-\ncounting scheme with (optional) delayed detection of cyclically linked\ngarbage, which collects most objects as soon as they become\nunreachable, but is not guaranteed to collect garbage containing\ncircular references. See the documentation of the ``gc`` module for\ninformation on controlling the collection of cyclic garbage. Other\nimplementations act differently and CPython may change. Do not depend\non immediate finalization of objects when they become unreachable (ex:\nalways close files).\n\nNote that the use of the implementation\'s tracing or debugging\nfacilities may keep objects alive that would normally be collectable.\nAlso note that catching an exception with a \'``try``...``except``\'\nstatement may keep objects alive.\n\nSome objects contain references to "external" resources such as open\nfiles or windows. It is understood that these resources are freed\nwhen the object is garbage-collected, but since garbage collection is\nnot guaranteed to happen, such objects also provide an explicit way to\nrelease the external resource, usually a ``close()`` method. Programs\nare strongly recommended to explicitly close such objects. The\n\'``try``...``finally``\' statement provides a convenient way to do\nthis.\n\nSome objects contain references to other objects; these are called\n*containers*. Examples of containers are tuples, lists and\ndictionaries. The references are part of a container\'s value. In\nmost cases, when we talk about the value of a container, we imply the\nvalues, not the identities of the contained objects; however, when we\ntalk about the mutability of a container, only the identities of the\nimmediately contained objects are implied. So, if an immutable\ncontainer (like a tuple) contains a reference to a mutable object, its\nvalue changes if that mutable object is changed.\n\nTypes affect almost all aspects of object behavior. Even the\nimportance of object identity is affected in some sense: for immutable\ntypes, operations that compute new values may actually return a\nreference to any existing object with the same type and value, while\nfor mutable objects this is not allowed. E.g., after ``a = 1; b =\n1``, ``a`` and ``b`` may or may not refer to the same object with the\nvalue one, depending on the implementation, but after ``c = []; d =\n[]``, ``c`` and ``d`` are guaranteed to refer to two different,\nunique, newly created empty lists. (Note that ``c = d = []`` assigns\nthe same object to both ``c`` and ``d``.)\n', - 'operator-summary': '\nOperator precedence\n*******************\n\nThe following table summarizes the operator precedences in Python,\nfrom lowest precedence (least binding) to highest precedence (most\nbinding). Operators in the same box have the same precedence. Unless\nthe syntax is explicitly given, operators are binary. 
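Returning briefly to the point above about immutable containers that hold mutable objects, a short interactive sketch:

   >>> t = ('spam', [1, 2])
   >>> t[1].append(3)        # mutate the list the tuple refers to
   >>> t                     # the tuple is still immutable, but its value changed
   ('spam', [1, 2, 3])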
Operators in\nthe same box group left to right (except for comparisons, including\ntests, which all have the same precedence and chain from left to right\n--- see section *Comparisons* --- and exponentiation, which groups\nfrom right to left).\n\n+-------------------------------------------------+---------------------------------------+\n| Operator | Description |\n+=================================================+=======================================+\n| ``lambda`` | Lambda expression |\n+-------------------------------------------------+---------------------------------------+\n| ``if`` -- ``else`` | Conditional expression |\n+-------------------------------------------------+---------------------------------------+\n| ``or`` | Boolean OR |\n+-------------------------------------------------+---------------------------------------+\n| ``and`` | Boolean AND |\n+-------------------------------------------------+---------------------------------------+\n| ``not`` ``x`` | Boolean NOT |\n+-------------------------------------------------+---------------------------------------+\n| ``in``, ``not in``, ``is``, ``is not``, ``<``, | Comparisons, including membership |\n| ``<=``, ``>``, ``>=``, ``<>``, ``!=``, ``==`` | tests and identity tests |\n+-------------------------------------------------+---------------------------------------+\n| ``|`` | Bitwise OR |\n+-------------------------------------------------+---------------------------------------+\n| ``^`` | Bitwise XOR |\n+-------------------------------------------------+---------------------------------------+\n| ``&`` | Bitwise AND |\n+-------------------------------------------------+---------------------------------------+\n| ``<<``, ``>>`` | Shifts |\n+-------------------------------------------------+---------------------------------------+\n| ``+``, ``-`` | Addition and subtraction |\n+-------------------------------------------------+---------------------------------------+\n| ``*``, ``/``, ``//``, ``%`` | Multiplication, division, remainder |\n| | [8] |\n+-------------------------------------------------+---------------------------------------+\n| ``+x``, ``-x``, ``~x`` | Positive, negative, bitwise NOT |\n+-------------------------------------------------+---------------------------------------+\n| ``**`` | Exponentiation [9] |\n+-------------------------------------------------+---------------------------------------+\n| ``x[index]``, ``x[index:index]``, | Subscription, slicing, call, |\n| ``x(arguments...)``, ``x.attribute`` | attribute reference |\n+-------------------------------------------------+---------------------------------------+\n| ``(expressions...)``, ``[expressions...]``, | Binding or tuple display, list |\n| ``{key: value...}``, ```expressions...``` | display, dictionary display, string |\n| | conversion |\n+-------------------------------------------------+---------------------------------------+\n\n-[ Footnotes ]-\n\n[1] In Python 2.3 and later releases, a list comprehension "leaks" the\n control variables of each ``for`` it contains into the containing\n scope. However, this behavior is deprecated, and relying on it\n will not work in Python 3.\n\n[2] While ``abs(x%y) < abs(y)`` is true mathematically, for floats it\n may not be true numerically due to roundoff. 
For example, and\n assuming a platform on which a Python float is an IEEE 754 double-\n precision number, in order that ``-1e-100 % 1e100`` have the same\n sign as ``1e100``, the computed result is ``-1e-100 + 1e100``,\n which is numerically exactly equal to ``1e100``. The function\n ``math.fmod()`` returns a result whose sign matches the sign of\n the first argument instead, and so returns ``-1e-100`` in this\n case. Which approach is more appropriate depends on the\n application.\n\n[3] If x is very close to an exact integer multiple of y, it\'s\n possible for ``floor(x/y)`` to be one larger than ``(x-x%y)/y``\n due to rounding. In such cases, Python returns the latter result,\n in order to preserve that ``divmod(x,y)[0] * y + x % y`` be very\n close to ``x``.\n\n[4] While comparisons between unicode strings make sense at the byte\n level, they may be counter-intuitive to users. For example, the\n strings ``u"\\u00C7"`` and ``u"\\u0043\\u0327"`` compare differently,\n even though they both represent the same unicode character (LATIN\n CAPITAL LETTER C WITH CEDILLA). To compare strings in a human\n recognizable way, compare using ``unicodedata.normalize()``.\n\n[5] The implementation computes this efficiently, without constructing\n lists or sorting.\n\n[6] Earlier versions of Python used lexicographic comparison of the\n sorted (key, value) lists, but this was very expensive for the\n common case of comparing for equality. An even earlier version of\n Python compared dictionaries by identity only, but this caused\n surprises because people expected to be able to test a dictionary\n for emptiness by comparing it to ``{}``.\n\n[7] Due to automatic garbage-collection, free lists, and the dynamic\n nature of descriptors, you may notice seemingly unusual behaviour\n in certain uses of the ``is`` operator, like those involving\n comparisons between instance methods, or constants. Check their\n documentation for more info.\n\n[8] The ``%`` operator is also used for string formatting; the same\n precedence applies.\n\n[9] The power operator ``**`` binds less tightly than an arithmetic or\n bitwise unary operator on its right, that is, ``2**-1`` is\n ``0.5``.\n', - 'pass': '\nThe ``pass`` statement\n**********************\n\n pass_stmt ::= "pass"\n\n``pass`` is a null operation --- when it is executed, nothing happens.\nIt is useful as a placeholder when a statement is required\nsyntactically, but no code needs to be executed, for example:\n\n def f(arg): pass # a function that does nothing (yet)\n\n class C: pass # a class with no methods (yet)\n', - 'power': '\nThe power operator\n******************\n\nThe power operator binds more tightly than unary operators on its\nleft; it binds less tightly than unary operators on its right. The\nsyntax is:\n\n power ::= primary ["**" u_expr]\n\nThus, in an unparenthesized sequence of power and unary operators, the\noperators are evaluated from right to left (this does not constrain\nthe evaluation order for the operands): ``-1**2`` results in ``-1``.\n\nThe power operator has the same semantics as the built-in ``pow()``\nfunction, when called with two arguments: it yields its left argument\nraised to the power of its right argument. The numeric arguments are\nfirst converted to a common type. The result type is that of the\narguments after coercion.\n\nWith mixed operand types, the coercion rules for binary arithmetic\noperators apply. 
For int and long int operands, the result has the\nsame type as the operands (after coercion) unless the second argument\nis negative; in that case, all arguments are converted to float and a\nfloat result is delivered. For example, ``10**2`` returns ``100``, but\n``10**-2`` returns ``0.01``. (This last feature was added in Python\n2.2. In Python 2.1 and before, if both arguments were of integer types\nand the second argument was negative, an exception was raised).\n\nRaising ``0.0`` to a negative power results in a\n``ZeroDivisionError``. Raising a negative number to a fractional power\nresults in a ``ValueError``.\n', - 'print': '\nThe ``print`` statement\n***********************\n\n print_stmt ::= "print" ([expression ("," expression)* [","]]\n | ">>" expression [("," expression)+ [","]])\n\n``print`` evaluates each expression in turn and writes the resulting\nobject to standard output (see below). If an object is not a string,\nit is first converted to a string using the rules for string\nconversions. The (resulting or original) string is then written. A\nspace is written before each object is (converted and) written, unless\nthe output system believes it is positioned at the beginning of a\nline. This is the case (1) when no characters have yet been written\nto standard output, (2) when the last character written to standard\noutput is a whitespace character except ``\' \'``, or (3) when the last\nwrite operation on standard output was not a ``print`` statement. (In\nsome cases it may be functional to write an empty string to standard\noutput for this reason.)\n\nNote: Objects which act like file objects but which are not the built-in\n file objects often do not properly emulate this aspect of the file\n object\'s behavior, so it is best not to rely on this.\n\nA ``\'\\n\'`` character is written at the end, unless the ``print``\nstatement ends with a comma. This is the only action if the statement\ncontains just the keyword ``print``.\n\nStandard output is defined as the file object named ``stdout`` in the\nbuilt-in module ``sys``. If no such object exists, or if it does not\nhave a ``write()`` method, a ``RuntimeError`` exception is raised.\n\n``print`` also has an extended form, defined by the second portion of\nthe syntax described above. This form is sometimes referred to as\n"``print`` chevron." In this form, the first expression after the\n``>>`` must evaluate to a "file-like" object, specifically an object\nthat has a ``write()`` method as described above. With this extended\nform, the subsequent expressions are printed to this file object. If\nthe first expression evaluates to ``None``, then ``sys.stdout`` is\nused as the file for output.\n', - 'raise': '\nThe ``raise`` statement\n***********************\n\n raise_stmt ::= "raise" [expression ["," expression ["," expression]]]\n\nIf no expressions are present, ``raise`` re-raises the last exception\nthat was active in the current scope. If no exception is active in\nthe current scope, a ``TypeError`` exception is raised indicating that\nthis is an error (if running under IDLE, a ``Queue.Empty`` exception\nis raised instead).\n\nOtherwise, ``raise`` evaluates the expressions to get three objects,\nusing ``None`` as the value of omitted expressions. 
The first two\nobjects are used to determine the *type* and *value* of the exception.\n\nIf the first object is an instance, the type of the exception is the\nclass of the instance, the instance itself is the value, and the\nsecond object must be ``None``.\n\nIf the first object is a class, it becomes the type of the exception.\nThe second object is used to determine the exception value: If it is\nan instance of the class, the instance becomes the exception value. If\nthe second object is a tuple, it is used as the argument list for the\nclass constructor; if it is ``None``, an empty argument list is used,\nand any other object is treated as a single argument to the\nconstructor. The instance so created by calling the constructor is\nused as the exception value.\n\nIf a third object is present and not ``None``, it must be a traceback\nobject (see section *The standard type hierarchy*), and it is\nsubstituted instead of the current location as the place where the\nexception occurred. If the third object is present and not a\ntraceback object or ``None``, a ``TypeError`` exception is raised.\nThe three-expression form of ``raise`` is useful to re-raise an\nexception transparently in an except clause, but ``raise`` with no\nexpressions should be preferred if the exception to be re-raised was\nthe most recently active exception in the current scope.\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information about handling exceptions is in section\n*The try statement*.\n', - 'return': '\nThe ``return`` statement\n************************\n\n return_stmt ::= "return" [expression_list]\n\n``return`` may only occur syntactically nested in a function\ndefinition, not within a nested class definition.\n\nIf an expression list is present, it is evaluated, else ``None`` is\nsubstituted.\n\n``return`` leaves the current function call with the expression list\n(or ``None``) as return value.\n\nWhen ``return`` passes control out of a ``try`` statement with a\n``finally`` clause, that ``finally`` clause is executed before really\nleaving the function.\n\nIn a generator function, the ``return`` statement is not allowed to\ninclude an ``expression_list``. In that context, a bare ``return``\nindicates that the generator is done and will cause ``StopIteration``\nto be raised.\n', - 'sequence-types': "\nEmulating container types\n*************************\n\nThe following methods can be defined to implement container objects.\nContainers usually are sequences (such as lists or tuples) or mappings\n(like dictionaries), but can represent other containers as well. The\nfirst set of methods is used either to emulate a sequence or to\nemulate a mapping; the difference is that for a sequence, the\nallowable keys should be the integers *k* for which ``0 <= k < N``\nwhere *N* is the length of the sequence, or slice objects, which\ndefine a range of items. (For backwards compatibility, the method\n``__getslice__()`` (see below) can also be defined to handle simple,\nbut not extended slices.) It is also recommended that mappings provide\nthe methods ``keys()``, ``values()``, ``items()``, ``has_key()``,\n``get()``, ``clear()``, ``setdefault()``, ``iterkeys()``,\n``itervalues()``, ``iteritems()``, ``pop()``, ``popitem()``,\n``copy()``, and ``update()`` behaving similar to those for Python's\nstandard dictionary objects. 
The ``UserDict`` module provides a\n``DictMixin`` class to help create those methods from a base set of\n``__getitem__()``, ``__setitem__()``, ``__delitem__()``, and\n``keys()``. Mutable sequences should provide methods ``append()``,\n``count()``, ``index()``, ``extend()``, ``insert()``, ``pop()``,\n``remove()``, ``reverse()`` and ``sort()``, like Python standard list\nobjects. Finally, sequence types should implement addition (meaning\nconcatenation) and multiplication (meaning repetition) by defining the\nmethods ``__add__()``, ``__radd__()``, ``__iadd__()``, ``__mul__()``,\n``__rmul__()`` and ``__imul__()`` described below; they should not\ndefine ``__coerce__()`` or other numerical operators. It is\nrecommended that both mappings and sequences implement the\n``__contains__()`` method to allow efficient use of the ``in``\noperator; for mappings, ``in`` should be equivalent of ``has_key()``;\nfor sequences, it should search through the values. It is further\nrecommended that both mappings and sequences implement the\n``__iter__()`` method to allow efficient iteration through the\ncontainer; for mappings, ``__iter__()`` should be the same as\n``iterkeys()``; for sequences, it should iterate through the values.\n\nobject.__len__(self)\n\n Called to implement the built-in function ``len()``. Should return\n the length of the object, an integer ``>=`` 0. Also, an object\n that doesn't define a ``__nonzero__()`` method and whose\n ``__len__()`` method returns zero is considered to be false in a\n Boolean context.\n\nobject.__getitem__(self, key)\n\n Called to implement evaluation of ``self[key]``. For sequence\n types, the accepted keys should be integers and slice objects.\n Note that the special interpretation of negative indexes (if the\n class wishes to emulate a sequence type) is up to the\n ``__getitem__()`` method. If *key* is of an inappropriate type,\n ``TypeError`` may be raised; if of a value outside the set of\n indexes for the sequence (after any special interpretation of\n negative values), ``IndexError`` should be raised. For mapping\n types, if *key* is missing (not in the container), ``KeyError``\n should be raised.\n\n Note: ``for`` loops expect that an ``IndexError`` will be raised for\n illegal indexes to allow proper detection of the end of the\n sequence.\n\nobject.__setitem__(self, key, value)\n\n Called to implement assignment to ``self[key]``. Same note as for\n ``__getitem__()``. This should only be implemented for mappings if\n the objects support changes to the values for keys, or if new keys\n can be added, or for sequences if elements can be replaced. The\n same exceptions should be raised for improper *key* values as for\n the ``__getitem__()`` method.\n\nobject.__delitem__(self, key)\n\n Called to implement deletion of ``self[key]``. Same note as for\n ``__getitem__()``. This should only be implemented for mappings if\n the objects support removal of keys, or for sequences if elements\n can be removed from the sequence. The same exceptions should be\n raised for improper *key* values as for the ``__getitem__()``\n method.\n\nobject.__iter__(self)\n\n This method is called when an iterator is required for a container.\n This method should return a new iterator object that can iterate\n over all the objects in the container. For mappings, it should\n iterate over the keys of the container, and should also be made\n available as the method ``iterkeys()``.\n\n Iterator objects also need to implement this method; they are\n required to return themselves. 
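For instance, a small sequence-like wrapper (an illustrative sketch only; the ``Deck`` class and ``_cards`` attribute are invented names) can satisfy ``__len__()``, ``__getitem__()`` and ``__iter__()`` by delegating to an underlying list:

   class Deck:
       def __init__(self, cards):
           self._cards = list(cards)
       def __len__(self):
           # len(deck); also used for truth testing when __nonzero__()
           # is not defined.
           return len(self._cards)
       def __getitem__(self, index):
           # Integer and slice keys are both handled by the list.
           return self._cards[index]
       def __iter__(self):
           # The list iterator returned here already returns itself from
           # its own __iter__() method, as required of iterators.
           return iter(self._cards)

Because membership tests fall back to ``__iter__()`` when ``__contains__()`` is not defined, ``in`` also works on such an object, though a dedicated ``__contains__()`` could be more efficient.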
For more information on iterator\n objects, see *Iterator Types*.\n\nobject.__reversed__(self)\n\n Called (if present) by the ``reversed()`` built-in to implement\n reverse iteration. It should return a new iterator object that\n iterates over all the objects in the container in reverse order.\n\n If the ``__reversed__()`` method is not provided, the\n ``reversed()`` built-in will fall back to using the sequence\n protocol (``__len__()`` and ``__getitem__()``). Objects that\n support the sequence protocol should only provide\n ``__reversed__()`` if they can provide an implementation that is\n more efficient than the one provided by ``reversed()``.\n\n New in version 2.6.\n\nThe membership test operators (``in`` and ``not in``) are normally\nimplemented as an iteration through a sequence. However, container\nobjects can supply the following special method with a more efficient\nimplementation, which also does not require the object be a sequence.\n\nobject.__contains__(self, item)\n\n Called to implement membership test operators. Should return true\n if *item* is in *self*, false otherwise. For mapping objects, this\n should consider the keys of the mapping rather than the values or\n the key-item pairs.\n\n For objects that don't define ``__contains__()``, the membership\n test first tries iteration via ``__iter__()``, then the old\n sequence iteration protocol via ``__getitem__()``, see *this\n section in the language reference*.\n", - 'shifting': '\nShifting operations\n*******************\n\nThe shifting operations have lower priority than the arithmetic\noperations:\n\n shift_expr ::= a_expr | shift_expr ( "<<" | ">>" ) a_expr\n\nThese operators accept plain or long integers as arguments. The\narguments are converted to a common type. They shift the first\nargument to the left or right by the number of bits given by the\nsecond argument.\n\nA right shift by *n* bits is defined as division by ``pow(2, n)``. A\nleft shift by *n* bits is defined as multiplication with ``pow(2,\nn)``. Negative shift counts raise a ``ValueError`` exception.\n\nNote: In the current implementation, the right-hand operand is required to\n be at most ``sys.maxsize``. If the right-hand operand is larger\n than ``sys.maxsize`` an ``OverflowError`` exception is raised.\n', - 'slicings': '\nSlicings\n********\n\nA slicing selects a range of items in a sequence object (e.g., a\nstring, tuple or list). Slicings may be used as expressions or as\ntargets in assignment or ``del`` statements. The syntax for a\nslicing:\n\n slicing ::= simple_slicing | extended_slicing\n simple_slicing ::= primary "[" short_slice "]"\n extended_slicing ::= primary "[" slice_list "]"\n slice_list ::= slice_item ("," slice_item)* [","]\n slice_item ::= expression | proper_slice | ellipsis\n proper_slice ::= short_slice | long_slice\n short_slice ::= [lower_bound] ":" [upper_bound]\n long_slice ::= short_slice ":" [stride]\n lower_bound ::= expression\n upper_bound ::= expression\n stride ::= expression\n ellipsis ::= "..."\n\nThere is ambiguity in the formal syntax here: anything that looks like\nan expression list also looks like a slice list, so any subscription\ncan be interpreted as a slicing. Rather than further complicating the\nsyntax, this is disambiguated by defining that in this case the\ninterpretation as a subscription takes priority over the\ninterpretation as a slicing (this is the case if the slice list\ncontains no proper slice nor ellipses). 
Similarly, when the slice\nlist has exactly one short slice and no trailing comma, the\ninterpretation as a simple slicing takes priority over that as an\nextended slicing.\n\nThe semantics for a simple slicing are as follows. The primary must\nevaluate to a sequence object. The lower and upper bound expressions,\nif present, must evaluate to plain integers; defaults are zero and the\n``sys.maxint``, respectively. If either bound is negative, the\nsequence\'s length is added to it. The slicing now selects all items\nwith index *k* such that ``i <= k < j`` where *i* and *j* are the\nspecified lower and upper bounds. This may be an empty sequence. It\nis not an error if *i* or *j* lie outside the range of valid indexes\n(such items don\'t exist so they aren\'t selected).\n\nThe semantics for an extended slicing are as follows. The primary\nmust evaluate to a mapping object, and it is indexed with a key that\nis constructed from the slice list, as follows. If the slice list\ncontains at least one comma, the key is a tuple containing the\nconversion of the slice items; otherwise, the conversion of the lone\nslice item is the key. The conversion of a slice item that is an\nexpression is that expression. The conversion of an ellipsis slice\nitem is the built-in ``Ellipsis`` object. The conversion of a proper\nslice is a slice object (see section *The standard type hierarchy*)\nwhose ``start``, ``stop`` and ``step`` attributes are the values of\nthe expressions given as lower bound, upper bound and stride,\nrespectively, substituting ``None`` for missing expressions.\n', - 'specialattrs': '\nSpecial Attributes\n******************\n\nThe implementation adds a few special read-only attributes to several\nobject types, where they are relevant. Some of these are not reported\nby the ``dir()`` built-in function.\n\nobject.__dict__\n\n A dictionary or other mapping object used to store an object\'s\n (writable) attributes.\n\nobject.__methods__\n\n Deprecated since version 2.2: Use the built-in function ``dir()``\n to get a list of an object\'s attributes. This attribute is no\n longer available.\n\nobject.__members__\n\n Deprecated since version 2.2: Use the built-in function ``dir()``\n to get a list of an object\'s attributes. This attribute is no\n longer available.\n\ninstance.__class__\n\n The class to which a class instance belongs.\n\nclass.__bases__\n\n The tuple of base classes of a class object.\n\nclass.__name__\n\n The name of the class or type.\n\nThe following attributes are only supported by *new-style class*es.\n\nclass.__mro__\n\n This attribute is a tuple of classes that are considered when\n looking for base classes during method resolution.\n\nclass.mro()\n\n This method can be overridden by a metaclass to customize the\n method resolution order for its instances. It is called at class\n instantiation, and its result is stored in ``__mro__``.\n\nclass.__subclasses__()\n\n Each new-style class keeps a list of weak references to its\n immediate subclasses. This method returns a list of all those\n references still alive. 
Example:\n\n >>> int.__subclasses__()\n []\n\n-[ Footnotes ]-\n\n[1] Additional information on these special methods may be found in\n the Python Reference Manual (*Basic customization*).\n\n[2] As a consequence, the list ``[1, 2]`` is considered equal to\n ``[1.0, 2.0]``, and similarly for tuples.\n\n[3] They must have since the parser can\'t tell the type of the\n operands.\n\n[4] Cased characters are those with general category property being\n one of "Lu" (Letter, uppercase), "Ll" (Letter, lowercase), or "Lt"\n (Letter, titlecase).\n\n[5] To format only a tuple you should therefore provide a singleton\n tuple whose only element is the tuple to be formatted.\n\n[6] The advantage of leaving the newline on is that returning an empty\n string is then an unambiguous EOF indication. It is also possible\n (in cases where it might matter, for example, if you want to make\n an exact copy of a file while scanning its lines) to tell whether\n the last line of a file ended in a newline or not (yes this\n happens!).\n', - 'specialnames': '\nSpecial method names\n********************\n\nA class can implement certain operations that are invoked by special\nsyntax (such as arithmetic operations or subscripting and slicing) by\ndefining methods with special names. This is Python\'s approach to\n*operator overloading*, allowing classes to define their own behavior\nwith respect to language operators. For instance, if a class defines\na method named ``__getitem__()``, and ``x`` is an instance of this\nclass, then ``x[i]`` is roughly equivalent to ``x.__getitem__(i)`` for\nold-style classes and ``type(x).__getitem__(x, i)`` for new-style\nclasses. Except where mentioned, attempts to execute an operation\nraise an exception when no appropriate method is defined (typically\n``AttributeError`` or ``TypeError``).\n\nWhen implementing a class that emulates any built-in type, it is\nimportant that the emulation only be implemented to the degree that it\nmakes sense for the object being modelled. For example, some\nsequences may work well with retrieval of individual elements, but\nextracting a slice may not make sense. (One example of this is the\n``NodeList`` interface in the W3C\'s Document Object Model.)\n\n\nBasic customization\n===================\n\nobject.__new__(cls[, ...])\n\n Called to create a new instance of class *cls*. ``__new__()`` is a\n static method (special-cased so you need not declare it as such)\n that takes the class of which an instance was requested as its\n first argument. The remaining arguments are those passed to the\n object constructor expression (the call to the class). The return\n value of ``__new__()`` should be the new object instance (usually\n an instance of *cls*).\n\n Typical implementations create a new instance of the class by\n invoking the superclass\'s ``__new__()`` method using\n ``super(currentclass, cls).__new__(cls[, ...])`` with appropriate\n arguments and then modifying the newly-created instance as\n necessary before returning it.\n\n If ``__new__()`` returns an instance of *cls*, then the new\n instance\'s ``__init__()`` method will be invoked like\n ``__init__(self[, ...])``, where *self* is the new instance and the\n remaining arguments are the same as were passed to ``__new__()``.\n\n If ``__new__()`` does not return an instance of *cls*, then the new\n instance\'s ``__init__()`` method will not be invoked.\n\n ``__new__()`` is intended mainly to allow subclasses of immutable\n types (like int, str, or tuple) to customize instance creation. 
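As a minimal sketch of that use (the ``LowerStr`` name is invented for illustration), a ``str`` subclass has to adjust the value in ``__new__()``, because the instance is already immutable by the time ``__init__()`` runs:

   class LowerStr(str):
       def __new__(cls, value):
           # The normalized value must be passed to str.__new__();
           # changing it afterwards is impossible for an immutable type.
           return super(LowerStr, cls).__new__(cls, value.lower())

``LowerStr('Hello')`` then compares equal to ``'hello'``.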
It\n is also commonly overridden in custom metaclasses in order to\n customize class creation.\n\nobject.__init__(self[, ...])\n\n Called when the instance is created. The arguments are those\n passed to the class constructor expression. If a base class has an\n ``__init__()`` method, the derived class\'s ``__init__()`` method,\n if any, must explicitly call it to ensure proper initialization of\n the base class part of the instance; for example:\n ``BaseClass.__init__(self, [args...])``. As a special constraint\n on constructors, no value may be returned; doing so will cause a\n ``TypeError`` to be raised at runtime.\n\nobject.__del__(self)\n\n Called when the instance is about to be destroyed. This is also\n called a destructor. If a base class has a ``__del__()`` method,\n the derived class\'s ``__del__()`` method, if any, must explicitly\n call it to ensure proper deletion of the base class part of the\n instance. Note that it is possible (though not recommended!) for\n the ``__del__()`` method to postpone destruction of the instance by\n creating a new reference to it. It may then be called at a later\n time when this new reference is deleted. It is not guaranteed that\n ``__del__()`` methods are called for objects that still exist when\n the interpreter exits.\n\n Note: ``del x`` doesn\'t directly call ``x.__del__()`` --- the former\n decrements the reference count for ``x`` by one, and the latter\n is only called when ``x``\'s reference count reaches zero. Some\n common situations that may prevent the reference count of an\n object from going to zero include: circular references between\n objects (e.g., a doubly-linked list or a tree data structure with\n parent and child pointers); a reference to the object on the\n stack frame of a function that caught an exception (the traceback\n stored in ``sys.exc_traceback`` keeps the stack frame alive); or\n a reference to the object on the stack frame that raised an\n unhandled exception in interactive mode (the traceback stored in\n ``sys.last_traceback`` keeps the stack frame alive). The first\n situation can only be remedied by explicitly breaking the cycles;\n the latter two situations can be resolved by storing ``None`` in\n ``sys.exc_traceback`` or ``sys.last_traceback``. Circular\n references which are garbage are detected when the option cycle\n detector is enabled (it\'s on by default), but can only be cleaned\n up if there are no Python-level ``__del__()`` methods involved.\n Refer to the documentation for the ``gc`` module for more\n information about how ``__del__()`` methods are handled by the\n cycle detector, particularly the description of the ``garbage``\n value.\n\n Warning: Due to the precarious circumstances under which ``__del__()``\n methods are invoked, exceptions that occur during their execution\n are ignored, and a warning is printed to ``sys.stderr`` instead.\n Also, when ``__del__()`` is invoked in response to a module being\n deleted (e.g., when execution of the program is done), other\n globals referenced by the ``__del__()`` method may already have\n been deleted or in the process of being torn down (e.g. the\n import machinery shutting down). For this reason, ``__del__()``\n methods should do the absolute minimum needed to maintain\n external invariants. 
Starting with version 1.5, Python\n guarantees that globals whose name begins with a single\n underscore are deleted from their module before other globals are\n deleted; if no other references to such globals exist, this may\n help in assuring that imported modules are still available at the\n time when the ``__del__()`` method is called.\n\n See also the *-R* command-line option.\n\nobject.__repr__(self)\n\n Called by the ``repr()`` built-in function and by string\n conversions (reverse quotes) to compute the "official" string\n representation of an object. If at all possible, this should look\n like a valid Python expression that could be used to recreate an\n object with the same value (given an appropriate environment). If\n this is not possible, a string of the form ``<...some useful\n description...>`` should be returned. The return value must be a\n string object. If a class defines ``__repr__()`` but not\n ``__str__()``, then ``__repr__()`` is also used when an "informal"\n string representation of instances of that class is required.\n\n This is typically used for debugging, so it is important that the\n representation is information-rich and unambiguous.\n\nobject.__str__(self)\n\n Called by the ``str()`` built-in function and by the ``print``\n statement to compute the "informal" string representation of an\n object. This differs from ``__repr__()`` in that it does not have\n to be a valid Python expression: a more convenient or concise\n representation may be used instead. The return value must be a\n string object.\n\nobject.__lt__(self, other)\nobject.__le__(self, other)\nobject.__eq__(self, other)\nobject.__ne__(self, other)\nobject.__gt__(self, other)\nobject.__ge__(self, other)\n\n New in version 2.1.\n\n These are the so-called "rich comparison" methods, and are called\n for comparison operators in preference to ``__cmp__()`` below. The\n correspondence between operator symbols and method names is as\n follows: ``xy`` call ``x.__ne__(y)``, ``x>y`` calls ``x.__gt__(y)``, and\n ``x>=y`` calls ``x.__ge__(y)``.\n\n A rich comparison method may return the singleton\n ``NotImplemented`` if it does not implement the operation for a\n given pair of arguments. By convention, ``False`` and ``True`` are\n returned for a successful comparison. However, these methods can\n return any value, so if the comparison operator is used in a\n Boolean context (e.g., in the condition of an ``if`` statement),\n Python will call ``bool()`` on the value to determine if the result\n is true or false.\n\n There are no implied relationships among the comparison operators.\n The truth of ``x==y`` does not imply that ``x!=y`` is false.\n Accordingly, when defining ``__eq__()``, one should also define\n ``__ne__()`` so that the operators will behave as expected. 
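A minimal sketch of that advice (the ``Point`` class is invented for illustration) defines ``__ne__()`` in terms of ``__eq__()`` and returns ``NotImplemented`` for arguments it does not understand:

   class Point(object):
       def __init__(self, x, y):
           self.x, self.y = x, y
       def __eq__(self, other):
           if not isinstance(other, Point):
               # Let the other operand try its reflected method.
               return NotImplemented
           return self.x == other.x and self.y == other.y
       def __ne__(self, other):
           result = self.__eq__(other)
           if result is NotImplemented:
               return result
           return not result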
See\n the paragraph on ``__hash__()`` for some important notes on\n creating *hashable* objects which support custom comparison\n operations and are usable as dictionary keys.\n\n There are no swapped-argument versions of these methods (to be used\n when the left argument does not support the operation but the right\n argument does); rather, ``__lt__()`` and ``__gt__()`` are each\n other\'s reflection, ``__le__()`` and ``__ge__()`` are each other\'s\n reflection, and ``__eq__()`` and ``__ne__()`` are their own\n reflection.\n\n Arguments to rich comparison methods are never coerced.\n\n To automatically generate ordering operations from a single root\n operation, see ``functools.total_ordering()``.\n\nobject.__cmp__(self, other)\n\n Called by comparison operations if rich comparison (see above) is\n not defined. Should return a negative integer if ``self < other``,\n zero if ``self == other``, a positive integer if ``self > other``.\n If no ``__cmp__()``, ``__eq__()`` or ``__ne__()`` operation is\n defined, class instances are compared by object identity\n ("address"). See also the description of ``__hash__()`` for some\n important notes on creating *hashable* objects which support custom\n comparison operations and are usable as dictionary keys. (Note: the\n restriction that exceptions are not propagated by ``__cmp__()`` has\n been removed since Python 1.5.)\n\nobject.__rcmp__(self, other)\n\n Changed in version 2.1: No longer supported.\n\nobject.__hash__(self)\n\n Called by built-in function ``hash()`` and for operations on\n members of hashed collections including ``set``, ``frozenset``, and\n ``dict``. ``__hash__()`` should return an integer. The only\n required property is that objects which compare equal have the same\n hash value; it is advised to somehow mix together (e.g. using\n exclusive or) the hash values for the components of the object that\n also play a part in comparison of objects.\n\n If a class does not define a ``__cmp__()`` or ``__eq__()`` method\n it should not define a ``__hash__()`` operation either; if it\n defines ``__cmp__()`` or ``__eq__()`` but not ``__hash__()``, its\n instances will not be usable in hashed collections. If a class\n defines mutable objects and implements a ``__cmp__()`` or\n ``__eq__()`` method, it should not implement ``__hash__()``, since\n hashable collection implementations require that a object\'s hash\n value is immutable (if the object\'s hash value changes, it will be\n in the wrong hash bucket).\n\n User-defined classes have ``__cmp__()`` and ``__hash__()`` methods\n by default; with them, all objects compare unequal (except with\n themselves) and ``x.__hash__()`` returns a result derived from\n ``id(x)``.\n\n Classes which inherit a ``__hash__()`` method from a parent class\n but change the meaning of ``__cmp__()`` or ``__eq__()`` such that\n the hash value returned is no longer appropriate (e.g. 
by switching\n to a value-based concept of equality instead of the default\n identity based equality) can explicitly flag themselves as being\n unhashable by setting ``__hash__ = None`` in the class definition.\n Doing so means that not only will instances of the class raise an\n appropriate ``TypeError`` when a program attempts to retrieve their\n hash value, but they will also be correctly identified as\n unhashable when checking ``isinstance(obj, collections.Hashable)``\n (unlike classes which define their own ``__hash__()`` to explicitly\n raise ``TypeError``).\n\n Changed in version 2.5: ``__hash__()`` may now also return a long\n integer object; the 32-bit integer is then derived from the hash of\n that object.\n\n Changed in version 2.6: ``__hash__`` may now be set to ``None`` to\n explicitly flag instances of a class as unhashable.\n\nobject.__nonzero__(self)\n\n Called to implement truth value testing and the built-in operation\n ``bool()``; should return ``False`` or ``True``, or their integer\n equivalents ``0`` or ``1``. When this method is not defined,\n ``__len__()`` is called, if it is defined, and the object is\n considered true if its result is nonzero. If a class defines\n neither ``__len__()`` nor ``__nonzero__()``, all its instances are\n considered true.\n\nobject.__unicode__(self)\n\n Called to implement ``unicode()`` built-in; should return a Unicode\n object. When this method is not defined, string conversion is\n attempted, and the result of string conversion is converted to\n Unicode using the system default encoding.\n\n\nCustomizing attribute access\n============================\n\nThe following methods can be defined to customize the meaning of\nattribute access (use of, assignment to, or deletion of ``x.name``)\nfor class instances.\n\nobject.__getattr__(self, name)\n\n Called when an attribute lookup has not found the attribute in the\n usual places (i.e. it is not an instance attribute nor is it found\n in the class tree for ``self``). ``name`` is the attribute name.\n This method should return the (computed) attribute value or raise\n an ``AttributeError`` exception.\n\n Note that if the attribute is found through the normal mechanism,\n ``__getattr__()`` is not called. (This is an intentional asymmetry\n between ``__getattr__()`` and ``__setattr__()``.) This is done both\n for efficiency reasons and because otherwise ``__getattr__()``\n would have no way to access other attributes of the instance. Note\n that at least for instance variables, you can fake total control by\n not inserting any values in the instance attribute dictionary (but\n instead inserting them in another object). See the\n ``__getattribute__()`` method below for a way to actually get total\n control in new-style classes.\n\nobject.__setattr__(self, name, value)\n\n Called when an attribute assignment is attempted. This is called\n instead of the normal mechanism (i.e. store the value in the\n instance dictionary). *name* is the attribute name, *value* is the\n value to be assigned to it.\n\n If ``__setattr__()`` wants to assign to an instance attribute, it\n should not simply execute ``self.name = value`` --- this would\n cause a recursive call to itself. Instead, it should insert the\n value in the dictionary of instance attributes, e.g.,\n ``self.__dict__[name] = value``. 
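A minimal sketch of that pattern for an old-style class (the ``Simple`` name is invented here; the new-style alternative is described just below):

   class Simple:
       def __setattr__(self, name, value):
           # Store through the instance dictionary; assigning with
           # ``self.name = value`` here would call __setattr__() again
           # and recurse indefinitely.
           self.__dict__[name] = value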
For new-style classes, rather\n than accessing the instance dictionary, it should call the base\n class method with the same name, for example,\n ``object.__setattr__(self, name, value)``.\n\nobject.__delattr__(self, name)\n\n Like ``__setattr__()`` but for attribute deletion instead of\n assignment. This should only be implemented if ``del obj.name`` is\n meaningful for the object.\n\n\nMore attribute access for new-style classes\n-------------------------------------------\n\nThe following methods only apply to new-style classes.\n\nobject.__getattribute__(self, name)\n\n Called unconditionally to implement attribute accesses for\n instances of the class. If the class also defines\n ``__getattr__()``, the latter will not be called unless\n ``__getattribute__()`` either calls it explicitly or raises an\n ``AttributeError``. This method should return the (computed)\n attribute value or raise an ``AttributeError`` exception. In order\n to avoid infinite recursion in this method, its implementation\n should always call the base class method with the same name to\n access any attributes it needs, for example,\n ``object.__getattribute__(self, name)``.\n\n Note: This method may still be bypassed when looking up special methods\n as the result of implicit invocation via language syntax or\n built-in functions. See *Special method lookup for new-style\n classes*.\n\n\nImplementing Descriptors\n------------------------\n\nThe following methods only apply when an instance of the class\ncontaining the method (a so-called *descriptor* class) appears in an\n*owner* class (the descriptor must be in either the owner\'s class\ndictionary or in the class dictionary for one of its parents). In the\nexamples below, "the attribute" refers to the attribute whose name is\nthe key of the property in the owner class\' ``__dict__``.\n\nobject.__get__(self, instance, owner)\n\n Called to get the attribute of the owner class (class attribute\n access) or of an instance of that class (instance attribute\n access). *owner* is always the owner class, while *instance* is the\n instance that the attribute was accessed through, or ``None`` when\n the attribute is accessed through the *owner*. This method should\n return the (computed) attribute value or raise an\n ``AttributeError`` exception.\n\nobject.__set__(self, instance, value)\n\n Called to set the attribute on an instance *instance* of the owner\n class to a new value, *value*.\n\nobject.__delete__(self, instance)\n\n Called to delete the attribute on an instance *instance* of the\n owner class.\n\n\nInvoking Descriptors\n--------------------\n\nIn general, a descriptor is an object attribute with "binding\nbehavior", one whose attribute access has been overridden by methods\nin the descriptor protocol: ``__get__()``, ``__set__()``, and\n``__delete__()``. If any of those methods are defined for an object,\nit is said to be a descriptor.\n\nThe default behavior for attribute access is to get, set, or delete\nthe attribute from an object\'s dictionary. For instance, ``a.x`` has a\nlookup chain starting with ``a.__dict__[\'x\']``, then\n``type(a).__dict__[\'x\']``, and continuing through the base classes of\n``type(a)`` excluding metaclasses.\n\nHowever, if the looked-up value is an object defining one of the\ndescriptor methods, then Python may override the default behavior and\ninvoke the descriptor method instead. Where this occurs in the\nprecedence chain depends on which descriptor methods were defined and\nhow they were called. 
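For instance, a small data descriptor (an illustrative sketch; ``Positive`` and ``Account`` are invented names) defines both ``__get__()`` and ``__set__()``, so it takes precedence over the instance dictionary for the attribute it manages:

   class Positive(object):
       def __init__(self, name):
           self.name = name
       def __get__(self, instance, owner):
           if instance is None:
               # Accessed through the owner class itself.
               return self
           try:
               return instance.__dict__[self.name]
           except KeyError:
               raise AttributeError(self.name)
       def __set__(self, instance, value):
           if value <= 0:
               raise ValueError('%s must be positive' % self.name)
           instance.__dict__[self.name] = value

   class Account(object):
       balance = Positive('balance')

Assigning ``Account().balance = 10`` goes through ``Positive.__set__()``, and because this is a data descriptor it is still consulted on lookup even though the value ends up stored in the instance dictionary.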
Note that descriptors are only invoked for new\nstyle objects or classes (ones that subclass ``object()`` or\n``type()``).\n\nThe starting point for descriptor invocation is a binding, ``a.x``.\nHow the arguments are assembled depends on ``a``:\n\nDirect Call\n The simplest and least common call is when user code directly\n invokes a descriptor method: ``x.__get__(a)``.\n\nInstance Binding\n If binding to a new-style object instance, ``a.x`` is transformed\n into the call: ``type(a).__dict__[\'x\'].__get__(a, type(a))``.\n\nClass Binding\n If binding to a new-style class, ``A.x`` is transformed into the\n call: ``A.__dict__[\'x\'].__get__(None, A)``.\n\nSuper Binding\n If ``a`` is an instance of ``super``, then the binding ``super(B,\n obj).m()`` searches ``obj.__class__.__mro__`` for the base class\n ``A`` immediately preceding ``B`` and then invokes the descriptor\n with the call: ``A.__dict__[\'m\'].__get__(obj, obj.__class__)``.\n\nFor instance bindings, the precedence of descriptor invocation depends\non the which descriptor methods are defined. A descriptor can define\nany combination of ``__get__()``, ``__set__()`` and ``__delete__()``.\nIf it does not define ``__get__()``, then accessing the attribute will\nreturn the descriptor object itself unless there is a value in the\nobject\'s instance dictionary. If the descriptor defines ``__set__()``\nand/or ``__delete__()``, it is a data descriptor; if it defines\nneither, it is a non-data descriptor. Normally, data descriptors\ndefine both ``__get__()`` and ``__set__()``, while non-data\ndescriptors have just the ``__get__()`` method. Data descriptors with\n``__set__()`` and ``__get__()`` defined always override a redefinition\nin an instance dictionary. In contrast, non-data descriptors can be\noverridden by instances.\n\nPython methods (including ``staticmethod()`` and ``classmethod()``)\nare implemented as non-data descriptors. Accordingly, instances can\nredefine and override methods. This allows individual instances to\nacquire behaviors that differ from other instances of the same class.\n\nThe ``property()`` function is implemented as a data descriptor.\nAccordingly, instances cannot override the behavior of a property.\n\n\n__slots__\n---------\n\nBy default, instances of both old and new-style classes have a\ndictionary for attribute storage. This wastes space for objects\nhaving very few instance variables. The space consumption can become\nacute when creating large numbers of instances.\n\nThe default can be overridden by defining *__slots__* in a new-style\nclass definition. The *__slots__* declaration takes a sequence of\ninstance variables and reserves just enough space in each instance to\nhold a value for each variable. Space is saved because *__dict__* is\nnot created for each instance.\n\n__slots__\n\n This class variable can be assigned a string, iterable, or sequence\n of strings with variable names used by instances. If defined in a\n new-style class, *__slots__* reserves space for the declared\n variables and prevents the automatic creation of *__dict__* and\n *__weakref__* for each instance.\n\n New in version 2.2.\n\nNotes on using *__slots__*\n\n* When inheriting from a class without *__slots__*, the *__dict__*\n attribute of that class will always be accessible, so a *__slots__*\n definition in the subclass is meaningless.\n\n* Without a *__dict__* variable, instances cannot be assigned new\n variables not listed in the *__slots__* definition. 
Attempts to\n assign to an unlisted variable name raises ``AttributeError``. If\n dynamic assignment of new variables is desired, then add\n ``\'__dict__\'`` to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding ``\'__dict__\'`` to the\n *__slots__* declaration would not enable the assignment of new\n attributes not specifically listed in the sequence of instance\n variable names.\n\n* Without a *__weakref__* variable for each instance, classes defining\n *__slots__* do not support weak references to its instances. If weak\n reference support is needed, then add ``\'__weakref__\'`` to the\n sequence of strings in the *__slots__* declaration.\n\n Changed in version 2.3: Previously, adding ``\'__weakref__\'`` to the\n *__slots__* declaration would not enable support for weak\n references.\n\n* *__slots__* are implemented at the class level by creating\n descriptors (*Implementing Descriptors*) for each variable name. As\n a result, class attributes cannot be used to set default values for\n instance variables defined by *__slots__*; otherwise, the class\n attribute would overwrite the descriptor assignment.\n\n* The action of a *__slots__* declaration is limited to the class\n where it is defined. As a result, subclasses will have a *__dict__*\n unless they also define *__slots__* (which must only contain names\n of any *additional* slots).\n\n* If a class defines a slot also defined in a base class, the instance\n variable defined by the base class slot is inaccessible (except by\n retrieving its descriptor directly from the base class). This\n renders the meaning of the program undefined. In the future, a\n check may be added to prevent this.\n\n* Nonempty *__slots__* does not work for classes derived from\n "variable-length" built-in types such as ``long``, ``str`` and\n ``tuple``.\n\n* Any non-string iterable may be assigned to *__slots__*. Mappings may\n also be used; however, in the future, special meaning may be\n assigned to the values corresponding to each key.\n\n* *__class__* assignment works only if both classes have the same\n *__slots__*.\n\n Changed in version 2.6: Previously, *__class__* assignment raised an\n error if either new or old class had *__slots__*.\n\n\nCustomizing class creation\n==========================\n\nBy default, new-style classes are constructed using ``type()``. A\nclass definition is read into a separate namespace and the value of\nclass name is bound to the result of ``type(name, bases, dict)``.\n\nWhen the class definition is read, if *__metaclass__* is defined then\nthe callable assigned to it will be called instead of ``type()``. This\nallows classes or functions to be written which monitor or alter the\nclass creation process:\n\n* Modifying the class dictionary prior to the class being created.\n\n* Returning an instance of another class -- essentially performing the\n role of a factory function.\n\nThese steps will have to be performed in the metaclass\'s ``__new__()``\nmethod -- ``type.__new__()`` can then be called from this method to\ncreate a class with different properties. 
This example adds a new\nelement to the class dictionary before creating the class:\n\n class metacls(type):\n def __new__(mcs, name, bases, dict):\n dict[\'foo\'] = \'metacls was here\'\n return type.__new__(mcs, name, bases, dict)\n\nYou can of course also override other class methods (or add new\nmethods); for example defining a custom ``__call__()`` method in the\nmetaclass allows custom behavior when the class is called, e.g. not\nalways creating a new instance.\n\n__metaclass__\n\n This variable can be any callable accepting arguments for ``name``,\n ``bases``, and ``dict``. Upon class creation, the callable is used\n instead of the built-in ``type()``.\n\n New in version 2.2.\n\nThe appropriate metaclass is determined by the following precedence\nrules:\n\n* If ``dict[\'__metaclass__\']`` exists, it is used.\n\n* Otherwise, if there is at least one base class, its metaclass is\n used (this looks for a *__class__* attribute first and if not found,\n uses its type).\n\n* Otherwise, if a global variable named __metaclass__ exists, it is\n used.\n\n* Otherwise, the old-style, classic metaclass (types.ClassType) is\n used.\n\nThe potential uses for metaclasses are boundless. Some ideas that have\nbeen explored including logging, interface checking, automatic\ndelegation, automatic property creation, proxies, frameworks, and\nautomatic resource locking/synchronization.\n\n\nCustomizing instance and subclass checks\n========================================\n\nNew in version 2.6.\n\nThe following methods are used to override the default behavior of the\n``isinstance()`` and ``issubclass()`` built-in functions.\n\nIn particular, the metaclass ``abc.ABCMeta`` implements these methods\nin order to allow the addition of Abstract Base Classes (ABCs) as\n"virtual base classes" to any class or type (including built-in\ntypes), including other ABCs.\n\nclass.__instancecheck__(self, instance)\n\n Return true if *instance* should be considered a (direct or\n indirect) instance of *class*. If defined, called to implement\n ``isinstance(instance, class)``.\n\nclass.__subclasscheck__(self, subclass)\n\n Return true if *subclass* should be considered a (direct or\n indirect) subclass of *class*. If defined, called to implement\n ``issubclass(subclass, class)``.\n\nNote that these methods are looked up on the type (metaclass) of a\nclass. They cannot be defined as class methods in the actual class.\nThis is consistent with the lookup of special methods that are called\non instances, only in this case the instance is itself a class.\n\nSee also:\n\n **PEP 3119** - Introducing Abstract Base Classes\n Includes the specification for customizing ``isinstance()`` and\n ``issubclass()`` behavior through ``__instancecheck__()`` and\n ``__subclasscheck__()``, with motivation for this functionality\n in the context of adding Abstract Base Classes (see the ``abc``\n module) to the language.\n\n\nEmulating callable objects\n==========================\n\nobject.__call__(self[, args...])\n\n Called when the instance is "called" as a function; if this method\n is defined, ``x(arg1, arg2, ...)`` is a shorthand for\n ``x.__call__(arg1, arg2, ...)``.\n\n\nEmulating container types\n=========================\n\nThe following methods can be defined to implement container objects.\nContainers usually are sequences (such as lists or tuples) or mappings\n(like dictionaries), but can represent other containers as well. 
The\nfirst set of methods is used either to emulate a sequence or to\nemulate a mapping; the difference is that for a sequence, the\nallowable keys should be the integers *k* for which ``0 <= k < N``\nwhere *N* is the length of the sequence, or slice objects, which\ndefine a range of items. (For backwards compatibility, the method\n``__getslice__()`` (see below) can also be defined to handle simple,\nbut not extended slices.) It is also recommended that mappings provide\nthe methods ``keys()``, ``values()``, ``items()``, ``has_key()``,\n``get()``, ``clear()``, ``setdefault()``, ``iterkeys()``,\n``itervalues()``, ``iteritems()``, ``pop()``, ``popitem()``,\n``copy()``, and ``update()`` behaving similar to those for Python\'s\nstandard dictionary objects. The ``UserDict`` module provides a\n``DictMixin`` class to help create those methods from a base set of\n``__getitem__()``, ``__setitem__()``, ``__delitem__()``, and\n``keys()``. Mutable sequences should provide methods ``append()``,\n``count()``, ``index()``, ``extend()``, ``insert()``, ``pop()``,\n``remove()``, ``reverse()`` and ``sort()``, like Python standard list\nobjects. Finally, sequence types should implement addition (meaning\nconcatenation) and multiplication (meaning repetition) by defining the\nmethods ``__add__()``, ``__radd__()``, ``__iadd__()``, ``__mul__()``,\n``__rmul__()`` and ``__imul__()`` described below; they should not\ndefine ``__coerce__()`` or other numerical operators. It is\nrecommended that both mappings and sequences implement the\n``__contains__()`` method to allow efficient use of the ``in``\noperator; for mappings, ``in`` should be equivalent of ``has_key()``;\nfor sequences, it should search through the values. It is further\nrecommended that both mappings and sequences implement the\n``__iter__()`` method to allow efficient iteration through the\ncontainer; for mappings, ``__iter__()`` should be the same as\n``iterkeys()``; for sequences, it should iterate through the values.\n\nobject.__len__(self)\n\n Called to implement the built-in function ``len()``. Should return\n the length of the object, an integer ``>=`` 0. Also, an object\n that doesn\'t define a ``__nonzero__()`` method and whose\n ``__len__()`` method returns zero is considered to be false in a\n Boolean context.\n\nobject.__getitem__(self, key)\n\n Called to implement evaluation of ``self[key]``. For sequence\n types, the accepted keys should be integers and slice objects.\n Note that the special interpretation of negative indexes (if the\n class wishes to emulate a sequence type) is up to the\n ``__getitem__()`` method. If *key* is of an inappropriate type,\n ``TypeError`` may be raised; if of a value outside the set of\n indexes for the sequence (after any special interpretation of\n negative values), ``IndexError`` should be raised. For mapping\n types, if *key* is missing (not in the container), ``KeyError``\n should be raised.\n\n Note: ``for`` loops expect that an ``IndexError`` will be raised for\n illegal indexes to allow proper detection of the end of the\n sequence.\n\nobject.__setitem__(self, key, value)\n\n Called to implement assignment to ``self[key]``. Same note as for\n ``__getitem__()``. This should only be implemented for mappings if\n the objects support changes to the values for keys, or if new keys\n can be added, or for sequences if elements can be replaced. 
The\n same exceptions should be raised for improper *key* values as for\n the ``__getitem__()`` method.\n\nobject.__delitem__(self, key)\n\n Called to implement deletion of ``self[key]``. Same note as for\n ``__getitem__()``. This should only be implemented for mappings if\n the objects support removal of keys, or for sequences if elements\n can be removed from the sequence. The same exceptions should be\n raised for improper *key* values as for the ``__getitem__()``\n method.\n\nobject.__iter__(self)\n\n This method is called when an iterator is required for a container.\n This method should return a new iterator object that can iterate\n over all the objects in the container. For mappings, it should\n iterate over the keys of the container, and should also be made\n available as the method ``iterkeys()``.\n\n Iterator objects also need to implement this method; they are\n required to return themselves. For more information on iterator\n objects, see *Iterator Types*.\n\nobject.__reversed__(self)\n\n Called (if present) by the ``reversed()`` built-in to implement\n reverse iteration. It should return a new iterator object that\n iterates over all the objects in the container in reverse order.\n\n If the ``__reversed__()`` method is not provided, the\n ``reversed()`` built-in will fall back to using the sequence\n protocol (``__len__()`` and ``__getitem__()``). Objects that\n support the sequence protocol should only provide\n ``__reversed__()`` if they can provide an implementation that is\n more efficient than the one provided by ``reversed()``.\n\n New in version 2.6.\n\nThe membership test operators (``in`` and ``not in``) are normally\nimplemented as an iteration through a sequence. However, container\nobjects can supply the following special method with a more efficient\nimplementation, which also does not require the object be a sequence.\n\nobject.__contains__(self, item)\n\n Called to implement membership test operators. Should return true\n if *item* is in *self*, false otherwise. For mapping objects, this\n should consider the keys of the mapping rather than the values or\n the key-item pairs.\n\n For objects that don\'t define ``__contains__()``, the membership\n test first tries iteration via ``__iter__()``, then the old\n sequence iteration protocol via ``__getitem__()``, see *this\n section in the language reference*.\n\n\nAdditional methods for emulation of sequence types\n==================================================\n\nThe following optional methods can be defined to further emulate\nsequence objects. Immutable sequences methods should at most only\ndefine ``__getslice__()``; mutable sequences might define all three\nmethods.\n\nobject.__getslice__(self, i, j)\n\n Deprecated since version 2.0: Support slice objects as parameters\n to the ``__getitem__()`` method. (However, built-in types in\n CPython currently still implement ``__getslice__()``. Therefore,\n you have to override it in derived classes when implementing\n slicing.)\n\n Called to implement evaluation of ``self[i:j]``. The returned\n object should be of the same type as *self*. Note that missing *i*\n or *j* in the slice expression are replaced by zero or\n ``sys.maxint``, respectively. If negative indexes are used in the\n slice, the length of the sequence is added to that index. If the\n instance does not implement the ``__len__()`` method, an\n ``AttributeError`` is raised. No guarantee is made that indexes\n adjusted this way are not still negative. 
Indexes which are\n greater than the length of the sequence are not modified. If no\n ``__getslice__()`` is found, a slice object is created instead, and\n passed to ``__getitem__()`` instead.\n\nobject.__setslice__(self, i, j, sequence)\n\n Called to implement assignment to ``self[i:j]``. Same notes for *i*\n and *j* as for ``__getslice__()``.\n\n This method is deprecated. If no ``__setslice__()`` is found, or\n for extended slicing of the form ``self[i:j:k]``, a slice object is\n created, and passed to ``__setitem__()``, instead of\n ``__setslice__()`` being called.\n\nobject.__delslice__(self, i, j)\n\n Called to implement deletion of ``self[i:j]``. Same notes for *i*\n and *j* as for ``__getslice__()``. This method is deprecated. If no\n ``__delslice__()`` is found, or for extended slicing of the form\n ``self[i:j:k]``, a slice object is created, and passed to\n ``__delitem__()``, instead of ``__delslice__()`` being called.\n\nNotice that these methods are only invoked when a single slice with a\nsingle colon is used, and the slice method is available. For slice\noperations involving extended slice notation, or in absence of the\nslice methods, ``__getitem__()``, ``__setitem__()`` or\n``__delitem__()`` is called with a slice object as argument.\n\nThe following example demonstrate how to make your program or module\ncompatible with earlier versions of Python (assuming that methods\n``__getitem__()``, ``__setitem__()`` and ``__delitem__()`` support\nslice objects as arguments):\n\n class MyClass:\n ...\n def __getitem__(self, index):\n ...\n def __setitem__(self, index, value):\n ...\n def __delitem__(self, index):\n ...\n\n if sys.version_info < (2, 0):\n # They won\'t be defined if version is at least 2.0 final\n\n def __getslice__(self, i, j):\n return self[max(0, i):max(0, j):]\n def __setslice__(self, i, j, seq):\n self[max(0, i):max(0, j):] = seq\n def __delslice__(self, i, j):\n del self[max(0, i):max(0, j):]\n ...\n\nNote the calls to ``max()``; these are necessary because of the\nhandling of negative indices before the ``__*slice__()`` methods are\ncalled. When negative indexes are used, the ``__*item__()`` methods\nreceive them as provided, but the ``__*slice__()`` methods get a\n"cooked" form of the index values. For each negative index value, the\nlength of the sequence is added to the index before calling the method\n(which may still result in a negative index); this is the customary\nhandling of negative indexes by the built-in sequence types, and the\n``__*item__()`` methods are expected to do this as well. However,\nsince they should already be doing that, negative indexes cannot be\npassed in; they must be constrained to the bounds of the sequence\nbefore being passed to the ``__*item__()`` methods. 
Calling ``max(0,\ni)`` conveniently returns the proper value.\n\n\nEmulating numeric types\n=======================\n\nThe following methods can be defined to emulate numeric objects.\nMethods corresponding to operations that are not supported by the\nparticular kind of number implemented (e.g., bitwise operations for\nnon-integral numbers) should be left undefined.\n\nobject.__add__(self, other)\nobject.__sub__(self, other)\nobject.__mul__(self, other)\nobject.__floordiv__(self, other)\nobject.__mod__(self, other)\nobject.__divmod__(self, other)\nobject.__pow__(self, other[, modulo])\nobject.__lshift__(self, other)\nobject.__rshift__(self, other)\nobject.__and__(self, other)\nobject.__xor__(self, other)\nobject.__or__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations (``+``, ``-``, ``*``, ``//``, ``%``, ``divmod()``,\n ``pow()``, ``**``, ``<<``, ``>>``, ``&``, ``^``, ``|``). For\n instance, to evaluate the expression ``x + y``, where *x* is an\n instance of a class that has an ``__add__()`` method,\n ``x.__add__(y)`` is called. The ``__divmod__()`` method should be\n the equivalent to using ``__floordiv__()`` and ``__mod__()``; it\n should not be related to ``__truediv__()`` (described below). Note\n that ``__pow__()`` should be defined to accept an optional third\n argument if the ternary version of the built-in ``pow()`` function\n is to be supported.\n\n If one of those methods does not support the operation with the\n supplied arguments, it should return ``NotImplemented``.\n\nobject.__div__(self, other)\nobject.__truediv__(self, other)\n\n The division operator (``/``) is implemented by these methods. The\n ``__truediv__()`` method is used when ``__future__.division`` is in\n effect, otherwise ``__div__()`` is used. If only one of these two\n methods is defined, the object will not support division in the\n alternate context; ``TypeError`` will be raised instead.\n\nobject.__radd__(self, other)\nobject.__rsub__(self, other)\nobject.__rmul__(self, other)\nobject.__rdiv__(self, other)\nobject.__rtruediv__(self, other)\nobject.__rfloordiv__(self, other)\nobject.__rmod__(self, other)\nobject.__rdivmod__(self, other)\nobject.__rpow__(self, other)\nobject.__rlshift__(self, other)\nobject.__rrshift__(self, other)\nobject.__rand__(self, other)\nobject.__rxor__(self, other)\nobject.__ror__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations (``+``, ``-``, ``*``, ``/``, ``%``, ``divmod()``,\n ``pow()``, ``**``, ``<<``, ``>>``, ``&``, ``^``, ``|``) with\n reflected (swapped) operands. These functions are only called if\n the left operand does not support the corresponding operation and\n the operands are of different types. [2] For instance, to evaluate\n the expression ``x - y``, where *y* is an instance of a class that\n has an ``__rsub__()`` method, ``y.__rsub__(x)`` is called if\n ``x.__sub__(y)`` returns *NotImplemented*.\n\n Note that ternary ``pow()`` will not try calling ``__rpow__()``\n (the coercion rules would become too complicated).\n\n Note: If the right operand\'s type is a subclass of the left operand\'s\n type and that subclass provides the reflected method for the\n operation, this method will be called before the left operand\'s\n non-reflected method. 
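As a hedged illustration of the reflected-method fallback described above (the ``Metres`` class is hypothetical, not taken from the reference text), ``__add__()`` returns ``NotImplemented`` for operands it does not understand so that the right operand's ``__radd__()`` gets a chance:

    class Metres(object):
        def __init__(self, value):
            self.value = float(value)

        def __add__(self, other):
            if isinstance(other, Metres):
                return Metres(self.value + other.value)
            return NotImplemented      # let Python try other.__radd__(self)

        def __radd__(self, other):
            # Reached for e.g. ``1 + Metres(2)`` once int.__add__() has failed.
            if isinstance(other, (int, float)):
                return Metres(other + self.value)
            return NotImplemented

If a subclass of ``Metres`` supplied its own ``__radd__()``, that reflected method would be tried before ``Metres.__add__()`` whenever the subclass instance is the right operand.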
This behavior allows subclasses to\n override their ancestors\' operations.\n\nobject.__iadd__(self, other)\nobject.__isub__(self, other)\nobject.__imul__(self, other)\nobject.__idiv__(self, other)\nobject.__itruediv__(self, other)\nobject.__ifloordiv__(self, other)\nobject.__imod__(self, other)\nobject.__ipow__(self, other[, modulo])\nobject.__ilshift__(self, other)\nobject.__irshift__(self, other)\nobject.__iand__(self, other)\nobject.__ixor__(self, other)\nobject.__ior__(self, other)\n\n These methods are called to implement the augmented arithmetic\n assignments (``+=``, ``-=``, ``*=``, ``/=``, ``//=``, ``%=``,\n ``**=``, ``<<=``, ``>>=``, ``&=``, ``^=``, ``|=``). These methods\n should attempt to do the operation in-place (modifying *self*) and\n return the result (which could be, but does not have to be,\n *self*). If a specific method is not defined, the augmented\n assignment falls back to the normal methods. For instance, to\n execute the statement ``x += y``, where *x* is an instance of a\n class that has an ``__iadd__()`` method, ``x.__iadd__(y)`` is\n called. If *x* is an instance of a class that does not define a\n ``__iadd__()`` method, ``x.__add__(y)`` and ``y.__radd__(x)`` are\n considered, as with the evaluation of ``x + y``.\n\nobject.__neg__(self)\nobject.__pos__(self)\nobject.__abs__(self)\nobject.__invert__(self)\n\n Called to implement the unary arithmetic operations (``-``, ``+``,\n ``abs()`` and ``~``).\n\nobject.__complex__(self)\nobject.__int__(self)\nobject.__long__(self)\nobject.__float__(self)\n\n Called to implement the built-in functions ``complex()``,\n ``int()``, ``long()``, and ``float()``. Should return a value of\n the appropriate type.\n\nobject.__oct__(self)\nobject.__hex__(self)\n\n Called to implement the built-in functions ``oct()`` and ``hex()``.\n Should return a string value.\n\nobject.__index__(self)\n\n Called to implement ``operator.index()``. Also called whenever\n Python needs an integer object (such as in slicing). Must return\n an integer (int or long).\n\n New in version 2.5.\n\nobject.__coerce__(self, other)\n\n Called to implement "mixed-mode" numeric arithmetic. Should either\n return a 2-tuple containing *self* and *other* converted to a\n common numeric type, or ``None`` if conversion is impossible. When\n the common type would be the type of ``other``, it is sufficient to\n return ``None``, since the interpreter will also ask the other\n object to attempt a coercion (but sometimes, if the implementation\n of the other type cannot be changed, it is useful to do the\n conversion to the other type here). A return value of\n ``NotImplemented`` is equivalent to returning ``None``.\n\n\nCoercion rules\n==============\n\nThis section used to document the rules for coercion. As the language\nhas evolved, the coercion rules have become hard to document\nprecisely; documenting what one version of one particular\nimplementation does is undesirable. Instead, here are some informal\nguidelines regarding coercion. In Python 3, coercion will not be\nsupported.\n\n* If the left operand of a % operator is a string or Unicode object,\n no coercion takes place and the string formatting operation is\n invoked instead.\n\n* It is no longer recommended to define a coercion operation. 
Mixed-\n mode operations on types that don\'t define coercion pass the\n original arguments to the operation.\n\n* New-style classes (those derived from ``object``) never invoke the\n ``__coerce__()`` method in response to a binary operator; the only\n time ``__coerce__()`` is invoked is when the built-in function\n ``coerce()`` is called.\n\n* For most intents and purposes, an operator that returns\n ``NotImplemented`` is treated the same as one that is not\n implemented at all.\n\n* Below, ``__op__()`` and ``__rop__()`` are used to signify the\n generic method names corresponding to an operator; ``__iop__()`` is\n used for the corresponding in-place operator. For example, for the\n operator \'``+``\', ``__add__()`` and ``__radd__()`` are used for the\n left and right variant of the binary operator, and ``__iadd__()``\n for the in-place variant.\n\n* For objects *x* and *y*, first ``x.__op__(y)`` is tried. If this is\n not implemented or returns ``NotImplemented``, ``y.__rop__(x)`` is\n tried. If this is also not implemented or returns\n ``NotImplemented``, a ``TypeError`` exception is raised. But see\n the following exception:\n\n* Exception to the previous item: if the left operand is an instance\n of a built-in type or a new-style class, and the right operand is an\n instance of a proper subclass of that type or class and overrides\n the base\'s ``__rop__()`` method, the right operand\'s ``__rop__()``\n method is tried *before* the left operand\'s ``__op__()`` method.\n\n This is done so that a subclass can completely override binary\n operators. Otherwise, the left operand\'s ``__op__()`` method would\n always accept the right operand: when an instance of a given class\n is expected, an instance of a subclass of that class is always\n acceptable.\n\n* When either operand type defines a coercion, this coercion is called\n before that type\'s ``__op__()`` or ``__rop__()`` method is called,\n but no sooner. If the coercion returns an object of a different\n type for the operand whose coercion is invoked, part of the process\n is redone using the new object.\n\n* When an in-place operator (like \'``+=``\') is used, if the left\n operand implements ``__iop__()``, it is invoked without any\n coercion. When the operation falls back to ``__op__()`` and/or\n ``__rop__()``, the normal coercion rules apply.\n\n* In ``x + y``, if *x* is a sequence that implements sequence\n concatenation, sequence concatenation is invoked.\n\n* In ``x * y``, if one operand is a sequence that implements sequence\n repetition, and the other is an integer (``int`` or ``long``),\n sequence repetition is invoked.\n\n* Rich comparisons (implemented by methods ``__eq__()`` and so on)\n never use coercion. Three-way comparison (implemented by\n ``__cmp__()``) does use coercion under the same conditions as other\n binary operations use it.\n\n* In the current implementation, the built-in numeric types ``int``,\n ``long``, ``float``, and ``complex`` do not use coercion. All these\n types implement a ``__coerce__()`` method, for use by the built-in\n ``coerce()`` function.\n\n Changed in version 2.7.\n\n\nWith Statement Context Managers\n===============================\n\nNew in version 2.5.\n\nA *context manager* is an object that defines the runtime context to\nbe established when executing a ``with`` statement. The context\nmanager handles the entry into, and the exit from, the desired runtime\ncontext for the execution of the block of code. 
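To anticipate the methods documented just below, here is a minimal sketch of a context manager (the ``timed`` class is illustrative, not part of the original text); it only needs ``__enter__()`` and ``__exit__()``:

    import time

    class timed(object):
        """Report how long the managed block of code took."""

        def __enter__(self):
            self.start = time.time()
            return self                  # bound to the ``as`` target, if any

        def __exit__(self, exc_type, exc_value, traceback):
            self.elapsed = time.time() - self.start
            return False                 # a false value: do not suppress exceptions

Used as ``with timed() as t: ...``, the elapsed time is afterwards available as ``t.elapsed`` whether or not the block raised an exception, because ``__exit__()`` runs in both cases.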
Context managers are\nnormally invoked using the ``with`` statement (described in section\n*The with statement*), but can also be used by directly invoking their\nmethods.\n\nTypical uses of context managers include saving and restoring various\nkinds of global state, locking and unlocking resources, closing opened\nfiles, etc.\n\nFor more information on context managers, see *Context Manager Types*.\n\nobject.__enter__(self)\n\n Enter the runtime context related to this object. The ``with``\n statement will bind this method\'s return value to the target(s)\n specified in the ``as`` clause of the statement, if any.\n\nobject.__exit__(self, exc_type, exc_value, traceback)\n\n Exit the runtime context related to this object. The parameters\n describe the exception that caused the context to be exited. If the\n context was exited without an exception, all three arguments will\n be ``None``.\n\n If an exception is supplied, and the method wishes to suppress the\n exception (i.e., prevent it from being propagated), it should\n return a true value. Otherwise, the exception will be processed\n normally upon exit from this method.\n\n Note that ``__exit__()`` methods should not reraise the passed-in\n exception; this is the caller\'s responsibility.\n\nSee also:\n\n **PEP 0343** - The "with" statement\n The specification, background, and examples for the Python\n ``with`` statement.\n\n\nSpecial method lookup for old-style classes\n===========================================\n\nFor old-style classes, special methods are always looked up in exactly\nthe same way as any other method or attribute. This is the case\nregardless of whether the method is being looked up explicitly as in\n``x.__getitem__(i)`` or implicitly as in ``x[i]``.\n\nThis behaviour means that special methods may exhibit different\nbehaviour for different instances of a single old-style class if the\nappropriate special attributes are set differently:\n\n >>> class C:\n ... pass\n ...\n >>> c1 = C()\n >>> c2 = C()\n >>> c1.__len__ = lambda: 5\n >>> c2.__len__ = lambda: 9\n >>> len(c1)\n 5\n >>> len(c2)\n 9\n\n\nSpecial method lookup for new-style classes\n===========================================\n\nFor new-style classes, implicit invocations of special methods are\nonly guaranteed to work correctly if defined on an object\'s type, not\nin the object\'s instance dictionary. That behaviour is the reason why\nthe following code raises an exception (unlike the equivalent example\nwith old-style classes):\n\n >>> class C(object):\n ... pass\n ...\n >>> c = C()\n >>> c.__len__ = lambda: 5\n >>> len(c)\n Traceback (most recent call last):\n File "", line 1, in \n TypeError: object of type \'C\' has no len()\n\nThe rationale behind this behaviour lies with a number of special\nmethods such as ``__hash__()`` and ``__repr__()`` that are implemented\nby all objects, including type objects. 
If the implicit lookup of\nthese methods used the conventional lookup process, they would fail\nwhen invoked on the type object itself:\n\n >>> 1 .__hash__() == hash(1)\n True\n >>> int.__hash__() == hash(int)\n Traceback (most recent call last):\n File "", line 1, in \n TypeError: descriptor \'__hash__\' of \'int\' object needs an argument\n\nIncorrectly attempting to invoke an unbound method of a class in this\nway is sometimes referred to as \'metaclass confusion\', and is avoided\nby bypassing the instance when looking up special methods:\n\n >>> type(1).__hash__(1) == hash(1)\n True\n >>> type(int).__hash__(int) == hash(int)\n True\n\nIn addition to bypassing any instance attributes in the interest of\ncorrectness, implicit special method lookup generally also bypasses\nthe ``__getattribute__()`` method even of the object\'s metaclass:\n\n >>> class Meta(type):\n ... def __getattribute__(*args):\n ... print "Metaclass getattribute invoked"\n ... return type.__getattribute__(*args)\n ...\n >>> class C(object):\n ... __metaclass__ = Meta\n ... def __len__(self):\n ... return 10\n ... def __getattribute__(*args):\n ... print "Class getattribute invoked"\n ... return object.__getattribute__(*args)\n ...\n >>> c = C()\n >>> c.__len__() # Explicit lookup via instance\n Class getattribute invoked\n 10\n >>> type(c).__len__(c) # Explicit lookup via type\n Metaclass getattribute invoked\n 10\n >>> len(c) # Implicit lookup\n 10\n\nBypassing the ``__getattribute__()`` machinery in this fashion\nprovides significant scope for speed optimisations within the\ninterpreter, at the cost of some flexibility in the handling of\nspecial methods (the special method *must* be set on the class object\nitself in order to be consistently invoked by the interpreter).\n\n-[ Footnotes ]-\n\n[1] It *is* possible in some cases to change an object\'s type, under\n certain controlled conditions. It generally isn\'t a good idea\n though, since it can lead to some very strange behaviour if it is\n handled incorrectly.\n\n[2] For operands of the same type, it is assumed that if the non-\n reflected method (such as ``__add__()``) fails the operation is\n not supported, which is why the reflected method is not called.\n', - 'string-methods': '\nString Methods\n**************\n\nBelow are listed the string methods which both 8-bit strings and\nUnicode objects support. Some of them are also available on\n``bytearray`` objects.\n\nIn addition, Python\'s strings support the sequence type methods\ndescribed in the *Sequence Types --- str, unicode, list, tuple,\nbytearray, buffer, xrange* section. To output formatted strings use\ntemplate strings or the ``%`` operator described in the *String\nFormatting Operations* section. Also, see the ``re`` module for string\nfunctions based on regular expressions.\n\nstr.capitalize()\n\n Return a copy of the string with its first character capitalized\n and the rest lowercased.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.center(width[, fillchar])\n\n Return centered in a string of length *width*. Padding is done\n using the specified *fillchar* (default is a space).\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.count(sub[, start[, end]])\n\n Return the number of non-overlapping occurrences of substring *sub*\n in the range [*start*, *end*]. 
Optional arguments *start* and\n *end* are interpreted as in slice notation.\n\nstr.decode([encoding[, errors]])\n\n Decodes the string using the codec registered for *encoding*.\n *encoding* defaults to the default string encoding. *errors* may\n be given to set a different error handling scheme. The default is\n ``\'strict\'``, meaning that encoding errors raise ``UnicodeError``.\n Other possible values are ``\'ignore\'``, ``\'replace\'`` and any other\n name registered via ``codecs.register_error()``, see section *Codec\n Base Classes*.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for other error handling schemes\n added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.encode([encoding[, errors]])\n\n Return an encoded version of the string. Default encoding is the\n current default string encoding. *errors* may be given to set a\n different error handling scheme. The default for *errors* is\n ``\'strict\'``, meaning that encoding errors raise a\n ``UnicodeError``. Other possible values are ``\'ignore\'``,\n ``\'replace\'``, ``\'xmlcharrefreplace\'``, ``\'backslashreplace\'`` and\n any other name registered via ``codecs.register_error()``, see\n section *Codec Base Classes*. For a list of possible encodings, see\n section *Standard Encodings*.\n\n New in version 2.0.\n\n Changed in version 2.3: Support for ``\'xmlcharrefreplace\'`` and\n ``\'backslashreplace\'`` and other error handling schemes added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.endswith(suffix[, start[, end]])\n\n Return ``True`` if the string ends with the specified *suffix*,\n otherwise return ``False``. *suffix* can also be a tuple of\n suffixes to look for. With optional *start*, test beginning at\n that position. With optional *end*, stop comparing at that\n position.\n\n Changed in version 2.5: Accept tuples as *suffix*.\n\nstr.expandtabs([tabsize])\n\n Return a copy of the string where all tab characters are replaced\n by one or more spaces, depending on the current column and the\n given tab size. Tab positions occur every *tabsize* characters\n (default is 8, giving tab positions at columns 0, 8, 16 and so on).\n To expand the string, the current column is set to zero and the\n string is examined character by character. If the character is a\n tab (``\\t``), one or more space characters are inserted in the\n result until the current column is equal to the next tab position.\n (The tab character itself is not copied.) If the character is a\n newline (``\\n``) or return (``\\r``), it is copied and the current\n column is reset to zero. Any other character is copied unchanged\n and the current column is incremented by one regardless of how the\n character is represented when printed.\n\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs()\n \'01 012 0123 01234\'\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs(4)\n \'01 012 0123 01234\'\n\nstr.find(sub[, start[, end]])\n\n Return the lowest index in the string where substring *sub* is\n found, such that *sub* is contained in the slice ``s[start:end]``.\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return ``-1`` if *sub* is not found.\n\n Note: The ``find()`` method should be used only if you need to know the\n position of *sub*. To check if *sub* is a substring or not, use\n the ``in`` operator:\n\n >>> \'Py\' in \'Python\'\n True\n\nstr.format(*args, **kwargs)\n\n Perform a string formatting operation. 
The string on which this\n method is called can contain literal text or replacement fields\n delimited by braces ``{}``. Each replacement field contains either\n the numeric index of a positional argument, or the name of a\n keyword argument. Returns a copy of the string where each\n replacement field is replaced with the string value of the\n corresponding argument.\n\n >>> "The sum of 1 + 2 is {0}".format(1+2)\n \'The sum of 1 + 2 is 3\'\n\n See *Format String Syntax* for a description of the various\n formatting options that can be specified in format strings.\n\n This method of string formatting is the new standard in Python 3,\n and should be preferred to the ``%`` formatting described in\n *String Formatting Operations* in new code.\n\n New in version 2.6.\n\nstr.index(sub[, start[, end]])\n\n Like ``find()``, but raise ``ValueError`` when the substring is not\n found.\n\nstr.isalnum()\n\n Return true if all characters in the string are alphanumeric and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isalpha()\n\n Return true if all characters in the string are alphabetic and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isdigit()\n\n Return true if all characters in the string are digits and there is\n at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.islower()\n\n Return true if all cased characters [4] in the string are lowercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isspace()\n\n Return true if there are only whitespace characters in the string\n and there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.istitle()\n\n Return true if the string is a titlecased string and there is at\n least one character, for example uppercase characters may only\n follow uncased characters and lowercase characters only cased ones.\n Return false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isupper()\n\n Return true if all cased characters [4] in the string are uppercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.join(iterable)\n\n Return a string which is the concatenation of the strings in the\n *iterable* *iterable*. The separator between elements is the\n string providing this method.\n\nstr.ljust(width[, fillchar])\n\n Return the string left justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to ``len(s)``.\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.lower()\n\n Return a copy of the string with all the cased characters [4]\n converted to lowercase.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.lstrip([chars])\n\n Return a copy of the string with leading characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or ``None``, the *chars* argument defaults to\n removing whitespace. 
The *chars* argument is not a prefix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.lstrip()\n \'spacious \'\n >>> \'www.example.com\'.lstrip(\'cmowz.\')\n \'example.com\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.partition(sep)\n\n Split the string at the first occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing the string itself, followed by\n two empty strings.\n\n New in version 2.5.\n\nstr.replace(old, new[, count])\n\n Return a copy of the string with all occurrences of substring *old*\n replaced by *new*. If the optional argument *count* is given, only\n the first *count* occurrences are replaced.\n\nstr.rfind(sub[, start[, end]])\n\n Return the highest index in the string where substring *sub* is\n found, such that *sub* is contained within ``s[start:end]``.\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return ``-1`` on failure.\n\nstr.rindex(sub[, start[, end]])\n\n Like ``rfind()`` but raises ``ValueError`` when the substring *sub*\n is not found.\n\nstr.rjust(width[, fillchar])\n\n Return the string right justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to ``len(s)``.\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.rpartition(sep)\n\n Split the string at the last occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing two empty strings, followed by\n the string itself.\n\n New in version 2.5.\n\nstr.rsplit([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit* splits\n are done, the *rightmost* ones. If *sep* is not specified or\n ``None``, any whitespace string is a separator. Except for\n splitting from the right, ``rsplit()`` behaves like ``split()``\n which is described in detail below.\n\n New in version 2.4.\n\nstr.rstrip([chars])\n\n Return a copy of the string with trailing characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or ``None``, the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a suffix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.rstrip()\n \' spacious\'\n >>> \'mississippi\'.rstrip(\'ipz\')\n \'mississ\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.split([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit*\n splits are done (thus, the list will have at most ``maxsplit+1``\n elements). If *maxsplit* is not specified or ``-1``, then there is\n no limit on the number of splits (all possible splits are made).\n\n If *sep* is given, consecutive delimiters are not grouped together\n and are deemed to delimit empty strings (for example,\n ``\'1,,2\'.split(\',\')`` returns ``[\'1\', \'\', \'2\']``). The *sep*\n argument may consist of multiple characters (for example,\n ``\'1<>2<>3\'.split(\'<>\')`` returns ``[\'1\', \'2\', \'3\']``). 
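A few illustrative calls (an aside, not from the original text) contrasting ``partition()``, ``split()`` and ``rsplit()``:

    >>> 'www.example.com'.partition('.')
    ('www', '.', 'example.com')
    >>> '1,2,3'.split(',', 1)
    ['1', '2,3']
    >>> '1,2,3'.rsplit(',', 1)
    ['1,2', '3']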
Splitting\n an empty string with a specified separator returns ``[\'\']``.\n\n If *sep* is not specified or is ``None``, a different splitting\n algorithm is applied: runs of consecutive whitespace are regarded\n as a single separator, and the result will contain no empty strings\n at the start or end if the string has leading or trailing\n whitespace. Consequently, splitting an empty string or a string\n consisting of just whitespace with a ``None`` separator returns\n ``[]``.\n\n For example, ``\' 1 2 3 \'.split()`` returns ``[\'1\', \'2\', \'3\']``,\n and ``\' 1 2 3 \'.split(None, 1)`` returns ``[\'1\', \'2 3 \']``.\n\nstr.splitlines([keepends])\n\n Return a list of the lines in the string, breaking at line\n boundaries. This method uses the *universal newlines* approach to\n splitting lines. Line breaks are not included in the resulting list\n unless *keepends* is given and true.\n\n For example, ``\'ab c\\n\\nde fg\\rkl\\r\\n\'.splitlines()`` returns\n ``[\'ab c\', \'\', \'de fg\', \'kl\']``, while the same call with\n ``splitlines(True)`` returns ``[\'ab c\\n\', \'\\n\', \'de fg\\r\',\n \'kl\\r\\n\']``.\n\n Unlike ``split()`` when a delimiter string *sep* is given, this\n method returns an empty list for the empty string, and a terminal\n line break does not result in an extra line.\n\nstr.startswith(prefix[, start[, end]])\n\n Return ``True`` if string starts with the *prefix*, otherwise\n return ``False``. *prefix* can also be a tuple of prefixes to look\n for. With optional *start*, test string beginning at that\n position. With optional *end*, stop comparing string at that\n position.\n\n Changed in version 2.5: Accept tuples as *prefix*.\n\nstr.strip([chars])\n\n Return a copy of the string with the leading and trailing\n characters removed. The *chars* argument is a string specifying the\n set of characters to be removed. If omitted or ``None``, the\n *chars* argument defaults to removing whitespace. The *chars*\n argument is not a prefix or suffix; rather, all combinations of its\n values are stripped:\n\n >>> \' spacious \'.strip()\n \'spacious\'\n >>> \'www.example.com\'.strip(\'cmowz.\')\n \'example\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.swapcase()\n\n Return a copy of the string with uppercase characters converted to\n lowercase and vice versa.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.title()\n\n Return a titlecased version of the string where words start with an\n uppercase character and the remaining characters are lowercase.\n\n The algorithm uses a simple language-independent definition of a\n word as groups of consecutive letters. The definition works in\n many contexts but it means that apostrophes in contractions and\n possessives form word boundaries, which may not be the desired\n result:\n\n >>> "they\'re bill\'s friends from the UK".title()\n "They\'Re Bill\'S Friends From The Uk"\n\n A workaround for apostrophes can be constructed using regular\n expressions:\n\n >>> import re\n >>> def titlecase(s):\n ... return re.sub(r"[A-Za-z]+(\'[A-Za-z]+)?",\n ... lambda mo: mo.group(0)[0].upper() +\n ... mo.group(0)[1:].lower(),\n ... 
s)\n ...\n >>> titlecase("they\'re bill\'s friends.")\n "They\'re Bill\'s Friends."\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.translate(table[, deletechars])\n\n Return a copy of the string where all characters occurring in the\n optional argument *deletechars* are removed, and the remaining\n characters have been mapped through the given translation table,\n which must be a string of length 256.\n\n You can use the ``maketrans()`` helper function in the ``string``\n module to create a translation table. For string objects, set the\n *table* argument to ``None`` for translations that only delete\n characters:\n\n >>> \'read this short text\'.translate(None, \'aeiou\')\n \'rd ths shrt txt\'\n\n New in version 2.6: Support for a ``None`` *table* argument.\n\n For Unicode objects, the ``translate()`` method does not accept the\n optional *deletechars* argument. Instead, it returns a copy of the\n *s* where all characters have been mapped through the given\n translation table which must be a mapping of Unicode ordinals to\n Unicode ordinals, Unicode strings or ``None``. Unmapped characters\n are left untouched. Characters mapped to ``None`` are deleted.\n Note, a more flexible approach is to create a custom character\n mapping codec using the ``codecs`` module (see ``encodings.cp1251``\n for an example).\n\nstr.upper()\n\n Return a copy of the string with all the cased characters [4]\n converted to uppercase. Note that ``str.upper().isupper()`` might\n be ``False`` if ``s`` contains uncased characters or if the Unicode\n category of the resulting character(s) is not "Lu" (Letter,\n uppercase), but e.g. "Lt" (Letter, titlecase).\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.zfill(width)\n\n Return the numeric string left filled with zeros in a string of\n length *width*. A sign prefix is handled correctly. The original\n string is returned if *width* is less than or equal to ``len(s)``.\n\n New in version 2.2.2.\n\nThe following methods are present only on unicode objects:\n\nunicode.isnumeric()\n\n Return ``True`` if there are only numeric characters in S,\n ``False`` otherwise. Numeric characters include digit characters,\n and all characters that have the Unicode numeric value property,\n e.g. U+2155, VULGAR FRACTION ONE FIFTH.\n\nunicode.isdecimal()\n\n Return ``True`` if there are only decimal characters in S,\n ``False`` otherwise. Decimal characters include digit characters,\n and all characters that can be used to form decimal-radix numbers,\n e.g. U+0660, ARABIC-INDIC DIGIT ZERO.\n', - 'strings': '\nString literals\n***************\n\nString literals are described by the following lexical definitions:\n\n stringliteral ::= [stringprefix](shortstring | longstring)\n stringprefix ::= "r" | "u" | "ur" | "R" | "U" | "UR" | "Ur" | "uR"\n | "b" | "B" | "br" | "Br" | "bR" | "BR"\n shortstring ::= "\'" shortstringitem* "\'" | \'"\' shortstringitem* \'"\'\n longstring ::= "\'\'\'" longstringitem* "\'\'\'"\n | \'"""\' longstringitem* \'"""\'\n shortstringitem ::= shortstringchar | escapeseq\n longstringitem ::= longstringchar | escapeseq\n shortstringchar ::= \n longstringchar ::= \n escapeseq ::= "\\" \n\nOne syntactic restriction not indicated by these productions is that\nwhitespace is not allowed between the ``stringprefix`` and the rest of\nthe string literal. 
The source character set is defined by the\nencoding declaration; it is ASCII if no encoding declaration is given\nin the source file; see section *Encoding declarations*.\n\nIn plain English: String literals can be enclosed in matching single\nquotes (``\'``) or double quotes (``"``). They can also be enclosed in\nmatching groups of three single or double quotes (these are generally\nreferred to as *triple-quoted strings*). The backslash (``\\``)\ncharacter is used to escape characters that otherwise have a special\nmeaning, such as newline, backslash itself, or the quote character.\nString literals may optionally be prefixed with a letter ``\'r\'`` or\n``\'R\'``; such strings are called *raw strings* and use different rules\nfor interpreting backslash escape sequences. A prefix of ``\'u\'`` or\n``\'U\'`` makes the string a Unicode string. Unicode strings use the\nUnicode character set as defined by the Unicode Consortium and ISO\n10646. Some additional escape sequences, described below, are\navailable in Unicode strings. A prefix of ``\'b\'`` or ``\'B\'`` is\nignored in Python 2; it indicates that the literal should become a\nbytes literal in Python 3 (e.g. when code is automatically converted\nwith 2to3). A ``\'u\'`` or ``\'b\'`` prefix may be followed by an ``\'r\'``\nprefix.\n\nIn triple-quoted strings, unescaped newlines and quotes are allowed\n(and are retained), except that three unescaped quotes in a row\nterminate the string. (A "quote" is the character used to open the\nstring, i.e. either ``\'`` or ``"``.)\n\nUnless an ``\'r\'`` or ``\'R\'`` prefix is present, escape sequences in\nstrings are interpreted according to rules similar to those used by\nStandard C. The recognized escape sequences are:\n\n+-------------------+-----------------------------------+---------+\n| Escape Sequence | Meaning | Notes |\n+===================+===================================+=========+\n| ``\\newline`` | Ignored | |\n+-------------------+-----------------------------------+---------+\n| ``\\\\`` | Backslash (``\\``) | |\n+-------------------+-----------------------------------+---------+\n| ``\\\'`` | Single quote (``\'``) | |\n+-------------------+-----------------------------------+---------+\n| ``\\"`` | Double quote (``"``) | |\n+-------------------+-----------------------------------+---------+\n| ``\\a`` | ASCII Bell (BEL) | |\n+-------------------+-----------------------------------+---------+\n| ``\\b`` | ASCII Backspace (BS) | |\n+-------------------+-----------------------------------+---------+\n| ``\\f`` | ASCII Formfeed (FF) | |\n+-------------------+-----------------------------------+---------+\n| ``\\n`` | ASCII Linefeed (LF) | |\n+-------------------+-----------------------------------+---------+\n| ``\\N{name}`` | Character named *name* in the | |\n| | Unicode database (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| ``\\r`` | ASCII Carriage Return (CR) | |\n+-------------------+-----------------------------------+---------+\n| ``\\t`` | ASCII Horizontal Tab (TAB) | |\n+-------------------+-----------------------------------+---------+\n| ``\\uxxxx`` | Character with 16-bit hex value | (1) |\n| | *xxxx* (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| ``\\Uxxxxxxxx`` | Character with 32-bit hex value | (2) |\n| | *xxxxxxxx* (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| ``\\v`` | ASCII Vertical Tab (VT) | 
|\n+-------------------+-----------------------------------+---------+\n| ``\\ooo`` | Character with octal value *ooo* | (3,5) |\n+-------------------+-----------------------------------+---------+\n| ``\\xhh`` | Character with hex value *hh* | (4,5) |\n+-------------------+-----------------------------------+---------+\n\nNotes:\n\n1. Individual code units which form parts of a surrogate pair can be\n encoded using this escape sequence.\n\n2. Any Unicode character can be encoded this way, but characters\n outside the Basic Multilingual Plane (BMP) will be encoded using a\n surrogate pair if Python is compiled to use 16-bit code units (the\n default).\n\n3. As in Standard C, up to three octal digits are accepted.\n\n4. Unlike in Standard C, exactly two hex digits are required.\n\n5. In a string literal, hexadecimal and octal escapes denote the byte\n with the given value; it is not necessary that the byte encodes a\n character in the source character set. In a Unicode literal, these\n escapes denote a Unicode character with the given value.\n\nUnlike Standard C, all unrecognized escape sequences are left in the\nstring unchanged, i.e., *the backslash is left in the string*. (This\nbehavior is useful when debugging: if an escape sequence is mistyped,\nthe resulting output is more easily recognized as broken.) It is also\nimportant to note that the escape sequences marked as "(Unicode only)"\nin the table above fall into the category of unrecognized escapes for\nnon-Unicode string literals.\n\nWhen an ``\'r\'`` or ``\'R\'`` prefix is present, a character following a\nbackslash is included in the string without change, and *all\nbackslashes are left in the string*. For example, the string literal\n``r"\\n"`` consists of two characters: a backslash and a lowercase\n``\'n\'``. String quotes can be escaped with a backslash, but the\nbackslash remains in the string; for example, ``r"\\""`` is a valid\nstring literal consisting of two characters: a backslash and a double\nquote; ``r"\\"`` is not a valid string literal (even a raw string\ncannot end in an odd number of backslashes). Specifically, *a raw\nstring cannot end in a single backslash* (since the backslash would\nescape the following quote character). Note also that a single\nbackslash followed by a newline is interpreted as those two characters\nas part of the string, *not* as a line continuation.\n\nWhen an ``\'r\'`` or ``\'R\'`` prefix is used in conjunction with a\n``\'u\'`` or ``\'U\'`` prefix, then the ``\\uXXXX`` and ``\\UXXXXXXXX``\nescape sequences are processed while *all other backslashes are left\nin the string*. For example, the string literal ``ur"\\u0062\\n"``\nconsists of three Unicode characters: \'LATIN SMALL LETTER B\', \'REVERSE\nSOLIDUS\', and \'LATIN SMALL LETTER N\'. Backslashes can be escaped with\na preceding backslash; however, both remain in the string. As a\nresult, ``\\uXXXX`` escape sequences are only recognized when there are\nan odd number of backslashes.\n', - 'subscriptions': '\nSubscriptions\n*************\n\nA subscription selects an item of a sequence (string, tuple or list)\nor mapping (dictionary) object:\n\n subscription ::= primary "[" expression_list "]"\n\nThe primary must evaluate to an object of a sequence or mapping type.\n\nIf the primary is a mapping, the expression list must evaluate to an\nobject whose value is one of the keys of the mapping, and the\nsubscription selects the value in the mapping that corresponds to that\nkey. 
(The expression list is a tuple except if it has exactly one\nitem.)\n\nIf the primary is a sequence, the expression (list) must evaluate to a\nplain integer. If this value is negative, the length of the sequence\nis added to it (so that, e.g., ``x[-1]`` selects the last item of\n``x``.) The resulting value must be a nonnegative integer less than\nthe number of items in the sequence, and the subscription selects the\nitem whose index is that value (counting from zero).\n\nA string\'s items are characters. A character is not a separate data\ntype but a string of exactly one character.\n', - 'truth': "\nTruth Value Testing\n*******************\n\nAny object can be tested for truth value, for use in an ``if`` or\n``while`` condition or as operand of the Boolean operations below. The\nfollowing values are considered false:\n\n* ``None``\n\n* ``False``\n\n* zero of any numeric type, for example, ``0``, ``0L``, ``0.0``,\n ``0j``.\n\n* any empty sequence, for example, ``''``, ``()``, ``[]``.\n\n* any empty mapping, for example, ``{}``.\n\n* instances of user-defined classes, if the class defines a\n ``__nonzero__()`` or ``__len__()`` method, when that method returns\n the integer zero or ``bool`` value ``False``. [1]\n\nAll other values are considered true --- so objects of many types are\nalways true.\n\nOperations and built-in functions that have a Boolean result always\nreturn ``0`` or ``False`` for false and ``1`` or ``True`` for true,\nunless otherwise stated. (Important exception: the Boolean operations\n``or`` and ``and`` always return one of their operands.)\n", - 'try': '\nThe ``try`` statement\n*********************\n\nThe ``try`` statement specifies exception handlers and/or cleanup code\nfor a group of statements:\n\n try_stmt ::= try1_stmt | try2_stmt\n try1_stmt ::= "try" ":" suite\n ("except" [expression [("as" | ",") target]] ":" suite)+\n ["else" ":" suite]\n ["finally" ":" suite]\n try2_stmt ::= "try" ":" suite\n "finally" ":" suite\n\nChanged in version 2.5: In previous versions of Python,\n``try``...``except``...``finally`` did not work. ``try``...``except``\nhad to be nested in ``try``...``finally``.\n\nThe ``except`` clause(s) specify one or more exception handlers. When\nno exception occurs in the ``try`` clause, no exception handler is\nexecuted. When an exception occurs in the ``try`` suite, a search for\nan exception handler is started. This search inspects the except\nclauses in turn until one is found that matches the exception. An\nexpression-less except clause, if present, must be last; it matches\nany exception. For an except clause with an expression, that\nexpression is evaluated, and the clause matches the exception if the\nresulting object is "compatible" with the exception. An object is\ncompatible with an exception if it is the class or a base class of the\nexception object, or a tuple containing an item compatible with the\nexception.\n\nIf no except clause matches the exception, the search for an exception\nhandler continues in the surrounding code and on the invocation stack.\n[1]\n\nIf the evaluation of an expression in the header of an except clause\nraises an exception, the original search for a handler is canceled and\na search starts for the new exception in the surrounding code and on\nthe call stack (it is treated as if the entire ``try`` statement\nraised the exception).\n\nWhen a matching except clause is found, the exception is assigned to\nthe target specified in that except clause, if present, and the except\nclause\'s suite is executed. 
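A short illustrative session (not part of the original text) showing the exception object being bound to the target named in the ``except`` clause:

    >>> try:
    ...     {}['missing']
    ... except KeyError as err:       # "except KeyError, err:" is the older spelling
    ...     print 'no such key:', err
    ...
    no such key: 'missing'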
All except clauses must have an\nexecutable block. When the end of this block is reached, execution\ncontinues normally after the entire try statement. (This means that\nif two nested handlers exist for the same exception, and the exception\noccurs in the try clause of the inner handler, the outer handler will\nnot handle the exception.)\n\nBefore an except clause\'s suite is executed, details about the\nexception are assigned to three variables in the ``sys`` module:\n``sys.exc_type`` receives the object identifying the exception;\n``sys.exc_value`` receives the exception\'s parameter;\n``sys.exc_traceback`` receives a traceback object (see section *The\nstandard type hierarchy*) identifying the point in the program where\nthe exception occurred. These details are also available through the\n``sys.exc_info()`` function, which returns a tuple ``(exc_type,\nexc_value, exc_traceback)``. Use of the corresponding variables is\ndeprecated in favor of this function, since their use is unsafe in a\nthreaded program. As of Python 1.5, the variables are restored to\ntheir previous values (before the call) when returning from a function\nthat handled an exception.\n\nThe optional ``else`` clause is executed if and when control flows off\nthe end of the ``try`` clause. [2] Exceptions in the ``else`` clause\nare not handled by the preceding ``except`` clauses.\n\nIf ``finally`` is present, it specifies a \'cleanup\' handler. The\n``try`` clause is executed, including any ``except`` and ``else``\nclauses. If an exception occurs in any of the clauses and is not\nhandled, the exception is temporarily saved. The ``finally`` clause is\nexecuted. If there is a saved exception, it is re-raised at the end\nof the ``finally`` clause. If the ``finally`` clause raises another\nexception or executes a ``return`` or ``break`` statement, the saved\nexception is discarded:\n\n >>> def f():\n ... try:\n ... 1/0\n ... finally:\n ... return 42\n ...\n >>> f()\n 42\n\nThe exception information is not available to the program during\nexecution of the ``finally`` clause.\n\nWhen a ``return``, ``break`` or ``continue`` statement is executed in\nthe ``try`` suite of a ``try``...``finally`` statement, the\n``finally`` clause is also executed \'on the way out.\' A ``continue``\nstatement is illegal in the ``finally`` clause. (The reason is a\nproblem with the current implementation --- this restriction may be\nlifted in the future).\n\nThe return value of a function is determined by the last ``return``\nstatement executed. Since the ``finally`` clause always executes, a\n``return`` statement executed in the ``finally`` clause will always be\nthe last one executed:\n\n >>> def foo():\n ... try:\n ... return \'try\'\n ... finally:\n ... return \'finally\'\n ...\n >>> foo()\n \'finally\'\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information on using the ``raise`` statement to\ngenerate exceptions may be found in section *The raise statement*.\n', - 'types': '\nThe standard type hierarchy\n***************************\n\nBelow is a list of the types that are built into Python. Extension\nmodules (written in C, Java, or other languages, depending on the\nimplementation) can define additional types. 
Future versions of\nPython may add types to the type hierarchy (e.g., rational numbers,\nefficiently stored arrays of integers, etc.).\n\nSome of the type descriptions below contain a paragraph listing\n\'special attributes.\' These are attributes that provide access to the\nimplementation and are not intended for general use. Their definition\nmay change in the future.\n\nNone\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name ``None``.\n It is used to signify the absence of a value in many situations,\n e.g., it is returned from functions that don\'t explicitly return\n anything. Its truth value is false.\n\nNotImplemented\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name\n ``NotImplemented``. Numeric methods and rich comparison methods may\n return this value if they do not implement the operation for the\n operands provided. (The interpreter will then try the reflected\n operation, or some other fallback, depending on the operator.) Its\n truth value is true.\n\nEllipsis\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name\n ``Ellipsis``. It is used to indicate the presence of the ``...``\n syntax in a slice. Its truth value is true.\n\n``numbers.Number``\n These are created by numeric literals and returned as results by\n arithmetic operators and arithmetic built-in functions. Numeric\n objects are immutable; once created their value never changes.\n Python numbers are of course strongly related to mathematical\n numbers, but subject to the limitations of numerical representation\n in computers.\n\n Python distinguishes between integers, floating point numbers, and\n complex numbers:\n\n ``numbers.Integral``\n These represent elements from the mathematical set of integers\n (positive and negative).\n\n There are three types of integers:\n\n Plain integers\n These represent numbers in the range -2147483648 through\n 2147483647. (The range may be larger on machines with a\n larger natural word size, but not smaller.) When the result\n of an operation would fall outside this range, the result is\n normally returned as a long integer (in some cases, the\n exception ``OverflowError`` is raised instead). For the\n purpose of shift and mask operations, integers are assumed to\n have a binary, 2\'s complement notation using 32 or more bits,\n and hiding no bits from the user (i.e., all 4294967296\n different bit patterns correspond to different values).\n\n Long integers\n These represent numbers in an unlimited range, subject to\n available (virtual) memory only. For the purpose of shift\n and mask operations, a binary representation is assumed, and\n negative numbers are represented in a variant of 2\'s\n complement which gives the illusion of an infinite string of\n sign bits extending to the left.\n\n Booleans\n These represent the truth values False and True. The two\n objects representing the values ``False`` and ``True`` are\n the only Boolean objects. 
The Boolean type is a subtype of\n plain integers, and Boolean values behave like the values 0\n and 1, respectively, in almost all contexts, the exception\n being that when converted to a string, the strings\n ``"False"`` or ``"True"`` are returned, respectively.\n\n The rules for integer representation are intended to give the\n most meaningful interpretation of shift and mask operations\n involving negative integers and the least surprises when\n switching between the plain and long integer domains. Any\n operation, if it yields a result in the plain integer domain,\n will yield the same result in the long integer domain or when\n using mixed operands. The switch between domains is transparent\n to the programmer.\n\n ``numbers.Real`` (``float``)\n These represent machine-level double precision floating point\n numbers. You are at the mercy of the underlying machine\n architecture (and C or Java implementation) for the accepted\n range and handling of overflow. Python does not support single-\n precision floating point numbers; the savings in processor and\n memory usage that are usually the reason for using these is\n dwarfed by the overhead of using objects in Python, so there is\n no reason to complicate the language with two kinds of floating\n point numbers.\n\n ``numbers.Complex``\n These represent complex numbers as a pair of machine-level\n double precision floating point numbers. The same caveats apply\n as for floating point numbers. The real and imaginary parts of a\n complex number ``z`` can be retrieved through the read-only\n attributes ``z.real`` and ``z.imag``.\n\nSequences\n These represent finite ordered sets indexed by non-negative\n numbers. The built-in function ``len()`` returns the number of\n items of a sequence. When the length of a sequence is *n*, the\n index set contains the numbers 0, 1, ..., *n*-1. Item *i* of\n sequence *a* is selected by ``a[i]``.\n\n Sequences also support slicing: ``a[i:j]`` selects all items with\n index *k* such that *i* ``<=`` *k* ``<`` *j*. When used as an\n expression, a slice is a sequence of the same type. This implies\n that the index set is renumbered so that it starts at 0.\n\n Some sequences also support "extended slicing" with a third "step"\n parameter: ``a[i:j:k]`` selects all items of *a* with index *x*\n where ``x = i + n*k``, *n* ``>=`` ``0`` and *i* ``<=`` *x* ``<``\n *j*.\n\n Sequences are distinguished according to their mutability:\n\n Immutable sequences\n An object of an immutable sequence type cannot change once it is\n created. (If the object contains references to other objects,\n these other objects may be mutable and may be changed; however,\n the collection of objects directly referenced by an immutable\n object cannot change.)\n\n The following types are immutable sequences:\n\n Strings\n The items of a string are characters. There is no separate\n character type; a character is represented by a string of one\n item. Characters represent (at least) 8-bit bytes. The\n built-in functions ``chr()`` and ``ord()`` convert between\n characters and nonnegative integers representing the byte\n values. Bytes with the values 0-127 usually represent the\n corresponding ASCII values, but the interpretation of values\n is up to the program. 
The string data type is also used to\n represent arrays of bytes, e.g., to hold data read from a\n file.\n\n (On systems whose native character set is not ASCII, strings\n may use EBCDIC in their internal representation, provided the\n functions ``chr()`` and ``ord()`` implement a mapping between\n ASCII and EBCDIC, and string comparison preserves the ASCII\n order. Or perhaps someone can propose a better rule?)\n\n Unicode\n The items of a Unicode object are Unicode code units. A\n Unicode code unit is represented by a Unicode object of one\n item and can hold either a 16-bit or 32-bit value\n representing a Unicode ordinal (the maximum value for the\n ordinal is given in ``sys.maxunicode``, and depends on how\n Python is configured at compile time). Surrogate pairs may\n be present in the Unicode object, and will be reported as two\n separate items. The built-in functions ``unichr()`` and\n ``ord()`` convert between code units and nonnegative integers\n representing the Unicode ordinals as defined in the Unicode\n Standard 3.0. Conversion from and to other encodings are\n possible through the Unicode method ``encode()`` and the\n built-in function ``unicode()``.\n\n Tuples\n The items of a tuple are arbitrary Python objects. Tuples of\n two or more items are formed by comma-separated lists of\n expressions. A tuple of one item (a \'singleton\') can be\n formed by affixing a comma to an expression (an expression by\n itself does not create a tuple, since parentheses must be\n usable for grouping of expressions). An empty tuple can be\n formed by an empty pair of parentheses.\n\n Mutable sequences\n Mutable sequences can be changed after they are created. The\n subscription and slicing notations can be used as the target of\n assignment and ``del`` (delete) statements.\n\n There are currently two intrinsic mutable sequence types:\n\n Lists\n The items of a list are arbitrary Python objects. Lists are\n formed by placing a comma-separated list of expressions in\n square brackets. (Note that there are no special cases needed\n to form lists of length 0 or 1.)\n\n Byte Arrays\n A bytearray object is a mutable array. They are created by\n the built-in ``bytearray()`` constructor. Aside from being\n mutable (and hence unhashable), byte arrays otherwise provide\n the same interface and functionality as immutable bytes\n objects.\n\n The extension module ``array`` provides an additional example of\n a mutable sequence type.\n\nSet types\n These represent unordered, finite sets of unique, immutable\n objects. As such, they cannot be indexed by any subscript. However,\n they can be iterated over, and the built-in function ``len()``\n returns the number of items in a set. Common uses for sets are fast\n membership testing, removing duplicates from a sequence, and\n computing mathematical operations such as intersection, union,\n difference, and symmetric difference.\n\n For set elements, the same immutability rules apply as for\n dictionary keys. Note that numeric types obey the normal rules for\n numeric comparison: if two numbers compare equal (e.g., ``1`` and\n ``1.0``), only one of them can be contained in a set.\n\n There are currently two intrinsic set types:\n\n Sets\n These represent a mutable set. They are created by the built-in\n ``set()`` constructor and can be modified afterwards by several\n methods, such as ``add()``.\n\n Frozen sets\n These represent an immutable set. They are created by the\n built-in ``frozenset()`` constructor. 
As a frozenset is\n immutable and *hashable*, it can be used again as an element of\n another set, or as a dictionary key.\n\nMappings\n These represent finite sets of objects indexed by arbitrary index\n sets. The subscript notation ``a[k]`` selects the item indexed by\n ``k`` from the mapping ``a``; this can be used in expressions and\n as the target of assignments or ``del`` statements. The built-in\n function ``len()`` returns the number of items in a mapping.\n\n There is currently a single intrinsic mapping type:\n\n Dictionaries\n These represent finite sets of objects indexed by nearly\n arbitrary values. The only types of values not acceptable as\n keys are values containing lists or dictionaries or other\n mutable types that are compared by value rather than by object\n identity, the reason being that the efficient implementation of\n dictionaries requires a key\'s hash value to remain constant.\n Numeric types used for keys obey the normal rules for numeric\n comparison: if two numbers compare equal (e.g., ``1`` and\n ``1.0``) then they can be used interchangeably to index the same\n dictionary entry.\n\n Dictionaries are mutable; they can be created by the ``{...}``\n notation (see section *Dictionary displays*).\n\n The extension modules ``dbm``, ``gdbm``, and ``bsddb`` provide\n additional examples of mapping types.\n\nCallable types\n These are the types to which the function call operation (see\n section *Calls*) can be applied:\n\n User-defined functions\n A user-defined function object is created by a function\n definition (see section *Function definitions*). It should be\n called with an argument list containing the same number of items\n as the function\'s formal parameter list.\n\n Special attributes:\n\n +-------------------------+---------------------------------+-------------+\n | Attribute | Meaning | |\n +=========================+=================================+=============+\n | ``__doc__`` | The function\'s documentation | Writable |\n | ``func_doc`` | string, or ``None`` if | |\n | | unavailable. | |\n +-------------------------+---------------------------------+-------------+\n | ``__name__`` | The function\'s name. | Writable |\n | ``func_name`` | | |\n +-------------------------+---------------------------------+-------------+\n | ``__module__`` | The name of the module the | Writable |\n | | function was defined in, or | |\n | | ``None`` if unavailable. | |\n +-------------------------+---------------------------------+-------------+\n | ``__defaults__`` | A tuple containing default | Writable |\n | ``func_defaults`` | argument values for those | |\n | | arguments that have defaults, | |\n | | or ``None`` if no arguments | |\n | | have a default value. | |\n +-------------------------+---------------------------------+-------------+\n | ``__code__`` | The code object representing | Writable |\n | ``func_code`` | the compiled function body. | |\n +-------------------------+---------------------------------+-------------+\n | ``__globals__`` | A reference to the dictionary | Read-only |\n | ``func_globals`` | that holds the function\'s | |\n | | global variables --- the global | |\n | | namespace of the module in | |\n | | which the function was defined. | |\n +-------------------------+---------------------------------+-------------+\n | ``__dict__`` | The namespace supporting | Writable |\n | ``func_dict`` | arbitrary function attributes. 
| |\n +-------------------------+---------------------------------+-------------+\n | ``__closure__`` | ``None`` or a tuple of cells | Read-only |\n | ``func_closure`` | that contain bindings for the | |\n | | function\'s free variables. | |\n +-------------------------+---------------------------------+-------------+\n\n Most of the attributes labelled "Writable" check the type of the\n assigned value.\n\n Changed in version 2.4: ``func_name`` is now writable.\n\n Changed in version 2.6: The double-underscore attributes\n ``__closure__``, ``__code__``, ``__defaults__``, and\n ``__globals__`` were introduced as aliases for the corresponding\n ``func_*`` attributes for forwards compatibility with Python 3.\n\n Function objects also support getting and setting arbitrary\n attributes, which can be used, for example, to attach metadata\n to functions. Regular attribute dot-notation is used to get and\n set such attributes. *Note that the current implementation only\n supports function attributes on user-defined functions. Function\n attributes on built-in functions may be supported in the\n future.*\n\n Additional information about a function\'s definition can be\n retrieved from its code object; see the description of internal\n types below.\n\n User-defined methods\n A user-defined method object combines a class, a class instance\n (or ``None``) and any callable object (normally a user-defined\n function).\n\n Special read-only attributes: ``im_self`` is the class instance\n object, ``im_func`` is the function object; ``im_class`` is the\n class of ``im_self`` for bound methods or the class that asked\n for the method for unbound methods; ``__doc__`` is the method\'s\n documentation (same as ``im_func.__doc__``); ``__name__`` is the\n method name (same as ``im_func.__name__``); ``__module__`` is\n the name of the module the method was defined in, or ``None`` if\n unavailable.\n\n Changed in version 2.2: ``im_self`` used to refer to the class\n that defined the method.\n\n Changed in version 2.6: For Python 3 forward-compatibility,\n ``im_func`` is also available as ``__func__``, and ``im_self``\n as ``__self__``.\n\n Methods also support accessing (but not setting) the arbitrary\n function attributes on the underlying function object.\n\n User-defined method objects may be created when getting an\n attribute of a class (perhaps via an instance of that class), if\n that attribute is a user-defined function object, an unbound\n user-defined method object, or a class method object. When the\n attribute is a user-defined method object, a new method object\n is only created if the class from which it is being retrieved is\n the same as, or a derived class of, the class stored in the\n original method object; otherwise, the original method object is\n used as it is.\n\n When a user-defined method object is created by retrieving a\n user-defined function object from a class, its ``im_self``\n attribute is ``None`` and the method object is said to be\n unbound. When one is created by retrieving a user-defined\n function object from a class via one of its instances, its\n ``im_self`` attribute is the instance, and the method object is\n said to be bound. 
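A minimal sketch of bound and unbound methods under the Python 2 semantics described above (the class ``C`` is invented for illustration; unbound methods no longer exist in Python 3):

    >>> class C(object):
    ...     def f(self, x):
    ...         return x
    ...
    >>> c = C()
    >>> C.f.im_self is None     # retrieved from the class: unbound
    True
    >>> c.f.im_self is c        # retrieved from an instance: bound to that instance
    True
    >>> c.f(1) == C.f(c, 1)     # the instance is inserted in front of the argument list
    True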
In either case, the new method\'s ``im_class``\n attribute is the class from which the retrieval takes place, and\n its ``im_func`` attribute is the original function object.\n\n When a user-defined method object is created by retrieving\n another method object from a class or instance, the behaviour is\n the same as for a function object, except that the ``im_func``\n attribute of the new instance is not the original method object\n but its ``im_func`` attribute.\n\n When a user-defined method object is created by retrieving a\n class method object from a class or instance, its ``im_self``\n attribute is the class itself, and its ``im_func`` attribute is\n the function object underlying the class method.\n\n When an unbound user-defined method object is called, the\n underlying function (``im_func``) is called, with the\n restriction that the first argument must be an instance of the\n proper class (``im_class``) or of a derived class thereof.\n\n When a bound user-defined method object is called, the\n underlying function (``im_func``) is called, inserting the class\n instance (``im_self``) in front of the argument list. For\n instance, when ``C`` is a class which contains a definition for\n a function ``f()``, and ``x`` is an instance of ``C``, calling\n ``x.f(1)`` is equivalent to calling ``C.f(x, 1)``.\n\n When a user-defined method object is derived from a class method\n object, the "class instance" stored in ``im_self`` will actually\n be the class itself, so that calling either ``x.f(1)`` or\n ``C.f(1)`` is equivalent to calling ``f(C,1)`` where ``f`` is\n the underlying function.\n\n Note that the transformation from function object to (unbound or\n bound) method object happens each time the attribute is\n retrieved from the class or instance. In some cases, a fruitful\n optimization is to assign the attribute to a local variable and\n call that local variable. Also notice that this transformation\n only happens for user-defined functions; other callable objects\n (and all non-callable objects) are retrieved without\n transformation. It is also important to note that user-defined\n functions which are attributes of a class instance are not\n converted to bound methods; this *only* happens when the\n function is an attribute of the class.\n\n Generator functions\n A function or method which uses the ``yield`` statement (see\n section *The yield statement*) is called a *generator function*.\n Such a function, when called, always returns an iterator object\n which can be used to execute the body of the function: calling\n the iterator\'s ``next()`` method will cause the function to\n execute until it provides a value using the ``yield`` statement.\n When the function executes a ``return`` statement or falls off\n the end, a ``StopIteration`` exception is raised and the\n iterator will have reached the end of the set of values to be\n returned.\n\n Built-in functions\n A built-in function object is a wrapper around a C function.\n Examples of built-in functions are ``len()`` and ``math.sin()``\n (``math`` is a standard built-in module). The number and type of\n the arguments are determined by the C function. 
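Returning briefly to the generator functions described above, a minimal sketch (the function name is invented; ``next()`` is the Python 2 spelling of the iterator method):

    >>> def gen():
    ...     yield 1
    ...     yield 2
    ...
    >>> it = gen()          # calling a generator function returns an iterator
    >>> it.next()
    1
    >>> it.next()
    2
    >>> it.next()           # falling off the end raises StopIteration
    Traceback (most recent call last):
      ...
    StopIteration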
Special read-\n only attributes: ``__doc__`` is the function\'s documentation\n string, or ``None`` if unavailable; ``__name__`` is the\n function\'s name; ``__self__`` is set to ``None`` (but see the\n next item); ``__module__`` is the name of the module the\n function was defined in or ``None`` if unavailable.\n\n Built-in methods\n This is really a different disguise of a built-in function, this\n time containing an object passed to the C function as an\n implicit extra argument. An example of a built-in method is\n ``alist.append()``, assuming *alist* is a list object. In this\n case, the special read-only attribute ``__self__`` is set to the\n object denoted by *alist*.\n\n Class Types\n Class types, or "new-style classes," are callable. These\n objects normally act as factories for new instances of\n themselves, but variations are possible for class types that\n override ``__new__()``. The arguments of the call are passed to\n ``__new__()`` and, in the typical case, to ``__init__()`` to\n initialize the new instance.\n\n Classic Classes\n Class objects are described below. When a class object is\n called, a new class instance (also described below) is created\n and returned. This implies a call to the class\'s ``__init__()``\n method if it has one. Any arguments are passed on to the\n ``__init__()`` method. If there is no ``__init__()`` method,\n the class must be called without arguments.\n\n Class instances\n Class instances are described below. Class instances are\n callable only when the class has a ``__call__()`` method;\n ``x(arguments)`` is a shorthand for ``x.__call__(arguments)``.\n\nModules\n Modules are imported by the ``import`` statement (see section *The\n import statement*). A module object has a namespace implemented by\n a dictionary object (this is the dictionary referenced by the\n func_globals attribute of functions defined in the module).\n Attribute references are translated to lookups in this dictionary,\n e.g., ``m.x`` is equivalent to ``m.__dict__["x"]``. A module object\n does not contain the code object used to initialize the module\n (since it isn\'t needed once the initialization is done).\n\n Attribute assignment updates the module\'s namespace dictionary,\n e.g., ``m.x = 1`` is equivalent to ``m.__dict__["x"] = 1``.\n\n Special read-only attribute: ``__dict__`` is the module\'s namespace\n as a dictionary object.\n\n **CPython implementation detail:** Because of the way CPython\n clears module dictionaries, the module dictionary will be cleared\n when the module falls out of scope even if the dictionary still has\n live references. To avoid this, copy the dictionary or keep the\n module around while using its dictionary directly.\n\n Predefined (writable) attributes: ``__name__`` is the module\'s\n name; ``__doc__`` is the module\'s documentation string, or ``None``\n if unavailable; ``__file__`` is the pathname of the file from which\n the module was loaded, if it was loaded from a file. The\n ``__file__`` attribute is not present for C modules that are\n statically linked into the interpreter; for extension modules\n loaded dynamically from a shared library, it is the pathname of the\n shared library file.\n\nClasses\n Both class types (new-style classes) and class objects (old-\n style/classic classes) are typically created by class definitions\n (see section *Class definitions*). A class has a namespace\n implemented by a dictionary object. 
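As a side note on the module namespaces described above, a small sketch (the module name ``demo`` is invented here; ``types.ModuleType`` is the standard constructor for module objects):

    >>> import types
    >>> m = types.ModuleType('demo')    # an empty module object, created only for illustration
    >>> m.x = 1                         # attribute assignment updates the namespace dictionary
    >>> m.__dict__['x']
    1
    >>> import math
    >>> math.pi == math.__dict__['pi']  # m.x is equivalent to m.__dict__["x"]
    True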
Class attribute references are\n translated to lookups in this dictionary, e.g., ``C.x`` is\n translated to ``C.__dict__["x"]`` (although for new-style classes\n in particular there are a number of hooks which allow for other\n means of locating attributes). When the attribute name is not found\n there, the attribute search continues in the base classes. For\n old-style classes, the search is depth-first, left-to-right in the\n order of occurrence in the base class list. New-style classes use\n the more complex C3 method resolution order which behaves correctly\n even in the presence of \'diamond\' inheritance structures where\n there are multiple inheritance paths leading back to a common\n ancestor. Additional details on the C3 MRO used by new-style\n classes can be found in the documentation accompanying the 2.3\n release at http://www.python.org/download/releases/2.3/mro/.\n\n When a class attribute reference (for class ``C``, say) would yield\n a user-defined function object or an unbound user-defined method\n object whose associated class is either ``C`` or one of its base\n classes, it is transformed into an unbound user-defined method\n object whose ``im_class`` attribute is ``C``. When it would yield a\n class method object, it is transformed into a bound user-defined\n method object whose ``im_self`` attribute is ``C``. When it would\n yield a static method object, it is transformed into the object\n wrapped by the static method object. See section *Implementing\n Descriptors* for another way in which attributes retrieved from a\n class may differ from those actually contained in its ``__dict__``\n (note that only new-style classes support descriptors).\n\n Class attribute assignments update the class\'s dictionary, never\n the dictionary of a base class.\n\n A class object can be called (see above) to yield a class instance\n (see below).\n\n Special attributes: ``__name__`` is the class name; ``__module__``\n is the module name in which the class was defined; ``__dict__`` is\n the dictionary containing the class\'s namespace; ``__bases__`` is a\n tuple (possibly empty or a singleton) containing the base classes,\n in the order of their occurrence in the base class list;\n ``__doc__`` is the class\'s documentation string, or None if\n undefined.\n\nClass instances\n A class instance is created by calling a class object (see above).\n A class instance has a namespace implemented as a dictionary which\n is the first place in which attribute references are searched.\n When an attribute is not found there, and the instance\'s class has\n an attribute by that name, the search continues with the class\n attributes. If a class attribute is found that is a user-defined\n function object or an unbound user-defined method object whose\n associated class is the class (call it ``C``) of the instance for\n which the attribute reference was initiated or one of its bases, it\n is transformed into a bound user-defined method object whose\n ``im_class`` attribute is ``C`` and whose ``im_self`` attribute is\n the instance. Static method and class method objects are also\n transformed, as if they had been retrieved from class ``C``; see\n above under "Classes". See section *Implementing Descriptors* for\n another way in which attributes of a class retrieved via its\n instances may differ from the objects actually stored in the\n class\'s ``__dict__``. 
If no class attribute is found, and the\n object\'s class has a ``__getattr__()`` method, that is called to\n satisfy the lookup.\n\n Attribute assignments and deletions update the instance\'s\n dictionary, never a class\'s dictionary. If the class has a\n ``__setattr__()`` or ``__delattr__()`` method, this is called\n instead of updating the instance dictionary directly.\n\n Class instances can pretend to be numbers, sequences, or mappings\n if they have methods with certain special names. See section\n *Special method names*.\n\n Special attributes: ``__dict__`` is the attribute dictionary;\n ``__class__`` is the instance\'s class.\n\nFiles\n A file object represents an open file. File objects are created by\n the ``open()`` built-in function, and also by ``os.popen()``,\n ``os.fdopen()``, and the ``makefile()`` method of socket objects\n (and perhaps by other functions or methods provided by extension\n modules). The objects ``sys.stdin``, ``sys.stdout`` and\n ``sys.stderr`` are initialized to file objects corresponding to the\n interpreter\'s standard input, output and error streams. See *File\n Objects* for complete documentation of file objects.\n\nInternal types\n A few types used internally by the interpreter are exposed to the\n user. Their definitions may change with future versions of the\n interpreter, but they are mentioned here for completeness.\n\n Code objects\n Code objects represent *byte-compiled* executable Python code,\n or *bytecode*. The difference between a code object and a\n function object is that the function object contains an explicit\n reference to the function\'s globals (the module in which it was\n defined), while a code object contains no context; also the\n default argument values are stored in the function object, not\n in the code object (because they represent values calculated at\n run-time). 
Unlike function objects, code objects are immutable\n and contain no references (directly or indirectly) to mutable\n objects.\n\n Special read-only attributes: ``co_name`` gives the function\n name; ``co_argcount`` is the number of positional arguments\n (including arguments with default values); ``co_nlocals`` is the\n number of local variables used by the function (including\n arguments); ``co_varnames`` is a tuple containing the names of\n the local variables (starting with the argument names);\n ``co_cellvars`` is a tuple containing the names of local\n variables that are referenced by nested functions;\n ``co_freevars`` is a tuple containing the names of free\n variables; ``co_code`` is a string representing the sequence of\n bytecode instructions; ``co_consts`` is a tuple containing the\n literals used by the bytecode; ``co_names`` is a tuple\n containing the names used by the bytecode; ``co_filename`` is\n the filename from which the code was compiled;\n ``co_firstlineno`` is the first line number of the function;\n ``co_lnotab`` is a string encoding the mapping from bytecode\n offsets to line numbers (for details see the source code of the\n interpreter); ``co_stacksize`` is the required stack size\n (including local variables); ``co_flags`` is an integer encoding\n a number of flags for the interpreter.\n\n The following flag bits are defined for ``co_flags``: bit\n ``0x04`` is set if the function uses the ``*arguments`` syntax\n to accept an arbitrary number of positional arguments; bit\n ``0x08`` is set if the function uses the ``**keywords`` syntax\n to accept arbitrary keyword arguments; bit ``0x20`` is set if\n the function is a generator.\n\n Future feature declarations (``from __future__ import\n division``) also use bits in ``co_flags`` to indicate whether a\n code object was compiled with a particular feature enabled: bit\n ``0x2000`` is set if the function was compiled with future\n division enabled; bits ``0x10`` and ``0x1000`` were used in\n earlier versions of Python.\n\n Other bits in ``co_flags`` are reserved for internal use.\n\n If a code object represents a function, the first item in\n ``co_consts`` is the documentation string of the function, or\n ``None`` if undefined.\n\n Frame objects\n Frame objects represent execution frames. They may occur in\n traceback objects (see below).\n\n Special read-only attributes: ``f_back`` is to the previous\n stack frame (towards the caller), or ``None`` if this is the\n bottom stack frame; ``f_code`` is the code object being executed\n in this frame; ``f_locals`` is the dictionary used to look up\n local variables; ``f_globals`` is used for global variables;\n ``f_builtins`` is used for built-in (intrinsic) names;\n ``f_restricted`` is a flag indicating whether the function is\n executing in restricted execution mode; ``f_lasti`` gives the\n precise instruction (this is an index into the bytecode string\n of the code object).\n\n Special writable attributes: ``f_trace``, if not ``None``, is a\n function called at the start of each source code line (this is\n used by the debugger); ``f_exc_type``, ``f_exc_value``,\n ``f_exc_traceback`` represent the last exception raised in the\n parent frame provided another exception was ever raised in the\n current frame (in all other cases they are None); ``f_lineno``\n is the current line number of the frame --- writing to this from\n within a trace function jumps to the given line (only for the\n bottom-most frame). 
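A short sketch of inspecting the code-object attributes listed above (function names invented; ``func_code`` is the Python 2 spelling of ``__code__``):

    >>> def f(a, b=1):
    ...     c = a + b
    ...     return c
    ...
    >>> f.func_code.co_argcount             # positional arguments, including those with defaults
    2
    >>> f.func_code.co_varnames             # argument names first, then other local variables
    ('a', 'b', 'c')
    >>> def g():
    ...     yield 1
    ...
    >>> bool(g.func_code.co_flags & 0x20)   # bit 0x20 is set for generators
    True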
A debugger can implement a Jump command\n (aka Set Next Statement) by writing to f_lineno.\n\n Traceback objects\n Traceback objects represent a stack trace of an exception. A\n traceback object is created when an exception occurs. When the\n search for an exception handler unwinds the execution stack, at\n each unwound level a traceback object is inserted in front of\n the current traceback. When an exception handler is entered,\n the stack trace is made available to the program. (See section\n *The try statement*.) It is accessible as ``sys.exc_traceback``,\n and also as the third item of the tuple returned by\n ``sys.exc_info()``. The latter is the preferred interface,\n since it works correctly when the program is using multiple\n threads. When the program contains no suitable handler, the\n stack trace is written (nicely formatted) to the standard error\n stream; if the interpreter is interactive, it is also made\n available to the user as ``sys.last_traceback``.\n\n Special read-only attributes: ``tb_next`` is the next level in\n the stack trace (towards the frame where the exception\n occurred), or ``None`` if there is no next level; ``tb_frame``\n points to the execution frame of the current level;\n ``tb_lineno`` gives the line number where the exception\n occurred; ``tb_lasti`` indicates the precise instruction. The\n line number and last instruction in the traceback may differ\n from the line number of its frame object if the exception\n occurred in a ``try`` statement with no matching except clause\n or with a finally clause.\n\n Slice objects\n Slice objects are used to represent slices when *extended slice\n syntax* is used. This is a slice using two colons, or multiple\n slices or ellipses separated by commas, e.g., ``a[i:j:step]``,\n ``a[i:j, k:l]``, or ``a[..., i:j]``. They are also created by\n the built-in ``slice()`` function.\n\n Special read-only attributes: ``start`` is the lower bound;\n ``stop`` is the upper bound; ``step`` is the step value; each is\n ``None`` if omitted. These attributes can have any type.\n\n Slice objects support one method:\n\n slice.indices(self, length)\n\n This method takes a single integer argument *length* and\n computes information about the extended slice that the slice\n object would describe if applied to a sequence of *length*\n items. It returns a tuple of three integers; respectively\n these are the *start* and *stop* indices and the *step* or\n stride length of the slice. Missing or out-of-bounds indices\n are handled in a manner consistent with regular slices.\n\n New in version 2.3.\n\n Static method objects\n Static method objects provide a way of defeating the\n transformation of function objects to method objects described\n above. A static method object is a wrapper around any other\n object, usually a user-defined method object. When a static\n method object is retrieved from a class or a class instance, the\n object actually returned is the wrapped object, which is not\n subject to any further transformation. Static method objects are\n not themselves callable, although the objects they wrap usually\n are. Static method objects are created by the built-in\n ``staticmethod()`` constructor.\n\n Class method objects\n A class method object, like a static method object, is a wrapper\n around another object that alters the way in which that object\n is retrieved from classes and class instances. The behaviour of\n class method objects upon such retrieval is described above,\n under "User-defined methods". 
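Before continuing, a minimal sketch of the slice objects described above (values chosen arbitrarily for this example):

    >>> s = slice(None, None, 2)      # the object behind the extended slice [::2]
    >>> s.start, s.stop, s.step
    (None, None, 2)
    >>> s.indices(5)                  # (start, stop, step) for a sequence of length 5
    (0, 5, 2)
    >>> range(10)[slice(1, 100, 3)]   # out-of-bounds indices are clipped, as for regular slices
    [1, 4, 7]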
Class method objects are created\n by the built-in ``classmethod()`` constructor.\n', - 'typesfunctions': '\nFunctions\n*********\n\nFunction objects are created by function definitions. The only\noperation on a function object is to call it: ``func(argument-list)``.\n\nThere are really two flavors of function objects: built-in functions\nand user-defined functions. Both support the same operation (to call\nthe function), but the implementation is different, hence the\ndifferent object types.\n\nSee *Function definitions* for more information.\n', - 'typesmapping': '\nMapping Types --- ``dict``\n**************************\n\nA *mapping* object maps *hashable* values to arbitrary objects.\nMappings are mutable objects. There is currently only one standard\nmapping type, the *dictionary*. (For other containers see the built\nin ``list``, ``set``, and ``tuple`` classes, and the ``collections``\nmodule.)\n\nA dictionary\'s keys are *almost* arbitrary values. Values that are\nnot *hashable*, that is, values containing lists, dictionaries or\nother mutable types (that are compared by value rather than by object\nidentity) may not be used as keys. Numeric types used for keys obey\nthe normal rules for numeric comparison: if two numbers compare equal\n(such as ``1`` and ``1.0``) then they can be used interchangeably to\nindex the same dictionary entry. (Note however, that since computers\nstore floating-point numbers as approximations it is usually unwise to\nuse them as dictionary keys.)\n\nDictionaries can be created by placing a comma-separated list of\n``key: value`` pairs within braces, for example: ``{\'jack\': 4098,\n\'sjoerd\': 4127}`` or ``{4098: \'jack\', 4127: \'sjoerd\'}``, or by the\n``dict`` constructor.\n\nclass class dict(**kwarg)\nclass class dict(mapping, **kwarg)\nclass class dict(iterable, **kwarg)\n\n Return a new dictionary initialized from an optional positional\n argument and a possibly empty set of keyword arguments.\n\n If no positional argument is given, an empty dictionary is created.\n If a positional argument is given and it is a mapping object, a\n dictionary is created with the same key-value pairs as the mapping\n object. Otherwise, the positional argument must be an *iterable*\n object. Each item in the iterable must itself be an iterable with\n exactly two objects. The first object of each item becomes a key\n in the new dictionary, and the second object the corresponding\n value. If a key occurs more than once, the last value for that key\n becomes the corresponding value in the new dictionary.\n\n If keyword arguments are given, the keyword arguments and their\n values are added to the dictionary created from the positional\n argument. If a key being added is already present, the value from\n the keyword argument replaces the value from the positional\n argument.\n\n To illustrate, the following examples all return a dictionary equal\n to ``{"one": 1, "two": 2, "three": 3}``:\n\n >>> a = dict(one=1, two=2, three=3)\n >>> b = {\'one\': 1, \'two\': 2, \'three\': 3}\n >>> c = dict(zip([\'one\', \'two\', \'three\'], [1, 2, 3]))\n >>> d = dict([(\'two\', 2), (\'one\', 1), (\'three\', 3)])\n >>> e = dict({\'three\': 3, \'one\': 1, \'two\': 2})\n >>> a == b == c == d == e\n True\n\n Providing keyword arguments as in the first example only works for\n keys that are valid Python identifiers. 
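Two further illustrative cases for the ``dict`` constructor rules above (keys and values invented for this example):

    >>> dict([('a', 1), ('a', 2)]) == {'a': 2}            # the last value for a repeated key wins
    True
    >>> dict({'a': 1, 'b': 2}, b=3) == {'a': 1, 'b': 3}   # keyword arguments override the positional argument
    True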
Otherwise, any valid keys\n can be used.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for building a dictionary from\n keyword arguments added.\n\n These are the operations that dictionaries support (and therefore,\n custom mapping types should support too):\n\n len(d)\n\n Return the number of items in the dictionary *d*.\n\n d[key]\n\n Return the item of *d* with key *key*. Raises a ``KeyError`` if\n *key* is not in the map.\n\n New in version 2.5: If a subclass of dict defines a method\n ``__missing__()``, if the key *key* is not present, the\n ``d[key]`` operation calls that method with the key *key* as\n argument. The ``d[key]`` operation then returns or raises\n whatever is returned or raised by the ``__missing__(key)`` call\n if the key is not present. No other operations or methods invoke\n ``__missing__()``. If ``__missing__()`` is not defined,\n ``KeyError`` is raised. ``__missing__()`` must be a method; it\n cannot be an instance variable. For an example, see\n ``collections.defaultdict``.\n\n d[key] = value\n\n Set ``d[key]`` to *value*.\n\n del d[key]\n\n Remove ``d[key]`` from *d*. Raises a ``KeyError`` if *key* is\n not in the map.\n\n key in d\n\n Return ``True`` if *d* has a key *key*, else ``False``.\n\n New in version 2.2.\n\n key not in d\n\n Equivalent to ``not key in d``.\n\n New in version 2.2.\n\n iter(d)\n\n Return an iterator over the keys of the dictionary. This is a\n shortcut for ``iterkeys()``.\n\n clear()\n\n Remove all items from the dictionary.\n\n copy()\n\n Return a shallow copy of the dictionary.\n\n fromkeys(seq[, value])\n\n Create a new dictionary with keys from *seq* and values set to\n *value*.\n\n ``fromkeys()`` is a class method that returns a new dictionary.\n *value* defaults to ``None``.\n\n New in version 2.3.\n\n get(key[, default])\n\n Return the value for *key* if *key* is in the dictionary, else\n *default*. If *default* is not given, it defaults to ``None``,\n so that this method never raises a ``KeyError``.\n\n has_key(key)\n\n Test for the presence of *key* in the dictionary. ``has_key()``\n is deprecated in favor of ``key in d``.\n\n items()\n\n Return a copy of the dictionary\'s list of ``(key, value)``\n pairs.\n\n **CPython implementation detail:** Keys and values are listed in\n an arbitrary order which is non-random, varies across Python\n implementations, and depends on the dictionary\'s history of\n insertions and deletions.\n\n If ``items()``, ``keys()``, ``values()``, ``iteritems()``,\n ``iterkeys()``, and ``itervalues()`` are called with no\n intervening modifications to the dictionary, the lists will\n directly correspond. This allows the creation of ``(value,\n key)`` pairs using ``zip()``: ``pairs = zip(d.values(),\n d.keys())``. The same relationship holds for the ``iterkeys()``\n and ``itervalues()`` methods: ``pairs = zip(d.itervalues(),\n d.iterkeys())`` provides the same value for ``pairs``. Another\n way to create the same list is ``pairs = [(v, k) for (k, v) in\n d.iteritems()]``.\n\n iteritems()\n\n Return an iterator over the dictionary\'s ``(key, value)`` pairs.\n See the note for ``dict.items()``.\n\n Using ``iteritems()`` while adding or deleting entries in the\n dictionary may raise a ``RuntimeError`` or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n iterkeys()\n\n Return an iterator over the dictionary\'s keys. 
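A minimal sketch of the ``__missing__()`` hook described above (the subclass ``Tally`` is invented for this example):

    >>> class Tally(dict):
    ...     def __missing__(self, key):   # called by d[key] when the key is absent
    ...         return 0
    ...
    >>> t = Tally()
    >>> t['spam']                         # no KeyError; __missing__ supplies the value
    0
    >>> t['spam'] = t['spam'] + 1
    >>> t['spam']
    1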
See the note for\n ``dict.items()``.\n\n Using ``iterkeys()`` while adding or deleting entries in the\n dictionary may raise a ``RuntimeError`` or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n itervalues()\n\n Return an iterator over the dictionary\'s values. See the note\n for ``dict.items()``.\n\n Using ``itervalues()`` while adding or deleting entries in the\n dictionary may raise a ``RuntimeError`` or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n keys()\n\n Return a copy of the dictionary\'s list of keys. See the note\n for ``dict.items()``.\n\n pop(key[, default])\n\n If *key* is in the dictionary, remove it and return its value,\n else return *default*. If *default* is not given and *key* is\n not in the dictionary, a ``KeyError`` is raised.\n\n New in version 2.3.\n\n popitem()\n\n Remove and return an arbitrary ``(key, value)`` pair from the\n dictionary.\n\n ``popitem()`` is useful to destructively iterate over a\n dictionary, as often used in set algorithms. If the dictionary\n is empty, calling ``popitem()`` raises a ``KeyError``.\n\n setdefault(key[, default])\n\n If *key* is in the dictionary, return its value. If not, insert\n *key* with a value of *default* and return *default*. *default*\n defaults to ``None``.\n\n update([other])\n\n Update the dictionary with the key/value pairs from *other*,\n overwriting existing keys. Return ``None``.\n\n ``update()`` accepts either another dictionary object or an\n iterable of key/value pairs (as tuples or other iterables of\n length two). If keyword arguments are specified, the dictionary\n is then updated with those key/value pairs: ``d.update(red=1,\n blue=2)``.\n\n Changed in version 2.4: Allowed the argument to be an iterable\n of key/value pairs and allowed keyword arguments.\n\n values()\n\n Return a copy of the dictionary\'s list of values. See the note\n for ``dict.items()``.\n\n viewitems()\n\n Return a new view of the dictionary\'s items (``(key, value)``\n pairs). See below for documentation of view objects.\n\n New in version 2.7.\n\n viewkeys()\n\n Return a new view of the dictionary\'s keys. See below for\n documentation of view objects.\n\n New in version 2.7.\n\n viewvalues()\n\n Return a new view of the dictionary\'s values. See below for\n documentation of view objects.\n\n New in version 2.7.\n\n\nDictionary view objects\n=======================\n\nThe objects returned by ``dict.viewkeys()``, ``dict.viewvalues()`` and\n``dict.viewitems()`` are *view objects*. They provide a dynamic view\non the dictionary\'s entries, which means that when the dictionary\nchanges, the view reflects these changes.\n\nDictionary views can be iterated over to yield their respective data,\nand support membership tests:\n\nlen(dictview)\n\n Return the number of entries in the dictionary.\n\niter(dictview)\n\n Return an iterator over the keys, values or items (represented as\n tuples of ``(key, value)``) in the dictionary.\n\n Keys and values are iterated over in an arbitrary order which is\n non-random, varies across Python implementations, and depends on\n the dictionary\'s history of insertions and deletions. If keys,\n values and items views are iterated over with no intervening\n modifications to the dictionary, the order of items will directly\n correspond. This allows the creation of ``(value, key)`` pairs\n using ``zip()``: ``pairs = zip(d.values(), d.keys())``. 
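A short sketch of ``setdefault()``, ``update()`` and ``pop()`` as described above (dictionary contents invented for this example):

    >>> d = {'eggs': 2}
    >>> d.setdefault('spam', 0)     # key absent: insert the default and return it
    0
    >>> d.setdefault('eggs', 99)    # key present: return the existing value unchanged
    2
    >>> d.update(bacon=1)           # update() also accepts keyword arguments
    >>> d.pop('eggs')               # remove the key and return its value
    2
    >>> sorted(d.keys())
    ['bacon', 'spam']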
Another\n way to create the same list is ``pairs = [(v, k) for (k, v) in\n d.items()]``.\n\n Iterating views while adding or deleting entries in the dictionary\n may raise a ``RuntimeError`` or fail to iterate over all entries.\n\nx in dictview\n\n Return ``True`` if *x* is in the underlying dictionary\'s keys,\n values or items (in the latter case, *x* should be a ``(key,\n value)`` tuple).\n\nKeys views are set-like since their entries are unique and hashable.\nIf all values are hashable, so that (key, value) pairs are unique and\nhashable, then the items view is also set-like. (Values views are not\ntreated as set-like since the entries are generally not unique.) Then\nthese set operations are available ("other" refers either to another\nview or a set):\n\ndictview & other\n\n Return the intersection of the dictview and the other object as a\n new set.\n\ndictview | other\n\n Return the union of the dictview and the other object as a new set.\n\ndictview - other\n\n Return the difference between the dictview and the other object\n (all elements in *dictview* that aren\'t in *other*) as a new set.\n\ndictview ^ other\n\n Return the symmetric difference (all elements either in *dictview*\n or *other*, but not in both) of the dictview and the other object\n as a new set.\n\nAn example of dictionary view usage:\n\n >>> dishes = {\'eggs\': 2, \'sausage\': 1, \'bacon\': 1, \'spam\': 500}\n >>> keys = dishes.viewkeys()\n >>> values = dishes.viewvalues()\n\n >>> # iteration\n >>> n = 0\n >>> for val in values:\n ... n += val\n >>> print(n)\n 504\n\n >>> # keys and values are iterated over in the same order\n >>> list(keys)\n [\'eggs\', \'bacon\', \'sausage\', \'spam\']\n >>> list(values)\n [2, 1, 1, 500]\n\n >>> # view objects are dynamic and reflect dict changes\n >>> del dishes[\'eggs\']\n >>> del dishes[\'sausage\']\n >>> list(keys)\n [\'spam\', \'bacon\']\n\n >>> # set operations\n >>> keys & {\'eggs\', \'bacon\', \'salad\'}\n {\'bacon\'}\n', - 'typesmethods': '\nMethods\n*******\n\nMethods are functions that are called using the attribute notation.\nThere are two flavors: built-in methods (such as ``append()`` on\nlists) and class instance methods. Built-in methods are described\nwith the types that support them.\n\nThe implementation adds two special read-only attributes to class\ninstance methods: ``m.im_self`` is the object on which the method\noperates, and ``m.im_func`` is the function implementing the method.\nCalling ``m(arg-1, arg-2, ..., arg-n)`` is completely equivalent to\ncalling ``m.im_func(m.im_self, arg-1, arg-2, ..., arg-n)``.\n\nClass instance methods are either *bound* or *unbound*, referring to\nwhether the method was accessed through an instance or a class,\nrespectively. When a method is unbound, its ``im_self`` attribute\nwill be ``None`` and if called, an explicit ``self`` object must be\npassed as the first argument. In this case, ``self`` must be an\ninstance of the unbound method\'s class (or a subclass of that class),\notherwise a ``TypeError`` is raised.\n\nLike function objects, methods objects support getting arbitrary\nattributes. However, since method attributes are actually stored on\nthe underlying function object (``meth.im_func``), setting method\nattributes on either bound or unbound methods is disallowed.\nAttempting to set an attribute on a method results in an\n``AttributeError`` being raised. In order to set a method attribute,\nyou need to explicitly set it on the underlying function object:\n\n >>> class C:\n ... def method(self):\n ... 
pass\n ...\n >>> c = C()\n >>> c.method.whoami = \'my name is method\' # can\'t set on the method\n Traceback (most recent call last):\n File "", line 1, in \n AttributeError: \'instancemethod\' object has no attribute \'whoami\'\n >>> c.method.im_func.whoami = \'my name is method\'\n >>> c.method.whoami\n \'my name is method\'\n\nSee *The standard type hierarchy* for more information.\n', - 'typesmodules': "\nModules\n*******\n\nThe only special operation on a module is attribute access:\n``m.name``, where *m* is a module and *name* accesses a name defined\nin *m*'s symbol table. Module attributes can be assigned to. (Note\nthat the ``import`` statement is not, strictly speaking, an operation\non a module object; ``import foo`` does not require a module object\nnamed *foo* to exist, rather it requires an (external) *definition*\nfor a module named *foo* somewhere.)\n\nA special attribute of every module is ``__dict__``. This is the\ndictionary containing the module's symbol table. Modifying this\ndictionary will actually change the module's symbol table, but direct\nassignment to the ``__dict__`` attribute is not possible (you can\nwrite ``m.__dict__['a'] = 1``, which defines ``m.a`` to be ``1``, but\nyou can't write ``m.__dict__ = {}``). Modifying ``__dict__`` directly\nis not recommended.\n\nModules built into the interpreter are written like this: ````. If loaded from a file, they are written as\n````.\n", - 'typesseq': '\nSequence Types --- ``str``, ``unicode``, ``list``, ``tuple``, ``bytearray``, ``buffer``, ``xrange``\n***************************************************************************************************\n\nThere are seven sequence types: strings, Unicode strings, lists,\ntuples, bytearrays, buffers, and xrange objects.\n\nFor other containers see the built in ``dict`` and ``set`` classes,\nand the ``collections`` module.\n\nString literals are written in single or double quotes: ``\'xyzzy\'``,\n``"frobozz"``. See *String literals* for more about string literals.\nUnicode strings are much like strings, but are specified in the syntax\nusing a preceding ``\'u\'`` character: ``u\'abc\'``, ``u"def"``. In\naddition to the functionality described here, there are also string-\nspecific methods described in the *String Methods* section. Lists are\nconstructed with square brackets, separating items with commas: ``[a,\nb, c]``. Tuples are constructed by the comma operator (not within\nsquare brackets), with or without enclosing parentheses, but an empty\ntuple must have the enclosing parentheses, such as ``a, b, c`` or\n``()``. A single item tuple must have a trailing comma, such as\n``(d,)``.\n\nBytearray objects are created with the built-in function\n``bytearray()``.\n\nBuffer objects are not directly supported by Python syntax, but can be\ncreated by calling the built-in function ``buffer()``. They don\'t\nsupport concatenation or repetition.\n\nObjects of type xrange are similar to buffers in that there is no\nspecific syntax to create them, but they are created using the\n``xrange()`` function. They don\'t support slicing, concatenation or\nrepetition, and using ``in``, ``not in``, ``min()`` or ``max()`` on\nthem is inefficient.\n\nMost sequence types support the following operations. The ``in`` and\n``not in`` operations have the same priorities as the comparison\noperations. The ``+`` and ``*`` operations have the same priority as\nthe corresponding numeric operations. 
[3] Additional methods are\nprovided for *Mutable Sequence Types*.\n\nThis table lists the sequence operations sorted in ascending priority\n(operations in the same box have the same priority). In the table,\n*s* and *t* are sequences of the same type; *n*, *i* and *j* are\nintegers:\n\n+--------------------+----------------------------------+------------+\n| Operation | Result | Notes |\n+====================+==================================+============+\n| ``x in s`` | ``True`` if an item of *s* is | (1) |\n| | equal to *x*, else ``False`` | |\n+--------------------+----------------------------------+------------+\n| ``x not in s`` | ``False`` if an item of *s* is | (1) |\n| | equal to *x*, else ``True`` | |\n+--------------------+----------------------------------+------------+\n| ``s + t`` | the concatenation of *s* and *t* | (6) |\n+--------------------+----------------------------------+------------+\n| ``s * n, n * s`` | *n* shallow copies of *s* | (2) |\n| | concatenated | |\n+--------------------+----------------------------------+------------+\n| ``s[i]`` | *i*th item of *s*, origin 0 | (3) |\n+--------------------+----------------------------------+------------+\n| ``s[i:j]`` | slice of *s* from *i* to *j* | (3)(4) |\n+--------------------+----------------------------------+------------+\n| ``s[i:j:k]`` | slice of *s* from *i* to *j* | (3)(5) |\n| | with step *k* | |\n+--------------------+----------------------------------+------------+\n| ``len(s)`` | length of *s* | |\n+--------------------+----------------------------------+------------+\n| ``min(s)`` | smallest item of *s* | |\n+--------------------+----------------------------------+------------+\n| ``max(s)`` | largest item of *s* | |\n+--------------------+----------------------------------+------------+\n| ``s.index(x)`` | index of the first occurrence of | |\n| | *x* in *s* | |\n+--------------------+----------------------------------+------------+\n| ``s.count(x)`` | total number of occurrences of | |\n| | *x* in *s* | |\n+--------------------+----------------------------------+------------+\n\nSequence types also support comparisons. In particular, tuples and\nlists are compared lexicographically by comparing corresponding\nelements. This means that to compare equal, every element must compare\nequal and the two sequences must be of the same type and have the same\nlength. (For full details see *Comparisons* in the language\nreference.)\n\nNotes:\n\n1. When *s* is a string or Unicode string object the ``in`` and ``not\n in`` operations act like a substring test. In Python versions\n before 2.3, *x* had to be a string of length 1. In Python 2.3 and\n beyond, *x* may be a string of any length.\n\n2. Values of *n* less than ``0`` are treated as ``0`` (which yields an\n empty sequence of the same type as *s*). Note also that the copies\n are shallow; nested structures are not copied. This often haunts\n new Python programmers; consider:\n\n >>> lists = [[]] * 3\n >>> lists\n [[], [], []]\n >>> lists[0].append(3)\n >>> lists\n [[3], [3], [3]]\n\n What has happened is that ``[[]]`` is a one-element list containing\n an empty list, so all three elements of ``[[]] * 3`` are (pointers\n to) this single empty list. Modifying any of the elements of\n ``lists`` modifies this single list. You can create a list of\n different lists this way:\n\n >>> lists = [[] for i in range(3)]\n >>> lists[0].append(3)\n >>> lists[1].append(5)\n >>> lists[2].append(7)\n >>> lists\n [[3], [5], [7]]\n\n3. 
If *i* or *j* is negative, the index is relative to the end of the\n string: ``len(s) + i`` or ``len(s) + j`` is substituted. But note\n that ``-0`` is still ``0``.\n\n4. The slice of *s* from *i* to *j* is defined as the sequence of\n items with index *k* such that ``i <= k < j``. If *i* or *j* is\n greater than ``len(s)``, use ``len(s)``. If *i* is omitted or\n ``None``, use ``0``. If *j* is omitted or ``None``, use\n ``len(s)``. If *i* is greater than or equal to *j*, the slice is\n empty.\n\n5. The slice of *s* from *i* to *j* with step *k* is defined as the\n sequence of items with index ``x = i + n*k`` such that ``0 <= n <\n (j-i)/k``. In other words, the indices are ``i``, ``i+k``,\n ``i+2*k``, ``i+3*k`` and so on, stopping when *j* is reached (but\n never including *j*). If *i* or *j* is greater than ``len(s)``,\n use ``len(s)``. If *i* or *j* are omitted or ``None``, they become\n "end" values (which end depends on the sign of *k*). Note, *k*\n cannot be zero. If *k* is ``None``, it is treated like ``1``.\n\n6. **CPython implementation detail:** If *s* and *t* are both strings,\n some Python implementations such as CPython can usually perform an\n in-place optimization for assignments of the form ``s = s + t`` or\n ``s += t``. When applicable, this optimization makes quadratic\n run-time much less likely. This optimization is both version and\n implementation dependent. For performance sensitive code, it is\n preferable to use the ``str.join()`` method which assures\n consistent linear concatenation performance across versions and\n implementations.\n\n Changed in version 2.4: Formerly, string concatenation never\n occurred in-place.\n\n\nString Methods\n==============\n\nBelow are listed the string methods which both 8-bit strings and\nUnicode objects support. Some of them are also available on\n``bytearray`` objects.\n\nIn addition, Python\'s strings support the sequence type methods\ndescribed in the *Sequence Types --- str, unicode, list, tuple,\nbytearray, buffer, xrange* section. To output formatted strings use\ntemplate strings or the ``%`` operator described in the *String\nFormatting Operations* section. Also, see the ``re`` module for string\nfunctions based on regular expressions.\n\nstr.capitalize()\n\n Return a copy of the string with its first character capitalized\n and the rest lowercased.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.center(width[, fillchar])\n\n Return centered in a string of length *width*. Padding is done\n using the specified *fillchar* (default is a space).\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.count(sub[, start[, end]])\n\n Return the number of non-overlapping occurrences of substring *sub*\n in the range [*start*, *end*]. Optional arguments *start* and\n *end* are interpreted as in slice notation.\n\nstr.decode([encoding[, errors]])\n\n Decodes the string using the codec registered for *encoding*.\n *encoding* defaults to the default string encoding. *errors* may\n be given to set a different error handling scheme. 
The default is\n ``\'strict\'``, meaning that encoding errors raise ``UnicodeError``.\n Other possible values are ``\'ignore\'``, ``\'replace\'`` and any other\n name registered via ``codecs.register_error()``, see section *Codec\n Base Classes*.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for other error handling schemes\n added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.encode([encoding[, errors]])\n\n Return an encoded version of the string. Default encoding is the\n current default string encoding. *errors* may be given to set a\n different error handling scheme. The default for *errors* is\n ``\'strict\'``, meaning that encoding errors raise a\n ``UnicodeError``. Other possible values are ``\'ignore\'``,\n ``\'replace\'``, ``\'xmlcharrefreplace\'``, ``\'backslashreplace\'`` and\n any other name registered via ``codecs.register_error()``, see\n section *Codec Base Classes*. For a list of possible encodings, see\n section *Standard Encodings*.\n\n New in version 2.0.\n\n Changed in version 2.3: Support for ``\'xmlcharrefreplace\'`` and\n ``\'backslashreplace\'`` and other error handling schemes added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.endswith(suffix[, start[, end]])\n\n Return ``True`` if the string ends with the specified *suffix*,\n otherwise return ``False``. *suffix* can also be a tuple of\n suffixes to look for. With optional *start*, test beginning at\n that position. With optional *end*, stop comparing at that\n position.\n\n Changed in version 2.5: Accept tuples as *suffix*.\n\nstr.expandtabs([tabsize])\n\n Return a copy of the string where all tab characters are replaced\n by one or more spaces, depending on the current column and the\n given tab size. Tab positions occur every *tabsize* characters\n (default is 8, giving tab positions at columns 0, 8, 16 and so on).\n To expand the string, the current column is set to zero and the\n string is examined character by character. If the character is a\n tab (``\\t``), one or more space characters are inserted in the\n result until the current column is equal to the next tab position.\n (The tab character itself is not copied.) If the character is a\n newline (``\\n``) or return (``\\r``), it is copied and the current\n column is reset to zero. Any other character is copied unchanged\n and the current column is incremented by one regardless of how the\n character is represented when printed.\n\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs()\n \'01 012 0123 01234\'\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs(4)\n \'01 012 0123 01234\'\n\nstr.find(sub[, start[, end]])\n\n Return the lowest index in the string where substring *sub* is\n found, such that *sub* is contained in the slice ``s[start:end]``.\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return ``-1`` if *sub* is not found.\n\n Note: The ``find()`` method should be used only if you need to know the\n position of *sub*. To check if *sub* is a substring or not, use\n the ``in`` operator:\n\n >>> \'Py\' in \'Python\'\n True\n\nstr.format(*args, **kwargs)\n\n Perform a string formatting operation. The string on which this\n method is called can contain literal text or replacement fields\n delimited by braces ``{}``. Each replacement field contains either\n the numeric index of a positional argument, or the name of a\n keyword argument. 
Returns a copy of the string where each\n replacement field is replaced with the string value of the\n corresponding argument.\n\n >>> "The sum of 1 + 2 is {0}".format(1+2)\n \'The sum of 1 + 2 is 3\'\n\n See *Format String Syntax* for a description of the various\n formatting options that can be specified in format strings.\n\n This method of string formatting is the new standard in Python 3,\n and should be preferred to the ``%`` formatting described in\n *String Formatting Operations* in new code.\n\n New in version 2.6.\n\nstr.index(sub[, start[, end]])\n\n Like ``find()``, but raise ``ValueError`` when the substring is not\n found.\n\nstr.isalnum()\n\n Return true if all characters in the string are alphanumeric and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isalpha()\n\n Return true if all characters in the string are alphabetic and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isdigit()\n\n Return true if all characters in the string are digits and there is\n at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.islower()\n\n Return true if all cased characters [4] in the string are lowercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isspace()\n\n Return true if there are only whitespace characters in the string\n and there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.istitle()\n\n Return true if the string is a titlecased string and there is at\n least one character, for example uppercase characters may only\n follow uncased characters and lowercase characters only cased ones.\n Return false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isupper()\n\n Return true if all cased characters [4] in the string are uppercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.join(iterable)\n\n Return a string which is the concatenation of the strings in the\n *iterable* *iterable*. The separator between elements is the\n string providing this method.\n\nstr.ljust(width[, fillchar])\n\n Return the string left justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to ``len(s)``.\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.lower()\n\n Return a copy of the string with all the cased characters [4]\n converted to lowercase.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.lstrip([chars])\n\n Return a copy of the string with leading characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or ``None``, the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a prefix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.lstrip()\n \'spacious \'\n >>> \'www.example.com\'.lstrip(\'cmowz.\')\n \'example.com\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.partition(sep)\n\n Split the string at the first occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. 
If the separator is not\n found, return a 3-tuple containing the string itself, followed by\n two empty strings.\n\n New in version 2.5.\n\nstr.replace(old, new[, count])\n\n Return a copy of the string with all occurrences of substring *old*\n replaced by *new*. If the optional argument *count* is given, only\n the first *count* occurrences are replaced.\n\nstr.rfind(sub[, start[, end]])\n\n Return the highest index in the string where substring *sub* is\n found, such that *sub* is contained within ``s[start:end]``.\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return ``-1`` on failure.\n\nstr.rindex(sub[, start[, end]])\n\n Like ``rfind()`` but raises ``ValueError`` when the substring *sub*\n is not found.\n\nstr.rjust(width[, fillchar])\n\n Return the string right justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to ``len(s)``.\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.rpartition(sep)\n\n Split the string at the last occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing two empty strings, followed by\n the string itself.\n\n New in version 2.5.\n\nstr.rsplit([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit* splits\n are done, the *rightmost* ones. If *sep* is not specified or\n ``None``, any whitespace string is a separator. Except for\n splitting from the right, ``rsplit()`` behaves like ``split()``\n which is described in detail below.\n\n New in version 2.4.\n\nstr.rstrip([chars])\n\n Return a copy of the string with trailing characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or ``None``, the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a suffix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.rstrip()\n \' spacious\'\n >>> \'mississippi\'.rstrip(\'ipz\')\n \'mississ\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.split([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit*\n splits are done (thus, the list will have at most ``maxsplit+1``\n elements). If *maxsplit* is not specified or ``-1``, then there is\n no limit on the number of splits (all possible splits are made).\n\n If *sep* is given, consecutive delimiters are not grouped together\n and are deemed to delimit empty strings (for example,\n ``\'1,,2\'.split(\',\')`` returns ``[\'1\', \'\', \'2\']``). The *sep*\n argument may consist of multiple characters (for example,\n ``\'1<>2<>3\'.split(\'<>\')`` returns ``[\'1\', \'2\', \'3\']``). Splitting\n an empty string with a specified separator returns ``[\'\']``.\n\n If *sep* is not specified or is ``None``, a different splitting\n algorithm is applied: runs of consecutive whitespace are regarded\n as a single separator, and the result will contain no empty strings\n at the start or end if the string has leading or trailing\n whitespace. 
Consequently, splitting an empty string or a string\n consisting of just whitespace with a ``None`` separator returns\n ``[]``.\n\n For example, ``\' 1 2 3 \'.split()`` returns ``[\'1\', \'2\', \'3\']``,\n and ``\' 1 2 3 \'.split(None, 1)`` returns ``[\'1\', \'2 3 \']``.\n\nstr.splitlines([keepends])\n\n Return a list of the lines in the string, breaking at line\n boundaries. This method uses the *universal newlines* approach to\n splitting lines. Line breaks are not included in the resulting list\n unless *keepends* is given and true.\n\n For example, ``\'ab c\\n\\nde fg\\rkl\\r\\n\'.splitlines()`` returns\n ``[\'ab c\', \'\', \'de fg\', \'kl\']``, while the same call with\n ``splitlines(True)`` returns ``[\'ab c\\n\', \'\\n\', \'de fg\\r\',\n \'kl\\r\\n\']``.\n\n Unlike ``split()`` when a delimiter string *sep* is given, this\n method returns an empty list for the empty string, and a terminal\n line break does not result in an extra line.\n\nstr.startswith(prefix[, start[, end]])\n\n Return ``True`` if string starts with the *prefix*, otherwise\n return ``False``. *prefix* can also be a tuple of prefixes to look\n for. With optional *start*, test string beginning at that\n position. With optional *end*, stop comparing string at that\n position.\n\n Changed in version 2.5: Accept tuples as *prefix*.\n\nstr.strip([chars])\n\n Return a copy of the string with the leading and trailing\n characters removed. The *chars* argument is a string specifying the\n set of characters to be removed. If omitted or ``None``, the\n *chars* argument defaults to removing whitespace. The *chars*\n argument is not a prefix or suffix; rather, all combinations of its\n values are stripped:\n\n >>> \' spacious \'.strip()\n \'spacious\'\n >>> \'www.example.com\'.strip(\'cmowz.\')\n \'example\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.swapcase()\n\n Return a copy of the string with uppercase characters converted to\n lowercase and vice versa.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.title()\n\n Return a titlecased version of the string where words start with an\n uppercase character and the remaining characters are lowercase.\n\n The algorithm uses a simple language-independent definition of a\n word as groups of consecutive letters. The definition works in\n many contexts but it means that apostrophes in contractions and\n possessives form word boundaries, which may not be the desired\n result:\n\n >>> "they\'re bill\'s friends from the UK".title()\n "They\'Re Bill\'S Friends From The Uk"\n\n A workaround for apostrophes can be constructed using regular\n expressions:\n\n >>> import re\n >>> def titlecase(s):\n ... return re.sub(r"[A-Za-z]+(\'[A-Za-z]+)?",\n ... lambda mo: mo.group(0)[0].upper() +\n ... mo.group(0)[1:].lower(),\n ... s)\n ...\n >>> titlecase("they\'re bill\'s friends.")\n "They\'re Bill\'s Friends."\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.translate(table[, deletechars])\n\n Return a copy of the string where all characters occurring in the\n optional argument *deletechars* are removed, and the remaining\n characters have been mapped through the given translation table,\n which must be a string of length 256.\n\n You can use the ``maketrans()`` helper function in the ``string``\n module to create a translation table. 
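For example, a table built with ``string.maketrans()`` maps each character of one string onto the character at the same position in another (a minimal sketch with arbitrary sample characters):

   >>> from string import maketrans
   >>> 'abracadabra'.translate(maketrans('ab', 'xy'))
   'xyrxcxdxyrx'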
For string objects, set the\n *table* argument to ``None`` for translations that only delete\n characters:\n\n >>> \'read this short text\'.translate(None, \'aeiou\')\n \'rd ths shrt txt\'\n\n New in version 2.6: Support for a ``None`` *table* argument.\n\n For Unicode objects, the ``translate()`` method does not accept the\n optional *deletechars* argument. Instead, it returns a copy of the\n *s* where all characters have been mapped through the given\n translation table which must be a mapping of Unicode ordinals to\n Unicode ordinals, Unicode strings or ``None``. Unmapped characters\n are left untouched. Characters mapped to ``None`` are deleted.\n Note, a more flexible approach is to create a custom character\n mapping codec using the ``codecs`` module (see ``encodings.cp1251``\n for an example).\n\nstr.upper()\n\n Return a copy of the string with all the cased characters [4]\n converted to uppercase. Note that ``str.upper().isupper()`` might\n be ``False`` if ``s`` contains uncased characters or if the Unicode\n category of the resulting character(s) is not "Lu" (Letter,\n uppercase), but e.g. "Lt" (Letter, titlecase).\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.zfill(width)\n\n Return the numeric string left filled with zeros in a string of\n length *width*. A sign prefix is handled correctly. The original\n string is returned if *width* is less than or equal to ``len(s)``.\n\n New in version 2.2.2.\n\nThe following methods are present only on unicode objects:\n\nunicode.isnumeric()\n\n Return ``True`` if there are only numeric characters in S,\n ``False`` otherwise. Numeric characters include digit characters,\n and all characters that have the Unicode numeric value property,\n e.g. U+2155, VULGAR FRACTION ONE FIFTH.\n\nunicode.isdecimal()\n\n Return ``True`` if there are only decimal characters in S,\n ``False`` otherwise. Decimal characters include digit characters,\n and all characters that can be used to form decimal-radix numbers,\n e.g. U+0660, ARABIC-INDIC DIGIT ZERO.\n\n\nString Formatting Operations\n============================\n\nString and Unicode objects have one unique built-in operation: the\n``%`` operator (modulo). This is also known as the string\n*formatting* or *interpolation* operator. Given ``format % values``\n(where *format* is a string or Unicode object), ``%`` conversion\nspecifications in *format* are replaced with zero or more elements of\n*values*. The effect is similar to the using ``sprintf()`` in the C\nlanguage. If *format* is a Unicode object, or if any of the objects\nbeing converted using the ``%s`` conversion are Unicode objects, the\nresult will also be a Unicode object.\n\nIf *format* requires a single argument, *values* may be a single non-\ntuple object. [5] Otherwise, *values* must be a tuple with exactly\nthe number of items specified by the format string, or a single\nmapping object (for example, a dictionary).\n\nA conversion specifier contains two or more characters and has the\nfollowing components, which must occur in this order:\n\n1. The ``\'%\'`` character, which marks the start of the specifier.\n\n2. Mapping key (optional), consisting of a parenthesised sequence of\n characters (for example, ``(somename)``).\n\n3. Conversion flags (optional), which affect the result of some\n conversion types.\n\n4. Minimum field width (optional). 
If specified as an ``\'*\'``\n (asterisk), the actual width is read from the next element of the\n tuple in *values*, and the object to convert comes after the\n minimum field width and optional precision.\n\n5. Precision (optional), given as a ``\'.\'`` (dot) followed by the\n precision. If specified as ``\'*\'`` (an asterisk), the actual width\n is read from the next element of the tuple in *values*, and the\n value to convert comes after the precision.\n\n6. Length modifier (optional).\n\n7. Conversion type.\n\nWhen the right argument is a dictionary (or other mapping type), then\nthe formats in the string *must* include a parenthesised mapping key\ninto that dictionary inserted immediately after the ``\'%\'`` character.\nThe mapping key selects the value to be formatted from the mapping.\nFor example:\n\n>>> print \'%(language)s has %(number)03d quote types.\' % \\\n... {"language": "Python", "number": 2}\nPython has 002 quote types.\n\nIn this case no ``*`` specifiers may occur in a format (since they\nrequire a sequential parameter list).\n\nThe conversion flag characters are:\n\n+-----------+-----------------------------------------------------------------------+\n| Flag | Meaning |\n+===========+=======================================================================+\n| ``\'#\'`` | The value conversion will use the "alternate form" (where defined |\n| | below). |\n+-----------+-----------------------------------------------------------------------+\n| ``\'0\'`` | The conversion will be zero padded for numeric values. |\n+-----------+-----------------------------------------------------------------------+\n| ``\'-\'`` | The converted value is left adjusted (overrides the ``\'0\'`` |\n| | conversion if both are given). |\n+-----------+-----------------------------------------------------------------------+\n| ``\' \'`` | (a space) A blank should be left before a positive number (or empty |\n| | string) produced by a signed conversion. |\n+-----------+-----------------------------------------------------------------------+\n| ``\'+\'`` | A sign character (``\'+\'`` or ``\'-\'``) will precede the conversion |\n| | (overrides a "space" flag). |\n+-----------+-----------------------------------------------------------------------+\n\nA length modifier (``h``, ``l``, or ``L``) may be present, but is\nignored as it is not necessary for Python -- so e.g. ``%ld`` is\nidentical to ``%d``.\n\nThe conversion types are:\n\n+--------------+-------------------------------------------------------+---------+\n| Conversion | Meaning | Notes |\n+==============+=======================================================+=========+\n| ``\'d\'`` | Signed integer decimal. | |\n+--------------+-------------------------------------------------------+---------+\n| ``\'i\'`` | Signed integer decimal. | |\n+--------------+-------------------------------------------------------+---------+\n| ``\'o\'`` | Signed octal value. | (1) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'u\'`` | Obsolete type -- it is identical to ``\'d\'``. | (7) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'x\'`` | Signed hexadecimal (lowercase). | (2) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'X\'`` | Signed hexadecimal (uppercase). | (2) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'e\'`` | Floating point exponential format (lowercase). 
| (3) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'E\'`` | Floating point exponential format (uppercase). | (3) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'f\'`` | Floating point decimal format. | (3) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'F\'`` | Floating point decimal format. | (3) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'g\'`` | Floating point format. Uses lowercase exponential | (4) |\n| | format if exponent is less than -4 or not less than | |\n| | precision, decimal format otherwise. | |\n+--------------+-------------------------------------------------------+---------+\n| ``\'G\'`` | Floating point format. Uses uppercase exponential | (4) |\n| | format if exponent is less than -4 or not less than | |\n| | precision, decimal format otherwise. | |\n+--------------+-------------------------------------------------------+---------+\n| ``\'c\'`` | Single character (accepts integer or single character | |\n| | string). | |\n+--------------+-------------------------------------------------------+---------+\n| ``\'r\'`` | String (converts any Python object using *repr()*). | (5) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'s\'`` | String (converts any Python object using ``str()``). | (6) |\n+--------------+-------------------------------------------------------+---------+\n| ``\'%\'`` | No argument is converted, results in a ``\'%\'`` | |\n| | character in the result. | |\n+--------------+-------------------------------------------------------+---------+\n\nNotes:\n\n1. The alternate form causes a leading zero (``\'0\'``) to be inserted\n between left-hand padding and the formatting of the number if the\n leading character of the result is not already a zero.\n\n2. The alternate form causes a leading ``\'0x\'`` or ``\'0X\'`` (depending\n on whether the ``\'x\'`` or ``\'X\'`` format was used) to be inserted\n between left-hand padding and the formatting of the number if the\n leading character of the result is not already a zero.\n\n3. The alternate form causes the result to always contain a decimal\n point, even if no digits follow it.\n\n The precision determines the number of digits after the decimal\n point and defaults to 6.\n\n4. The alternate form causes the result to always contain a decimal\n point, and trailing zeroes are not removed as they would otherwise\n be.\n\n The precision determines the number of significant digits before\n and after the decimal point and defaults to 6.\n\n5. The ``%r`` conversion was added in Python 2.0.\n\n The precision determines the maximal number of characters used.\n\n6. If the object or format provided is a ``unicode`` string, the\n resulting string will also be ``unicode``.\n\n The precision determines the maximal number of characters used.\n\n7. See **PEP 237**.\n\nSince Python strings have an explicit length, ``%s`` conversions do\nnot assume that ``\'\\0\'`` is the end of the string.\n\nChanged in version 2.7: ``%f`` conversions for numbers whose absolute\nvalue is over 1e50 are no longer replaced by ``%g`` conversions.\n\nAdditional string operations are defined in standard modules\n``string`` and ``re``.\n\n\nXRange Type\n===========\n\nThe ``xrange`` type is an immutable sequence which is commonly used\nfor looping. 
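A small sketch of typical ``xrange`` usage (the loop bound and the large range below are arbitrary):

   >>> for i in xrange(3):
   ...     print i
   ...
   0
   1
   2
   >>> len(xrange(10 ** 8))     # no 100-million-element list is built
   100000000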
The advantage of the ``xrange`` type is that an\n``xrange`` object will always take the same amount of memory, no\nmatter the size of the range it represents. There are no consistent\nperformance advantages.\n\nXRange objects have very little behavior: they only support indexing,\niteration, and the ``len()`` function.\n\n\nMutable Sequence Types\n======================\n\nList and ``bytearray`` objects support additional operations that\nallow in-place modification of the object. Other mutable sequence\ntypes (when added to the language) should also support these\noperations. Strings and tuples are immutable sequence types: such\nobjects cannot be modified once created. The following operations are\ndefined on mutable sequence types (where *x* is an arbitrary object):\n\n+--------------------------------+----------------------------------+-----------------------+\n| Operation | Result | Notes |\n+================================+==================================+=======================+\n| ``s[i] = x`` | item *i* of *s* is replaced by | |\n| | *x* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s[i:j] = t`` | slice of *s* from *i* to *j* is | |\n| | replaced by the contents of the | |\n| | iterable *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``del s[i:j]`` | same as ``s[i:j] = []`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s[i:j:k] = t`` | the elements of ``s[i:j:k]`` are | (1) |\n| | replaced by those of *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``del s[i:j:k]`` | removes the elements of | |\n| | ``s[i:j:k]`` from the list | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.append(x)`` | same as ``s[len(s):len(s)] = | (2) |\n| | [x]`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.extend(x)`` | same as ``s[len(s):len(s)] = x`` | (3) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.count(x)`` | return number of *i*\'s for which | |\n| | ``s[i] == x`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.index(x[, i[, j]])`` | return smallest *k* such that | (4) |\n| | ``s[k] == x`` and ``i <= k < j`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.insert(i, x)`` | same as ``s[i:i] = [x]`` | (5) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.pop([i])`` | same as ``x = s[i]; del s[i]; | (6) |\n| | return x`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.remove(x)`` | same as ``del s[s.index(x)]`` | (4) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.reverse()`` | reverses the items of *s* in | (7) |\n| | place | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.sort([cmp[, key[, | sort the items of *s* in place | (7)(8)(9)(10) |\n| reverse]]])`` | | |\n+--------------------------------+----------------------------------+-----------------------+\n\nNotes:\n\n1. *t* must have the same length as the slice it is replacing.\n\n2. 
The C implementation of Python has historically accepted multiple\n parameters and implicitly joined them into a tuple; this no longer\n works in Python 2.0. Use of this misfeature has been deprecated\n since Python 1.4.\n\n3. *x* can be any iterable object.\n\n4. Raises ``ValueError`` when *x* is not found in *s*. When a negative\n index is passed as the second or third parameter to the ``index()``\n method, the list length is added, as for slice indices. If it is\n still negative, it is truncated to zero, as for slice indices.\n\n Changed in version 2.3: Previously, ``index()`` didn\'t have\n arguments for specifying start and stop positions.\n\n5. When a negative index is passed as the first parameter to the\n ``insert()`` method, the list length is added, as for slice\n indices. If it is still negative, it is truncated to zero, as for\n slice indices.\n\n Changed in version 2.3: Previously, all negative indices were\n truncated to zero.\n\n6. The ``pop()`` method\'s optional argument *i* defaults to ``-1``, so\n that by default the last item is removed and returned.\n\n7. The ``sort()`` and ``reverse()`` methods modify the list in place\n for economy of space when sorting or reversing a large list. To\n remind you that they operate by side effect, they don\'t return the\n sorted or reversed list.\n\n8. The ``sort()`` method takes optional arguments for controlling the\n comparisons.\n\n *cmp* specifies a custom comparison function of two arguments (list\n items) which should return a negative, zero or positive number\n depending on whether the first argument is considered smaller than,\n equal to, or larger than the second argument: ``cmp=lambda x,y:\n cmp(x.lower(), y.lower())``. The default value is ``None``.\n\n *key* specifies a function of one argument that is used to extract\n a comparison key from each list element: ``key=str.lower``. The\n default value is ``None``.\n\n *reverse* is a boolean value. If set to ``True``, then the list\n elements are sorted as if each comparison were reversed.\n\n In general, the *key* and *reverse* conversion processes are much\n faster than specifying an equivalent *cmp* function. This is\n because *cmp* is called multiple times for each list element while\n *key* and *reverse* touch each element only once. Use\n ``functools.cmp_to_key()`` to convert an old-style *cmp* function\n to a *key* function.\n\n Changed in version 2.3: Support for ``None`` as an equivalent to\n omitting *cmp* was added.\n\n Changed in version 2.4: Support for *key* and *reverse* was added.\n\n9. Starting with Python 2.3, the ``sort()`` method is guaranteed to be\n stable. A sort is stable if it guarantees not to change the\n relative order of elements that compare equal --- this is helpful\n for sorting in multiple passes (for example, sort by department,\n then by salary grade).\n\n10. **CPython implementation detail:** While a list is being sorted,\n the effect of attempting to mutate, or even inspect, the list is\n undefined. The C implementation of Python 2.3 and newer makes the\n list appear empty for the duration, and raises ``ValueError`` if\n it can detect that the list has been mutated during a sort.\n', - 'typesseq-mutable': "\nMutable Sequence Types\n**********************\n\nList and ``bytearray`` objects support additional operations that\nallow in-place modification of the object. Other mutable sequence\ntypes (when added to the language) should also support these\noperations. 
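As a quick sketch of the *key* and *reverse* arguments described in the sort notes above (the word list is arbitrary):

   >>> words = ['banana', 'Apple', 'cherry']
   >>> words.sort(key=str.lower)
   >>> words
   ['Apple', 'banana', 'cherry']
   >>> words.sort(key=len, reverse=True)
   >>> words
   ['banana', 'cherry', 'Apple']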
Strings and tuples are immutable sequence types: such\nobjects cannot be modified once created. The following operations are\ndefined on mutable sequence types (where *x* is an arbitrary object):\n\n+--------------------------------+----------------------------------+-----------------------+\n| Operation | Result | Notes |\n+================================+==================================+=======================+\n| ``s[i] = x`` | item *i* of *s* is replaced by | |\n| | *x* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s[i:j] = t`` | slice of *s* from *i* to *j* is | |\n| | replaced by the contents of the | |\n| | iterable *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``del s[i:j]`` | same as ``s[i:j] = []`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s[i:j:k] = t`` | the elements of ``s[i:j:k]`` are | (1) |\n| | replaced by those of *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``del s[i:j:k]`` | removes the elements of | |\n| | ``s[i:j:k]`` from the list | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.append(x)`` | same as ``s[len(s):len(s)] = | (2) |\n| | [x]`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.extend(x)`` | same as ``s[len(s):len(s)] = x`` | (3) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.count(x)`` | return number of *i*'s for which | |\n| | ``s[i] == x`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.index(x[, i[, j]])`` | return smallest *k* such that | (4) |\n| | ``s[k] == x`` and ``i <= k < j`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.insert(i, x)`` | same as ``s[i:i] = [x]`` | (5) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.pop([i])`` | same as ``x = s[i]; del s[i]; | (6) |\n| | return x`` | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.remove(x)`` | same as ``del s[s.index(x)]`` | (4) |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.reverse()`` | reverses the items of *s* in | (7) |\n| | place | |\n+--------------------------------+----------------------------------+-----------------------+\n| ``s.sort([cmp[, key[, | sort the items of *s* in place | (7)(8)(9)(10) |\n| reverse]]])`` | | |\n+--------------------------------+----------------------------------+-----------------------+\n\nNotes:\n\n1. *t* must have the same length as the slice it is replacing.\n\n2. The C implementation of Python has historically accepted multiple\n parameters and implicitly joined them into a tuple; this no longer\n works in Python 2.0. Use of this misfeature has been deprecated\n since Python 1.4.\n\n3. *x* can be any iterable object.\n\n4. Raises ``ValueError`` when *x* is not found in *s*. When a negative\n index is passed as the second or third parameter to the ``index()``\n method, the list length is added, as for slice indices. 
If it is\n still negative, it is truncated to zero, as for slice indices.\n\n Changed in version 2.3: Previously, ``index()`` didn't have\n arguments for specifying start and stop positions.\n\n5. When a negative index is passed as the first parameter to the\n ``insert()`` method, the list length is added, as for slice\n indices. If it is still negative, it is truncated to zero, as for\n slice indices.\n\n Changed in version 2.3: Previously, all negative indices were\n truncated to zero.\n\n6. The ``pop()`` method's optional argument *i* defaults to ``-1``, so\n that by default the last item is removed and returned.\n\n7. The ``sort()`` and ``reverse()`` methods modify the list in place\n for economy of space when sorting or reversing a large list. To\n remind you that they operate by side effect, they don't return the\n sorted or reversed list.\n\n8. The ``sort()`` method takes optional arguments for controlling the\n comparisons.\n\n *cmp* specifies a custom comparison function of two arguments (list\n items) which should return a negative, zero or positive number\n depending on whether the first argument is considered smaller than,\n equal to, or larger than the second argument: ``cmp=lambda x,y:\n cmp(x.lower(), y.lower())``. The default value is ``None``.\n\n *key* specifies a function of one argument that is used to extract\n a comparison key from each list element: ``key=str.lower``. The\n default value is ``None``.\n\n *reverse* is a boolean value. If set to ``True``, then the list\n elements are sorted as if each comparison were reversed.\n\n In general, the *key* and *reverse* conversion processes are much\n faster than specifying an equivalent *cmp* function. This is\n because *cmp* is called multiple times for each list element while\n *key* and *reverse* touch each element only once. Use\n ``functools.cmp_to_key()`` to convert an old-style *cmp* function\n to a *key* function.\n\n Changed in version 2.3: Support for ``None`` as an equivalent to\n omitting *cmp* was added.\n\n Changed in version 2.4: Support for *key* and *reverse* was added.\n\n9. Starting with Python 2.3, the ``sort()`` method is guaranteed to be\n stable. A sort is stable if it guarantees not to change the\n relative order of elements that compare equal --- this is helpful\n for sorting in multiple passes (for example, sort by department,\n then by salary grade).\n\n10. **CPython implementation detail:** While a list is being sorted,\n the effect of attempting to mutate, or even inspect, the list is\n undefined. The C implementation of Python 2.3 and newer makes the\n list appear empty for the duration, and raises ``ValueError`` if\n it can detect that the list has been mutated during a sort.\n", - 'unary': '\nUnary arithmetic and bitwise operations\n***************************************\n\nAll unary arithmetic and bitwise operations have the same priority:\n\n u_expr ::= power | "-" u_expr | "+" u_expr | "~" u_expr\n\nThe unary ``-`` (minus) operator yields the negation of its numeric\nargument.\n\nThe unary ``+`` (plus) operator yields its numeric argument unchanged.\n\nThe unary ``~`` (invert) operator yields the bitwise inversion of its\nplain or long integer argument. The bitwise inversion of ``x`` is\ndefined as ``-(x+1)``. 
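For example (arbitrary operands):

   >>> ~5        # same as -(5+1)
   -6
   >>> ~-1
   0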
It only applies to integral numbers.\n\nIn all three cases, if the argument does not have the proper type, a\n``TypeError`` exception is raised.\n', - 'while': '\nThe ``while`` statement\n***********************\n\nThe ``while`` statement is used for repeated execution as long as an\nexpression is true:\n\n while_stmt ::= "while" expression ":" suite\n ["else" ":" suite]\n\nThis repeatedly tests the expression and, if it is true, executes the\nfirst suite; if the expression is false (which may be the first time\nit is tested) the suite of the ``else`` clause, if present, is\nexecuted and the loop terminates.\n\nA ``break`` statement executed in the first suite terminates the loop\nwithout executing the ``else`` clause\'s suite. A ``continue``\nstatement executed in the first suite skips the rest of the suite and\ngoes back to testing the expression.\n', - 'with': '\nThe ``with`` statement\n**********************\n\nNew in version 2.5.\n\nThe ``with`` statement is used to wrap the execution of a block with\nmethods defined by a context manager (see section *With Statement\nContext Managers*). This allows common\n``try``...``except``...``finally`` usage patterns to be encapsulated\nfor convenient reuse.\n\n with_stmt ::= "with" with_item ("," with_item)* ":" suite\n with_item ::= expression ["as" target]\n\nThe execution of the ``with`` statement with one "item" proceeds as\nfollows:\n\n1. The context expression (the expression given in the ``with_item``)\n is evaluated to obtain a context manager.\n\n2. The context manager\'s ``__exit__()`` is loaded for later use.\n\n3. The context manager\'s ``__enter__()`` method is invoked.\n\n4. If a target was included in the ``with`` statement, the return\n value from ``__enter__()`` is assigned to it.\n\n Note: The ``with`` statement guarantees that if the ``__enter__()``\n method returns without an error, then ``__exit__()`` will always\n be called. Thus, if an error occurs during the assignment to the\n target list, it will be treated the same as an error occurring\n within the suite would be. See step 6 below.\n\n5. The suite is executed.\n\n6. The context manager\'s ``__exit__()`` method is invoked. If an\n exception caused the suite to be exited, its type, value, and\n traceback are passed as arguments to ``__exit__()``. Otherwise,\n three ``None`` arguments are supplied.\n\n If the suite was exited due to an exception, and the return value\n from the ``__exit__()`` method was false, the exception is\n reraised. If the return value was true, the exception is\n suppressed, and execution continues with the statement following\n the ``with`` statement.\n\n If the suite was exited for any reason other than an exception, the\n return value from ``__exit__()`` is ignored, and execution proceeds\n at the normal location for the kind of exit that was taken.\n\nWith more than one item, the context managers are processed as if\nmultiple ``with`` statements were nested:\n\n with A() as a, B() as b:\n suite\n\nis equivalent to\n\n with A() as a:\n with B() as b:\n suite\n\nNote: In Python 2.5, the ``with`` statement is only allowed when the\n ``with_statement`` feature has been enabled. 
It is always enabled\n in Python 2.6.\n\nChanged in version 2.7: Support for multiple context expressions.\n\nSee also:\n\n **PEP 0343** - The "with" statement\n The specification, background, and examples for the Python\n ``with`` statement.\n', - 'yield': '\nThe ``yield`` statement\n***********************\n\n yield_stmt ::= yield_expression\n\nThe ``yield`` statement is only used when defining a generator\nfunction, and is only used in the body of the generator function.\nUsing a ``yield`` statement in a function definition is sufficient to\ncause that definition to create a generator function instead of a\nnormal function.\n\nWhen a generator function is called, it returns an iterator known as a\ngenerator iterator, or more commonly, a generator. The body of the\ngenerator function is executed by calling the generator\'s ``next()``\nmethod repeatedly until it raises an exception.\n\nWhen a ``yield`` statement is executed, the state of the generator is\nfrozen and the value of ``expression_list`` is returned to\n``next()``\'s caller. By "frozen" we mean that all local state is\nretained, including the current bindings of local variables, the\ninstruction pointer, and the internal evaluation stack: enough\ninformation is saved so that the next time ``next()`` is invoked, the\nfunction can proceed exactly as if the ``yield`` statement were just\nanother external call.\n\nAs of Python version 2.5, the ``yield`` statement is now allowed in\nthe ``try`` clause of a ``try`` ... ``finally`` construct. If the\ngenerator is not resumed before it is finalized (by reaching a zero\nreference count or by being garbage collected), the generator-\niterator\'s ``close()`` method will be called, allowing any pending\n``finally`` clauses to execute.\n\nFor full details of ``yield`` semantics, refer to the *Yield\nexpressions* section.\n\nNote: In Python 2.2, the ``yield`` statement was only allowed when the\n ``generators`` feature has been enabled. This ``__future__`` import\n statement was used to enable the feature:\n\n from __future__ import generators\n\nSee also:\n\n **PEP 0255** - Simple Generators\n The proposal for adding generators and the ``yield`` statement\n to Python.\n\n **PEP 0342** - Coroutines via Enhanced Generators\n The proposal that, among other generator enhancements, proposed\n allowing ``yield`` to appear inside a ``try`` ... ``finally``\n block.\n'} +# -*- coding: utf-8 -*- +# Autogenerated by Sphinx on Tue Nov 25 18:24:45 2014 +topics = {'assert': u'\nThe "assert" statement\n**********************\n\nAssert statements are a convenient way to insert debugging assertions\ninto a program:\n\n assert_stmt ::= "assert" expression ["," expression]\n\nThe simple form, "assert expression", is equivalent to\n\n if __debug__:\n if not expression: raise AssertionError\n\nThe extended form, "assert expression1, expression2", is equivalent to\n\n if __debug__:\n if not expression1: raise AssertionError(expression2)\n\nThese equivalences assume that "__debug__" and "AssertionError" refer\nto the built-in variables with those names. In the current\nimplementation, the built-in variable "__debug__" is "True" under\nnormal circumstances, "False" when optimization is requested (command\nline option -O). The current code generator emits no code for an\nassert statement when optimization is requested at compile time. 
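For example (the failing condition and the message are arbitrary):

   >>> assert 2 + 2 == 5, "arithmetic is broken"
   Traceback (most recent call last):
     ...
   AssertionError: arithmetic is broken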
Note\nthat it is unnecessary to include the source code for the expression\nthat failed in the error message; it will be displayed as part of the\nstack trace.\n\nAssignments to "__debug__" are illegal. The value for the built-in\nvariable is determined when the interpreter starts.\n', + 'assignment': u'\nAssignment statements\n*********************\n\nAssignment statements are used to (re)bind names to values and to\nmodify attributes or items of mutable objects:\n\n assignment_stmt ::= (target_list "=")+ (expression_list | yield_expression)\n target_list ::= target ("," target)* [","]\n target ::= identifier\n | "(" target_list ")"\n | "[" target_list "]"\n | attributeref\n | subscription\n | slicing\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn assignment statement evaluates the expression list (remember that\nthis can be a single expression or a comma-separated list, the latter\nyielding a tuple) and assigns the single resulting object to each of\nthe target lists, from left to right.\n\nAssignment is defined recursively depending on the form of the target\n(list). When a target is part of a mutable object (an attribute\nreference, subscription or slicing), the mutable object must\nultimately perform the assignment and decide about its validity, and\nmay raise an exception if the assignment is unacceptable. The rules\nobserved by various types and the exceptions raised are given with the\ndefinition of the object types (see section *The standard type\nhierarchy*).\n\nAssignment of an object to a target list is recursively defined as\nfollows.\n\n* If the target list is a single target: The object is assigned to\n that target.\n\n* If the target list is a comma-separated list of targets: The\n object must be an iterable with the same number of items as there\n are targets in the target list, and the items are assigned, from\n left to right, to the corresponding targets.\n\nAssignment of an object to a single target is recursively defined as\nfollows.\n\n* If the target is an identifier (name):\n\n * If the name does not occur in a "global" statement in the\n current code block: the name is bound to the object in the current\n local namespace.\n\n * Otherwise: the name is bound to the object in the current global\n namespace.\n\n The name is rebound if it was already bound. This may cause the\n reference count for the object previously bound to the name to reach\n zero, causing the object to be deallocated and its destructor (if it\n has one) to be called.\n\n* If the target is a target list enclosed in parentheses or in\n square brackets: The object must be an iterable with the same number\n of items as there are targets in the target list, and its items are\n assigned, from left to right, to the corresponding targets.\n\n* If the target is an attribute reference: The primary expression in\n the reference is evaluated. It should yield an object with\n assignable attributes; if this is not the case, "TypeError" is\n raised. That object is then asked to assign the assigned object to\n the given attribute; if it cannot perform the assignment, it raises\n an exception (usually but not necessarily "AttributeError").\n\n Note: If the object is a class instance and the attribute reference\n occurs on both sides of the assignment operator, the RHS expression,\n "a.x" can access either an instance attribute or (if no instance\n attribute exists) a class attribute. The LHS target "a.x" is always\n set as an instance attribute, creating it if necessary. 
Thus, the\n two occurrences of "a.x" do not necessarily refer to the same\n attribute: if the RHS expression refers to a class attribute, the\n LHS creates a new instance attribute as the target of the\n assignment:\n\n class Cls:\n x = 3 # class variable\n inst = Cls()\n inst.x = inst.x + 1 # writes inst.x as 4 leaving Cls.x as 3\n\n This description does not necessarily apply to descriptor\n attributes, such as properties created with "property()".\n\n* If the target is a subscription: The primary expression in the\n reference is evaluated. It should yield either a mutable sequence\n object (such as a list) or a mapping object (such as a dictionary).\n Next, the subscript expression is evaluated.\n\n If the primary is a mutable sequence object (such as a list), the\n subscript must yield a plain integer. If it is negative, the\n sequence\'s length is added to it. The resulting value must be a\n nonnegative integer less than the sequence\'s length, and the\n sequence is asked to assign the assigned object to its item with\n that index. If the index is out of range, "IndexError" is raised\n (assignment to a subscripted sequence cannot add new items to a\n list).\n\n If the primary is a mapping object (such as a dictionary), the\n subscript must have a type compatible with the mapping\'s key type,\n and the mapping is then asked to create a key/datum pair which maps\n the subscript to the assigned object. This can either replace an\n existing key/value pair with the same key value, or insert a new\n key/value pair (if no key with the same value existed).\n\n* If the target is a slicing: The primary expression in the\n reference is evaluated. It should yield a mutable sequence object\n (such as a list). The assigned object should be a sequence object\n of the same type. Next, the lower and upper bound expressions are\n evaluated, insofar they are present; defaults are zero and the\n sequence\'s length. The bounds should evaluate to (small) integers.\n If either bound is negative, the sequence\'s length is added to it.\n The resulting bounds are clipped to lie between zero and the\n sequence\'s length, inclusive. Finally, the sequence object is asked\n to replace the slice with the items of the assigned sequence. The\n length of the slice may be different from the length of the assigned\n sequence, thus changing the length of the target sequence, if the\n object allows it.\n\n**CPython implementation detail:** In the current implementation, the\nsyntax for targets is taken to be the same as for expressions, and\ninvalid syntax is rejected during the code generation phase, causing\nless detailed error messages.\n\nWARNING: Although the definition of assignment implies that overlaps\nbetween the left-hand side and the right-hand side are \'safe\' (for\nexample "a, b = b, a" swaps two variables), overlaps *within* the\ncollection of assigned-to variables are not safe! 
For instance, the\nfollowing program prints "[0, 2]":\n\n x = [0, 1]\n i = 0\n i, x[i] = 1, 2\n print x\n\n\nAugmented assignment statements\n===============================\n\nAugmented assignment is the combination, in a single statement, of a\nbinary operation and an assignment statement:\n\n augmented_assignment_stmt ::= augtarget augop (expression_list | yield_expression)\n augtarget ::= identifier | attributeref | subscription | slicing\n augop ::= "+=" | "-=" | "*=" | "/=" | "//=" | "%=" | "**="\n | ">>=" | "<<=" | "&=" | "^=" | "|="\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn augmented assignment evaluates the target (which, unlike normal\nassignment statements, cannot be an unpacking) and the expression\nlist, performs the binary operation specific to the type of assignment\non the two operands, and assigns the result to the original target.\nThe target is only evaluated once.\n\nAn augmented assignment expression like "x += 1" can be rewritten as\n"x = x + 1" to achieve a similar, but not exactly equal effect. In the\naugmented version, "x" is only evaluated once. Also, when possible,\nthe actual operation is performed *in-place*, meaning that rather than\ncreating a new object and assigning that to the target, the old object\nis modified instead.\n\nWith the exception of assigning to tuples and multiple targets in a\nsingle statement, the assignment done by augmented assignment\nstatements is handled the same way as normal assignments. Similarly,\nwith the exception of the possible *in-place* behavior, the binary\noperation performed by augmented assignment is the same as the normal\nbinary operations.\n\nFor targets which are attribute references, the same *caveat about\nclass and instance attributes* applies as for regular assignments.\n', + 'atom-identifiers': u'\nIdentifiers (Names)\n*******************\n\nAn identifier occurring as an atom is a name. See section\n*Identifiers and keywords* for lexical definition and section *Naming\nand binding* for documentation of naming and binding.\n\nWhen the name is bound to an object, evaluation of the atom yields\nthat object. When a name is not bound, an attempt to evaluate it\nraises a "NameError" exception.\n\n**Private name mangling:** When an identifier that textually occurs in\na class definition begins with two or more underscore characters and\ndoes not end in two or more underscores, it is considered a *private\nname* of that class. Private names are transformed to a longer form\nbefore code is generated for them. The transformation inserts the\nclass name, with leading underscores removed and a single underscore\ninserted, in front of the name. For example, the identifier "__spam"\noccurring in a class named "Ham" will be transformed to "_Ham__spam".\nThis transformation is independent of the syntactical context in which\nthe identifier is used. If the transformed name is extremely long\n(longer than 255 characters), implementation defined truncation may\nhappen. If the class name consists only of underscores, no\ntransformation is done.\n', + 'atom-literals': u"\nLiterals\n********\n\nPython supports string literals and various numeric literals:\n\n literal ::= stringliteral | integer | longinteger\n | floatnumber | imagnumber\n\nEvaluation of a literal yields an object of the given type (string,\ninteger, long integer, floating point number, complex number) with the\ngiven value. The value may be approximated in the case of floating\npoint and imaginary (complex) literals. 
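For example, the literals ``0.1``, ``0.2`` and ``0.3`` are each stored as the nearest binary floating point value, so:

   >>> 0.1 + 0.2 == 0.3
   False
   >>> 0.1 + 0.2
   0.30000000000000004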
See section *Literals* for\ndetails.\n\nAll literals correspond to immutable data types, and hence the\nobject's identity is less important than its value. Multiple\nevaluations of literals with the same value (either the same\noccurrence in the program text or a different occurrence) may obtain\nthe same object or a different object with the same value.\n", + 'attribute-access': u'\nCustomizing attribute access\n****************************\n\nThe following methods can be defined to customize the meaning of\nattribute access (use of, assignment to, or deletion of "x.name") for\nclass instances.\n\nobject.__getattr__(self, name)\n\n Called when an attribute lookup has not found the attribute in the\n usual places (i.e. it is not an instance attribute nor is it found\n in the class tree for "self"). "name" is the attribute name. This\n method should return the (computed) attribute value or raise an\n "AttributeError" exception.\n\n Note that if the attribute is found through the normal mechanism,\n "__getattr__()" is not called. (This is an intentional asymmetry\n between "__getattr__()" and "__setattr__()".) This is done both for\n efficiency reasons and because otherwise "__getattr__()" would have\n no way to access other attributes of the instance. Note that at\n least for instance variables, you can fake total control by not\n inserting any values in the instance attribute dictionary (but\n instead inserting them in another object). See the\n "__getattribute__()" method below for a way to actually get total\n control in new-style classes.\n\nobject.__setattr__(self, name, value)\n\n Called when an attribute assignment is attempted. This is called\n instead of the normal mechanism (i.e. store the value in the\n instance dictionary). *name* is the attribute name, *value* is the\n value to be assigned to it.\n\n If "__setattr__()" wants to assign to an instance attribute, it\n should not simply execute "self.name = value" --- this would cause\n a recursive call to itself. Instead, it should insert the value in\n the dictionary of instance attributes, e.g., "self.__dict__[name] =\n value". For new-style classes, rather than accessing the instance\n dictionary, it should call the base class method with the same\n name, for example, "object.__setattr__(self, name, value)".\n\nobject.__delattr__(self, name)\n\n Like "__setattr__()" but for attribute deletion instead of\n assignment. This should only be implemented if "del obj.name" is\n meaningful for the object.\n\n\nMore attribute access for new-style classes\n===========================================\n\nThe following methods only apply to new-style classes.\n\nobject.__getattribute__(self, name)\n\n Called unconditionally to implement attribute accesses for\n instances of the class. If the class also defines "__getattr__()",\n the latter will not be called unless "__getattribute__()" either\n calls it explicitly or raises an "AttributeError". This method\n should return the (computed) attribute value or raise an\n "AttributeError" exception. In order to avoid infinite recursion in\n this method, its implementation should always call the base class\n method with the same name to access any attributes it needs, for\n example, "object.__getattribute__(self, name)".\n\n Note: This method may still be bypassed when looking up special\n methods as the result of implicit invocation via language syntax\n or built-in functions. 
See *Special method lookup for new-style\n classes*.\n\n\nImplementing Descriptors\n========================\n\nThe following methods only apply when an instance of the class\ncontaining the method (a so-called *descriptor* class) appears in an\n*owner* class (the descriptor must be in either the owner\'s class\ndictionary or in the class dictionary for one of its parents). In the\nexamples below, "the attribute" refers to the attribute whose name is\nthe key of the property in the owner class\' "__dict__".\n\nobject.__get__(self, instance, owner)\n\n Called to get the attribute of the owner class (class attribute\n access) or of an instance of that class (instance attribute\n access). *owner* is always the owner class, while *instance* is the\n instance that the attribute was accessed through, or "None" when\n the attribute is accessed through the *owner*. This method should\n return the (computed) attribute value or raise an "AttributeError"\n exception.\n\nobject.__set__(self, instance, value)\n\n Called to set the attribute on an instance *instance* of the owner\n class to a new value, *value*.\n\nobject.__delete__(self, instance)\n\n Called to delete the attribute on an instance *instance* of the\n owner class.\n\n\nInvoking Descriptors\n====================\n\nIn general, a descriptor is an object attribute with "binding\nbehavior", one whose attribute access has been overridden by methods\nin the descriptor protocol: "__get__()", "__set__()", and\n"__delete__()". If any of those methods are defined for an object, it\nis said to be a descriptor.\n\nThe default behavior for attribute access is to get, set, or delete\nthe attribute from an object\'s dictionary. For instance, "a.x" has a\nlookup chain starting with "a.__dict__[\'x\']", then\n"type(a).__dict__[\'x\']", and continuing through the base classes of\n"type(a)" excluding metaclasses.\n\nHowever, if the looked-up value is an object defining one of the\ndescriptor methods, then Python may override the default behavior and\ninvoke the descriptor method instead. Where this occurs in the\nprecedence chain depends on which descriptor methods were defined and\nhow they were called. Note that descriptors are only invoked for new\nstyle objects or classes (ones that subclass "object()" or "type()").\n\nThe starting point for descriptor invocation is a binding, "a.x". How\nthe arguments are assembled depends on "a":\n\nDirect Call\n The simplest and least common call is when user code directly\n invokes a descriptor method: "x.__get__(a)".\n\nInstance Binding\n If binding to a new-style object instance, "a.x" is transformed\n into the call: "type(a).__dict__[\'x\'].__get__(a, type(a))".\n\nClass Binding\n If binding to a new-style class, "A.x" is transformed into the\n call: "A.__dict__[\'x\'].__get__(None, A)".\n\nSuper Binding\n If "a" is an instance of "super", then the binding "super(B,\n obj).m()" searches "obj.__class__.__mro__" for the base class "A"\n immediately preceding "B" and then invokes the descriptor with the\n call: "A.__dict__[\'m\'].__get__(obj, obj.__class__)".\n\nFor instance bindings, the precedence of descriptor invocation depends\non the which descriptor methods are defined. A descriptor can define\nany combination of "__get__()", "__set__()" and "__delete__()". If it\ndoes not define "__get__()", then accessing the attribute will return\nthe descriptor object itself unless there is a value in the object\'s\ninstance dictionary. 
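A minimal sketch of a non-data descriptor (the class names ``Ten`` and ``C`` are made up):

   >>> class Ten(object):
   ...     def __get__(self, instance, owner):
   ...         return 10
   ...
   >>> class C(object):
   ...     x = Ten()
   ...
   >>> C().x                     # resolved through Ten.__get__
   10
   >>> c = C()
   >>> c.__dict__['x'] = 99      # instance dictionary shadows a non-data descriptor
   >>> c.x
   99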
If the descriptor defines "__set__()" and/or\n"__delete__()", it is a data descriptor; if it defines neither, it is\na non-data descriptor. Normally, data descriptors define both\n"__get__()" and "__set__()", while non-data descriptors have just the\n"__get__()" method. Data descriptors with "__set__()" and "__get__()"\ndefined always override a redefinition in an instance dictionary. In\ncontrast, non-data descriptors can be overridden by instances.\n\nPython methods (including "staticmethod()" and "classmethod()") are\nimplemented as non-data descriptors. Accordingly, instances can\nredefine and override methods. This allows individual instances to\nacquire behaviors that differ from other instances of the same class.\n\nThe "property()" function is implemented as a data descriptor.\nAccordingly, instances cannot override the behavior of a property.\n\n\n__slots__\n=========\n\nBy default, instances of both old and new-style classes have a\ndictionary for attribute storage. This wastes space for objects\nhaving very few instance variables. The space consumption can become\nacute when creating large numbers of instances.\n\nThe default can be overridden by defining *__slots__* in a new-style\nclass definition. The *__slots__* declaration takes a sequence of\ninstance variables and reserves just enough space in each instance to\nhold a value for each variable. Space is saved because *__dict__* is\nnot created for each instance.\n\n__slots__\n\n This class variable can be assigned a string, iterable, or sequence\n of strings with variable names used by instances. If defined in a\n new-style class, *__slots__* reserves space for the declared\n variables and prevents the automatic creation of *__dict__* and\n *__weakref__* for each instance.\n\n New in version 2.2.\n\nNotes on using *__slots__*\n\n* When inheriting from a class without *__slots__*, the *__dict__*\n attribute of that class will always be accessible, so a *__slots__*\n definition in the subclass is meaningless.\n\n* Without a *__dict__* variable, instances cannot be assigned new\n variables not listed in the *__slots__* definition. Attempts to\n assign to an unlisted variable name raises "AttributeError". If\n dynamic assignment of new variables is desired, then add\n "\'__dict__\'" to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding "\'__dict__\'" to the\n *__slots__* declaration would not enable the assignment of new\n attributes not specifically listed in the sequence of instance\n variable names.\n\n* Without a *__weakref__* variable for each instance, classes\n defining *__slots__* do not support weak references to its\n instances. If weak reference support is needed, then add\n "\'__weakref__\'" to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding "\'__weakref__\'" to the\n *__slots__* declaration would not enable support for weak\n references.\n\n* *__slots__* are implemented at the class level by creating\n descriptors (*Implementing Descriptors*) for each variable name. As\n a result, class attributes cannot be used to set default values for\n instance variables defined by *__slots__*; otherwise, the class\n attribute would overwrite the descriptor assignment.\n\n* The action of a *__slots__* declaration is limited to the class\n where it is defined. 
As a result, subclasses will have a *__dict__*\n unless they also define *__slots__* (which must only contain names\n of any *additional* slots).\n\n* If a class defines a slot also defined in a base class, the\n instance variable defined by the base class slot is inaccessible\n (except by retrieving its descriptor directly from the base class).\n This renders the meaning of the program undefined. In the future, a\n check may be added to prevent this.\n\n* Nonempty *__slots__* does not work for classes derived from\n "variable-length" built-in types such as "long", "str" and "tuple".\n\n* Any non-string iterable may be assigned to *__slots__*. Mappings\n may also be used; however, in the future, special meaning may be\n assigned to the values corresponding to each key.\n\n* *__class__* assignment works only if both classes have the same\n *__slots__*.\n\n Changed in version 2.6: Previously, *__class__* assignment raised an\n error if either new or old class had *__slots__*.\n', + 'attribute-references': u'\nAttribute references\n********************\n\nAn attribute reference is a primary followed by a period and a name:\n\n attributeref ::= primary "." identifier\n\nThe primary must evaluate to an object of a type that supports\nattribute references, e.g., a module, list, or an instance. This\nobject is then asked to produce the attribute whose name is the\nidentifier. If this attribute is not available, the exception\n"AttributeError" is raised. Otherwise, the type and value of the\nobject produced is determined by the object. Multiple evaluations of\nthe same attribute reference may yield different objects.\n', + 'augassign': u'\nAugmented assignment statements\n*******************************\n\nAugmented assignment is the combination, in a single statement, of a\nbinary operation and an assignment statement:\n\n augmented_assignment_stmt ::= augtarget augop (expression_list | yield_expression)\n augtarget ::= identifier | attributeref | subscription | slicing\n augop ::= "+=" | "-=" | "*=" | "/=" | "//=" | "%=" | "**="\n | ">>=" | "<<=" | "&=" | "^=" | "|="\n\n(See section *Primaries* for the syntax definitions for the last three\nsymbols.)\n\nAn augmented assignment evaluates the target (which, unlike normal\nassignment statements, cannot be an unpacking) and the expression\nlist, performs the binary operation specific to the type of assignment\non the two operands, and assigns the result to the original target.\nThe target is only evaluated once.\n\nAn augmented assignment expression like "x += 1" can be rewritten as\n"x = x + 1" to achieve a similar, but not exactly equal effect. In the\naugmented version, "x" is only evaluated once. Also, when possible,\nthe actual operation is performed *in-place*, meaning that rather than\ncreating a new object and assigning that to the target, the old object\nis modified instead.\n\nWith the exception of assigning to tuples and multiple targets in a\nsingle statement, the assignment done by augmented assignment\nstatements is handled the same way as normal assignments. Similarly,\nwith the exception of the possible *in-place* behavior, the binary\noperation performed by augmented assignment is the same as the normal\nbinary operations.\n\nFor targets which are attribute references, the same *caveat about\nclass and instance attributes* applies as for regular assignments.\n', + 'binary': u'\nBinary arithmetic operations\n****************************\n\nThe binary arithmetic operations have the conventional priority\nlevels. 
Note that some of these operations also apply to certain non-\nnumeric types. Apart from the power operator, there are only two\nlevels, one for multiplicative operators and one for additive\noperators:\n\n m_expr ::= u_expr | m_expr "*" u_expr | m_expr "//" u_expr | m_expr "/" u_expr\n | m_expr "%" u_expr\n a_expr ::= m_expr | a_expr "+" m_expr | a_expr "-" m_expr\n\nThe "*" (multiplication) operator yields the product of its arguments.\nThe arguments must either both be numbers, or one argument must be an\ninteger (plain or long) and the other must be a sequence. In the\nformer case, the numbers are converted to a common type and then\nmultiplied together. In the latter case, sequence repetition is\nperformed; a negative repetition factor yields an empty sequence.\n\nThe "/" (division) and "//" (floor division) operators yield the\nquotient of their arguments. The numeric arguments are first\nconverted to a common type. Plain or long integer division yields an\ninteger of the same type; the result is that of mathematical division\nwith the \'floor\' function applied to the result. Division by zero\nraises the "ZeroDivisionError" exception.\n\nThe "%" (modulo) operator yields the remainder from the division of\nthe first argument by the second. The numeric arguments are first\nconverted to a common type. A zero right argument raises the\n"ZeroDivisionError" exception. The arguments may be floating point\nnumbers, e.g., "3.14%0.7" equals "0.34" (since "3.14" equals "4*0.7 +\n0.34".) The modulo operator always yields a result with the same sign\nas its second operand (or zero); the absolute value of the result is\nstrictly smaller than the absolute value of the second operand [2].\n\nThe integer division and modulo operators are connected by the\nfollowing identity: "x == (x/y)*y + (x%y)". Integer division and\nmodulo are also connected with the built-in function "divmod()":\n"divmod(x, y) == (x/y, x%y)". These identities don\'t hold for\nfloating point numbers; there similar identities hold approximately\nwhere "x/y" is replaced by "floor(x/y)" or "floor(x/y) - 1" [3].\n\nIn addition to performing the modulo operation on numbers, the "%"\noperator is also overloaded by string and unicode objects to perform\nstring formatting (also known as interpolation). The syntax for string\nformatting is described in the Python Library Reference, section\n*String Formatting Operations*.\n\nDeprecated since version 2.3: The floor division operator, the modulo\noperator, and the "divmod()" function are no longer defined for\ncomplex numbers. Instead, convert to a floating point number using\nthe "abs()" function if appropriate.\n\nThe "+" (addition) operator yields the sum of its arguments. The\narguments must either both be numbers or both sequences of the same\ntype. In the former case, the numbers are converted to a common type\nand then added together. In the latter case, the sequences are\nconcatenated.\n\nThe "-" (subtraction) operator yields the difference of its arguments.\nThe numeric arguments are first converted to a common type.\n', + 'bitwise': u'\nBinary bitwise operations\n*************************\n\nEach of the three bitwise operations has a different priority level:\n\n and_expr ::= shift_expr | and_expr "&" shift_expr\n xor_expr ::= and_expr | xor_expr "^" and_expr\n or_expr ::= xor_expr | or_expr "|" xor_expr\n\nThe "&" operator yields the bitwise AND of its arguments, which must\nbe plain or long integers. 
The arguments are converted to a common\ntype.\n\nThe "^" operator yields the bitwise XOR (exclusive OR) of its\narguments, which must be plain or long integers. The arguments are\nconverted to a common type.\n\nThe "|" operator yields the bitwise (inclusive) OR of its arguments,\nwhich must be plain or long integers. The arguments are converted to\na common type.\n', + 'bltin-code-objects': u'\nCode Objects\n************\n\nCode objects are used by the implementation to represent "pseudo-\ncompiled" executable Python code such as a function body. They differ\nfrom function objects because they don\'t contain a reference to their\nglobal execution environment. Code objects are returned by the built-\nin "compile()" function and can be extracted from function objects\nthrough their "func_code" attribute. See also the "code" module.\n\nA code object can be executed or evaluated by passing it (instead of a\nsource string) to the "exec" statement or the built-in "eval()"\nfunction.\n\nSee *The standard type hierarchy* for more information.\n', + 'bltin-ellipsis-object': u'\nThe Ellipsis Object\n*******************\n\nThis object is used by extended slice notation (see *Slicings*). It\nsupports no special operations. There is exactly one ellipsis object,\nnamed "Ellipsis" (a built-in name).\n\nIt is written as "Ellipsis". When in a subscript, it can also be\nwritten as "...", for example "seq[...]".\n', + 'bltin-null-object': u'\nThe Null Object\n***************\n\nThis object is returned by functions that don\'t explicitly return a\nvalue. It supports no special operations. There is exactly one null\nobject, named "None" (a built-in name).\n\nIt is written as "None".\n', + 'bltin-type-objects': u'\nType Objects\n************\n\nType objects represent the various object types. An object\'s type is\naccessed by the built-in function "type()". There are no special\noperations on types. The standard module "types" defines names for\nall standard built-in types.\n\nTypes are written like this: "".\n', + 'booleans': u'\nBoolean operations\n******************\n\n or_test ::= and_test | or_test "or" and_test\n and_test ::= not_test | and_test "and" not_test\n not_test ::= comparison | "not" not_test\n\nIn the context of Boolean operations, and also when expressions are\nused by control flow statements, the following values are interpreted\nas false: "False", "None", numeric zero of all types, and empty\nstrings and containers (including strings, tuples, lists,\ndictionaries, sets and frozensets). All other values are interpreted\nas true. (See the "__nonzero__()" special method for a way to change\nthis.)\n\nThe operator "not" yields "True" if its argument is false, "False"\notherwise.\n\nThe expression "x and y" first evaluates *x*; if *x* is false, its\nvalue is returned; otherwise, *y* is evaluated and the resulting value\nis returned.\n\nThe expression "x or y" first evaluates *x*; if *x* is true, its value\nis returned; otherwise, *y* is evaluated and the resulting value is\nreturned.\n\n(Note that neither "and" nor "or" restrict the value and type they\nreturn to "False" and "True", but rather return the last evaluated\nargument. This is sometimes useful, e.g., if "s" is a string that\nshould be replaced by a default value if it is empty, the expression\n"s or \'foo\'" yields the desired value. 
Because "not" has to invent a\nvalue anyway, it does not bother to return a value of the same type as\nits argument, so e.g., "not \'foo\'" yields "False", not "\'\'".)\n', + 'break': u'\nThe "break" statement\n*********************\n\n break_stmt ::= "break"\n\n"break" may only occur syntactically nested in a "for" or "while"\nloop, but not nested in a function or class definition within that\nloop.\n\nIt terminates the nearest enclosing loop, skipping the optional "else"\nclause if the loop has one.\n\nIf a "for" loop is terminated by "break", the loop control target\nkeeps its current value.\n\nWhen "break" passes control out of a "try" statement with a "finally"\nclause, that "finally" clause is executed before really leaving the\nloop.\n', + 'callable-types': u'\nEmulating callable objects\n**************************\n\nobject.__call__(self[, args...])\n\n Called when the instance is "called" as a function; if this method\n is defined, "x(arg1, arg2, ...)" is a shorthand for\n "x.__call__(arg1, arg2, ...)".\n', + 'calls': u'\nCalls\n*****\n\nA call calls a callable object (e.g., a *function*) with a possibly\nempty series of *arguments*:\n\n call ::= primary "(" [argument_list [","]\n | expression genexpr_for] ")"\n argument_list ::= positional_arguments ["," keyword_arguments]\n ["," "*" expression] ["," keyword_arguments]\n ["," "**" expression]\n | keyword_arguments ["," "*" expression]\n ["," "**" expression]\n | "*" expression ["," keyword_arguments] ["," "**" expression]\n | "**" expression\n positional_arguments ::= expression ("," expression)*\n keyword_arguments ::= keyword_item ("," keyword_item)*\n keyword_item ::= identifier "=" expression\n\nA trailing comma may be present after the positional and keyword\narguments but does not affect the semantics.\n\nThe primary must evaluate to a callable object (user-defined\nfunctions, built-in functions, methods of built-in objects, class\nobjects, methods of class instances, and certain class instances\nthemselves are callable; extensions may define additional callable\nobject types). All argument expressions are evaluated before the call\nis attempted. Please refer to section *Function definitions* for the\nsyntax of formal *parameter* lists.\n\nIf keyword arguments are present, they are first converted to\npositional arguments, as follows. First, a list of unfilled slots is\ncreated for the formal parameters. If there are N positional\narguments, they are placed in the first N slots. Next, for each\nkeyword argument, the identifier is used to determine the\ncorresponding slot (if the identifier is the same as the first formal\nparameter name, the first slot is used, and so on). If the slot is\nalready filled, a "TypeError" exception is raised. Otherwise, the\nvalue of the argument is placed in the slot, filling it (even if the\nexpression is "None", it fills the slot). When all arguments have\nbeen processed, the slots that are still unfilled are filled with the\ncorresponding default value from the function definition. (Default\nvalues are calculated, once, when the function is defined; thus, a\nmutable object such as a list or dictionary used as default value will\nbe shared by all calls that don\'t specify an argument value for the\ncorresponding slot; this should usually be avoided.) If there are any\nunfilled slots for which no default value is specified, a "TypeError"\nexception is raised. 
Otherwise, the list of filled slots is used as\nthe argument list for the call.\n\n**CPython implementation detail:** An implementation may provide\nbuilt-in functions whose positional parameters do not have names, even\nif they are \'named\' for the purpose of documentation, and which\ntherefore cannot be supplied by keyword. In CPython, this is the case\nfor functions implemented in C that use "PyArg_ParseTuple()" to parse\ntheir arguments.\n\nIf there are more positional arguments than there are formal parameter\nslots, a "TypeError" exception is raised, unless a formal parameter\nusing the syntax "*identifier" is present; in this case, that formal\nparameter receives a tuple containing the excess positional arguments\n(or an empty tuple if there were no excess positional arguments).\n\nIf any keyword argument does not correspond to a formal parameter\nname, a "TypeError" exception is raised, unless a formal parameter\nusing the syntax "**identifier" is present; in this case, that formal\nparameter receives a dictionary containing the excess keyword\narguments (using the keywords as keys and the argument values as\ncorresponding values), or a (new) empty dictionary if there were no\nexcess keyword arguments.\n\nIf the syntax "*expression" appears in the function call, "expression"\nmust evaluate to an iterable. Elements from this iterable are treated\nas if they were additional positional arguments; if there are\npositional arguments *x1*, ..., *xN*, and "expression" evaluates to a\nsequence *y1*, ..., *yM*, this is equivalent to a call with M+N\npositional arguments *x1*, ..., *xN*, *y1*, ..., *yM*.\n\nA consequence of this is that although the "*expression" syntax may\nappear *after* some keyword arguments, it is processed *before* the\nkeyword arguments (and the "**expression" argument, if any -- see\nbelow). So:\n\n >>> def f(a, b):\n ... print a, b\n ...\n >>> f(b=1, *(2,))\n 2 1\n >>> f(a=1, *(2,))\n Traceback (most recent call last):\n File "", line 1, in ?\n TypeError: f() got multiple values for keyword argument \'a\'\n >>> f(1, *(2,))\n 1 2\n\nIt is unusual for both keyword arguments and the "*expression" syntax\nto be used in the same call, so in practice this confusion does not\narise.\n\nIf the syntax "**expression" appears in the function call,\n"expression" must evaluate to a mapping, the contents of which are\ntreated as additional keyword arguments. In the case of a keyword\nappearing in both "expression" and as an explicit keyword argument, a\n"TypeError" exception is raised.\n\nFormal parameters using the syntax "*identifier" or "**identifier"\ncannot be used as positional argument slots or as keyword argument\nnames. Formal parameters using the syntax "(sublist)" cannot be used\nas keyword argument names; the outermost sublist corresponds to a\nsingle unnamed argument slot, and the argument value is assigned to\nthe sublist using the usual tuple assignment rules after all other\nparameter processing is done.\n\nA call always returns some value, possibly "None", unless it raises an\nexception. How this value is computed depends on the type of the\ncallable object.\n\nIf it is---\n\na user-defined function:\n The code block for the function is executed, passing it the\n argument list. The first thing the code block will do is bind the\n formal parameters to the arguments; this is described in section\n *Function definitions*. 
When the code block executes a "return"\n statement, this specifies the return value of the function call.\n\na built-in function or method:\n The result is up to the interpreter; see *Built-in Functions* for\n the descriptions of built-in functions and methods.\n\na class object:\n A new instance of that class is returned.\n\na class instance method:\n The corresponding user-defined function is called, with an argument\n list that is one longer than the argument list of the call: the\n instance becomes the first argument.\n\na class instance:\n The class must define a "__call__()" method; the effect is then the\n same as if that method was called.\n', + 'class': u'\nClass definitions\n*****************\n\nA class definition defines a class object (see section *The standard\ntype hierarchy*):\n\n classdef ::= "class" classname [inheritance] ":" suite\n inheritance ::= "(" [expression_list] ")"\n classname ::= identifier\n\nA class definition is an executable statement. It first evaluates the\ninheritance list, if present. Each item in the inheritance list\nshould evaluate to a class object or class type which allows\nsubclassing. The class\'s suite is then executed in a new execution\nframe (see section *Naming and binding*), using a newly created local\nnamespace and the original global namespace. (Usually, the suite\ncontains only function definitions.) When the class\'s suite finishes\nexecution, its execution frame is discarded but its local namespace is\nsaved. [4] A class object is then created using the inheritance list\nfor the base classes and the saved local namespace for the attribute\ndictionary. The class name is bound to this class object in the\noriginal local namespace.\n\n**Programmer\'s note:** Variables defined in the class definition are\nclass variables; they are shared by all instances. To create instance\nvariables, they can be set in a method with "self.name = value". Both\nclass and instance variables are accessible through the notation\n""self.name"", and an instance variable hides a class variable with\nthe same name when accessed in this way. Class variables can be used\nas defaults for instance variables, but using mutable values there can\nlead to unexpected results. For *new-style class*es, descriptors can\nbe used to create instance variables with different implementation\ndetails.\n\nClass definitions, like function definitions, may be wrapped by one or\nmore *decorator* expressions. The evaluation rules for the decorator\nexpressions are the same as for functions. The result must be a class\nobject, which is then bound to the class name.\n\n-[ Footnotes ]-\n\n[1] The exception is propagated to the invocation stack unless\n there is a "finally" clause which happens to raise another\n exception. That new exception causes the old one to be lost.\n\n[2] Currently, control "flows off the end" except in the case of\n an exception or the execution of a "return", "continue", or\n "break" statement.\n\n[3] A string literal appearing as the first statement in the\n function body is transformed into the function\'s "__doc__"\n attribute and therefore the function\'s *docstring*.\n\n[4] A string literal appearing as the first statement in the class\n body is transformed into the namespace\'s "__doc__" item and\n therefore the class\'s *docstring*.\n', + 'comparisons': u'\nComparisons\n***********\n\nUnlike C, all comparison operations in Python have the same priority,\nwhich is lower than that of any arithmetic, shifting or bitwise\noperation. 
Also unlike C, expressions like "a < b < c" have the\ninterpretation that is conventional in mathematics:\n\n comparison ::= or_expr ( comp_operator or_expr )*\n comp_operator ::= "<" | ">" | "==" | ">=" | "<=" | "<>" | "!="\n | "is" ["not"] | ["not"] "in"\n\nComparisons yield boolean values: "True" or "False".\n\nComparisons can be chained arbitrarily, e.g., "x < y <= z" is\nequivalent to "x < y and y <= z", except that "y" is evaluated only\nonce (but in both cases "z" is not evaluated at all when "x < y" is\nfound to be false).\n\nFormally, if *a*, *b*, *c*, ..., *y*, *z* are expressions and *op1*,\n*op2*, ..., *opN* are comparison operators, then "a op1 b op2 c ... y\nopN z" is equivalent to "a op1 b and b op2 c and ... y opN z", except\nthat each expression is evaluated at most once.\n\nNote that "a op1 b op2 c" doesn\'t imply any kind of comparison between\n*a* and *c*, so that, e.g., "x < y > z" is perfectly legal (though\nperhaps not pretty).\n\nThe forms "<>" and "!=" are equivalent; for consistency with C, "!="\nis preferred; where "!=" is mentioned below "<>" is also accepted.\nThe "<>" spelling is considered obsolescent.\n\nThe operators "<", ">", "==", ">=", "<=", and "!=" compare the values\nof two objects. The objects need not have the same type. If both are\nnumbers, they are converted to a common type. Otherwise, objects of\ndifferent types *always* compare unequal, and are ordered consistently\nbut arbitrarily. You can control comparison behavior of objects of\nnon-built-in types by defining a "__cmp__" method or rich comparison\nmethods like "__gt__", described in section *Special method names*.\n\n(This unusual definition of comparison was used to simplify the\ndefinition of operations like sorting and the "in" and "not in"\noperators. In the future, the comparison rules for objects of\ndifferent types are likely to change.)\n\nComparison of objects of the same type depends on the type:\n\n* Numbers are compared arithmetically.\n\n* Strings are compared lexicographically using the numeric\n equivalents (the result of the built-in function "ord()") of their\n characters. Unicode and 8-bit strings are fully interoperable in\n this behavior. [4]\n\n* Tuples and lists are compared lexicographically using comparison\n of corresponding elements. This means that to compare equal, each\n element must compare equal and the two sequences must be of the same\n type and have the same length.\n\n If not equal, the sequences are ordered the same as their first\n differing elements. For example, "cmp([1,2,x], [1,2,y])" returns\n the same as "cmp(x,y)". If the corresponding element does not\n exist, the shorter sequence is ordered first (for example, "[1,2] <\n [1,2,3]").\n\n* Mappings (dictionaries) compare equal if and only if their sorted\n (key, value) lists compare equal. [5] Outcomes other than equality\n are resolved consistently, but are not otherwise defined. [6]\n\n* Most other objects of built-in types compare unequal unless they\n are the same object; the choice whether one object is considered\n smaller or larger than another one is made arbitrarily but\n consistently within one execution of a program.\n\nThe operators "in" and "not in" test for collection membership. "x in\ns" evaluates to true if *x* is a member of the collection *s*, and\nfalse otherwise. "x not in s" returns the negation of "x in s". 
The\ncollection membership test has traditionally been bound to sequences;\nan object is a member of a collection if the collection is a sequence\nand contains an element equal to that object. However, it make sense\nfor many other object types to support membership tests without being\na sequence. In particular, dictionaries (for keys) and sets support\nmembership testing.\n\nFor the list and tuple types, "x in y" is true if and only if there\nexists an index *i* such that "x == y[i]" is true.\n\nFor the Unicode and string types, "x in y" is true if and only if *x*\nis a substring of *y*. An equivalent test is "y.find(x) != -1".\nNote, *x* and *y* need not be the same type; consequently, "u\'ab\' in\n\'abc\'" will return "True". Empty strings are always considered to be a\nsubstring of any other string, so """ in "abc"" will return "True".\n\nChanged in version 2.3: Previously, *x* was required to be a string of\nlength "1".\n\nFor user-defined classes which define the "__contains__()" method, "x\nin y" is true if and only if "y.__contains__(x)" is true.\n\nFor user-defined classes which do not define "__contains__()" but do\ndefine "__iter__()", "x in y" is true if some value "z" with "x == z"\nis produced while iterating over "y". If an exception is raised\nduring the iteration, it is as if "in" raised that exception.\n\nLastly, the old-style iteration protocol is tried: if a class defines\n"__getitem__()", "x in y" is true if and only if there is a non-\nnegative integer index *i* such that "x == y[i]", and all lower\ninteger indices do not raise "IndexError" exception. (If any other\nexception is raised, it is as if "in" raised that exception).\n\nThe operator "not in" is defined to have the inverse true value of\n"in".\n\nThe operators "is" and "is not" test for object identity: "x is y" is\ntrue if and only if *x* and *y* are the same object. "x is not y"\nyields the inverse truth value. [7]\n', + 'compound': u'\nCompound statements\n*******************\n\nCompound statements contain (groups of) other statements; they affect\nor control the execution of those other statements in some way. In\ngeneral, compound statements span multiple lines, although in simple\nincarnations a whole compound statement may be contained in one line.\n\nThe "if", "while" and "for" statements implement traditional control\nflow constructs. "try" specifies exception handlers and/or cleanup\ncode for a group of statements. Function and class definitions are\nalso syntactically compound statements.\n\nCompound statements consist of one or more \'clauses.\' A clause\nconsists of a header and a \'suite.\' The clause headers of a\nparticular compound statement are all at the same indentation level.\nEach clause header begins with a uniquely identifying keyword and ends\nwith a colon. A suite is a group of statements controlled by a\nclause. A suite can be one or more semicolon-separated simple\nstatements on the same line as the header, following the header\'s\ncolon, or it can be one or more indented statements on subsequent\nlines. 
Only the latter form of suite can contain nested compound\nstatements; the following is illegal, mostly because it wouldn\'t be\nclear to which "if" clause a following "else" clause would belong:\n\n if test1: if test2: print x\n\nAlso note that the semicolon binds tighter than the colon in this\ncontext, so that in the following example, either all or none of the\n"print" statements are executed:\n\n if x < y < z: print x; print y; print z\n\nSummarizing:\n\n compound_stmt ::= if_stmt\n | while_stmt\n | for_stmt\n | try_stmt\n | with_stmt\n | funcdef\n | classdef\n | decorated\n suite ::= stmt_list NEWLINE | NEWLINE INDENT statement+ DEDENT\n statement ::= stmt_list NEWLINE | compound_stmt\n stmt_list ::= simple_stmt (";" simple_stmt)* [";"]\n\nNote that statements always end in a "NEWLINE" possibly followed by a\n"DEDENT". Also note that optional continuation clauses always begin\nwith a keyword that cannot start a statement, thus there are no\nambiguities (the \'dangling "else"\' problem is solved in Python by\nrequiring nested "if" statements to be indented).\n\nThe formatting of the grammar rules in the following sections places\neach clause on a separate line for clarity.\n\n\nThe "if" statement\n==================\n\nThe "if" statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the "if" statement is executed or evaluated).\nIf all expressions are false, the suite of the "else" clause, if\npresent, is executed.\n\n\nThe "while" statement\n=====================\n\nThe "while" statement is used for repeated execution as long as an\nexpression is true:\n\n while_stmt ::= "while" expression ":" suite\n ["else" ":" suite]\n\nThis repeatedly tests the expression and, if it is true, executes the\nfirst suite; if the expression is false (which may be the first time\nit is tested) the suite of the "else" clause, if present, is executed\nand the loop terminates.\n\nA "break" statement executed in the first suite terminates the loop\nwithout executing the "else" clause\'s suite. A "continue" statement\nexecuted in the first suite skips the rest of the suite and goes back\nto testing the expression.\n\n\nThe "for" statement\n===================\n\nThe "for" statement is used to iterate over the elements of a sequence\n(such as a string, tuple or list) or other iterable object:\n\n for_stmt ::= "for" target_list "in" expression_list ":" suite\n ["else" ":" suite]\n\nThe expression list is evaluated once; it should yield an iterable\nobject. An iterator is created for the result of the\n"expression_list". The suite is then executed once for each item\nprovided by the iterator, in the order of ascending indices. Each\nitem in turn is assigned to the target list using the standard rules\nfor assignments, and then the suite is executed. When the items are\nexhausted (which is immediately when the sequence is empty), the suite\nin the "else" clause, if present, is executed, and the loop\nterminates.\n\nA "break" statement executed in the first suite terminates the loop\nwithout executing the "else" clause\'s suite. 
A "continue" statement\nexecuted in the first suite skips the rest of the suite and continues\nwith the next item, or with the "else" clause if there was no next\nitem.\n\nThe suite may assign to the variable(s) in the target list; this does\nnot affect the next item assigned to it.\n\nThe target list is not deleted when the loop is finished, but if the\nsequence is empty, it will not have been assigned to at all by the\nloop. Hint: the built-in function "range()" returns a sequence of\nintegers suitable to emulate the effect of Pascal\'s "for i := a to b\ndo"; e.g., "range(3)" returns the list "[0, 1, 2]".\n\nNote: There is a subtlety when the sequence is being modified by the\n loop (this can only occur for mutable sequences, i.e. lists). An\n internal counter is used to keep track of which item is used next,\n and this is incremented on each iteration. When this counter has\n reached the length of the sequence the loop terminates. This means\n that if the suite deletes the current (or a previous) item from the\n sequence, the next item will be skipped (since it gets the index of\n the current item which has already been treated). Likewise, if the\n suite inserts an item in the sequence before the current item, the\n current item will be treated again the next time through the loop.\n This can lead to nasty bugs that can be avoided by making a\n temporary copy using a slice of the whole sequence, e.g.,\n\n for x in a[:]:\n if x < 0: a.remove(x)\n\n\nThe "try" statement\n===================\n\nThe "try" statement specifies exception handlers and/or cleanup code\nfor a group of statements:\n\n try_stmt ::= try1_stmt | try2_stmt\n try1_stmt ::= "try" ":" suite\n ("except" [expression [("as" | ",") identifier]] ":" suite)+\n ["else" ":" suite]\n ["finally" ":" suite]\n try2_stmt ::= "try" ":" suite\n "finally" ":" suite\n\nChanged in version 2.5: In previous versions of Python,\n"try"..."except"..."finally" did not work. "try"..."except" had to be\nnested in "try"..."finally".\n\nThe "except" clause(s) specify one or more exception handlers. When no\nexception occurs in the "try" clause, no exception handler is\nexecuted. When an exception occurs in the "try" suite, a search for an\nexception handler is started. This search inspects the except clauses\nin turn until one is found that matches the exception. An expression-\nless except clause, if present, must be last; it matches any\nexception. For an except clause with an expression, that expression\nis evaluated, and the clause matches the exception if the resulting\nobject is "compatible" with the exception. An object is compatible\nwith an exception if it is the class or a base class of the exception\nobject, or a tuple containing an item compatible with the exception.\n\nIf no except clause matches the exception, the search for an exception\nhandler continues in the surrounding code and on the invocation stack.\n[1]\n\nIf the evaluation of an expression in the header of an except clause\nraises an exception, the original search for a handler is canceled and\na search starts for the new exception in the surrounding code and on\nthe call stack (it is treated as if the entire "try" statement raised\nthe exception).\n\nWhen a matching except clause is found, the exception is assigned to\nthe target specified in that except clause, if present, and the except\nclause\'s suite is executed. All except clauses must have an\nexecutable block. When the end of this block is reached, execution\ncontinues normally after the entire try statement. 
(This means that\nif two nested handlers exist for the same exception, and the exception\noccurs in the try clause of the inner handler, the outer handler will\nnot handle the exception.)\n\nBefore an except clause\'s suite is executed, details about the\nexception are assigned to three variables in the "sys" module:\n"sys.exc_type" receives the object identifying the exception;\n"sys.exc_value" receives the exception\'s parameter;\n"sys.exc_traceback" receives a traceback object (see section *The\nstandard type hierarchy*) identifying the point in the program where\nthe exception occurred. These details are also available through the\n"sys.exc_info()" function, which returns a tuple "(exc_type,\nexc_value, exc_traceback)". Use of the corresponding variables is\ndeprecated in favor of this function, since their use is unsafe in a\nthreaded program. As of Python 1.5, the variables are restored to\ntheir previous values (before the call) when returning from a function\nthat handled an exception.\n\nThe optional "else" clause is executed if and when control flows off\nthe end of the "try" clause. [2] Exceptions in the "else" clause are\nnot handled by the preceding "except" clauses.\n\nIf "finally" is present, it specifies a \'cleanup\' handler. The "try"\nclause is executed, including any "except" and "else" clauses. If an\nexception occurs in any of the clauses and is not handled, the\nexception is temporarily saved. The "finally" clause is executed. If\nthere is a saved exception, it is re-raised at the end of the\n"finally" clause. If the "finally" clause raises another exception or\nexecutes a "return" or "break" statement, the saved exception is\ndiscarded:\n\n >>> def f():\n ... try:\n ... 1/0\n ... finally:\n ... return 42\n ...\n >>> f()\n 42\n\nThe exception information is not available to the program during\nexecution of the "finally" clause.\n\nWhen a "return", "break" or "continue" statement is executed in the\n"try" suite of a "try"..."finally" statement, the "finally" clause is\nalso executed \'on the way out.\' A "continue" statement is illegal in\nthe "finally" clause. (The reason is a problem with the current\nimplementation --- this restriction may be lifted in the future).\n\nThe return value of a function is determined by the last "return"\nstatement executed. Since the "finally" clause always executes, a\n"return" statement executed in the "finally" clause will always be the\nlast one executed:\n\n >>> def foo():\n ... try:\n ... return \'try\'\n ... finally:\n ... return \'finally\'\n ...\n >>> foo()\n \'finally\'\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information on using the "raise" statement to\ngenerate exceptions may be found in section *The raise statement*.\n\n\nThe "with" statement\n====================\n\nNew in version 2.5.\n\nThe "with" statement is used to wrap the execution of a block with\nmethods defined by a context manager (see section *With Statement\nContext Managers*). This allows common "try"..."except"..."finally"\nusage patterns to be encapsulated for convenient reuse.\n\n with_stmt ::= "with" with_item ("," with_item)* ":" suite\n with_item ::= expression ["as" target]\n\nThe execution of the "with" statement with one "item" proceeds as\nfollows:\n\n1. The context expression (the expression given in the "with_item")\n is evaluated to obtain a context manager.\n\n2. The context manager\'s "__exit__()" is loaded for later use.\n\n3. The context manager\'s "__enter__()" method is invoked.\n\n4. 
If a target was included in the "with" statement, the return\n value from "__enter__()" is assigned to it.\n\n Note: The "with" statement guarantees that if the "__enter__()"\n method returns without an error, then "__exit__()" will always be\n called. Thus, if an error occurs during the assignment to the\n target list, it will be treated the same as an error occurring\n within the suite would be. See step 6 below.\n\n5. The suite is executed.\n\n6. The context manager\'s "__exit__()" method is invoked. If an\n exception caused the suite to be exited, its type, value, and\n traceback are passed as arguments to "__exit__()". Otherwise, three\n "None" arguments are supplied.\n\n If the suite was exited due to an exception, and the return value\n from the "__exit__()" method was false, the exception is reraised.\n If the return value was true, the exception is suppressed, and\n execution continues with the statement following the "with"\n statement.\n\n If the suite was exited for any reason other than an exception, the\n return value from "__exit__()" is ignored, and execution proceeds\n at the normal location for the kind of exit that was taken.\n\nWith more than one item, the context managers are processed as if\nmultiple "with" statements were nested:\n\n with A() as a, B() as b:\n suite\n\nis equivalent to\n\n with A() as a:\n with B() as b:\n suite\n\nNote: In Python 2.5, the "with" statement is only allowed when the\n "with_statement" feature has been enabled. It is always enabled in\n Python 2.6.\n\nChanged in version 2.7: Support for multiple context expressions.\n\nSee also: **PEP 0343** - The "with" statement\n\n The specification, background, and examples for the Python "with"\n statement.\n\n\nFunction definitions\n====================\n\nA function definition defines a user-defined function object (see\nsection *The standard type hierarchy*):\n\n decorated ::= decorators (classdef | funcdef)\n decorators ::= decorator+\n decorator ::= "@" dotted_name ["(" [argument_list [","]] ")"] NEWLINE\n funcdef ::= "def" funcname "(" [parameter_list] ")" ":" suite\n dotted_name ::= identifier ("." identifier)*\n parameter_list ::= (defparameter ",")*\n ( "*" identifier ["," "**" identifier]\n | "**" identifier\n | defparameter [","] )\n defparameter ::= parameter ["=" expression]\n sublist ::= parameter ("," parameter)* [","]\n parameter ::= identifier | "(" sublist ")"\n funcname ::= identifier\n\nA function definition is an executable statement. Its execution binds\nthe function name in the current local namespace to a function object\n(a wrapper around the executable code for the function). This\nfunction object contains a reference to the current global namespace\nas the global namespace to be used when the function is called.\n\nThe function definition does not execute the function body; this gets\nexecuted only when the function is called. [3]\n\nA function definition may be wrapped by one or more *decorator*\nexpressions. Decorator expressions are evaluated when the function is\ndefined, in the scope that contains the function definition. The\nresult must be a callable, which is invoked with the function object\nas the only argument. The returned value is bound to the function name\ninstead of the function object. Multiple decorators are applied in\nnested fashion. 
For example, the following code:\n\n @f1(arg)\n @f2\n def func(): pass\n\nis equivalent to:\n\n def func(): pass\n func = f1(arg)(f2(func))\n\nWhen one or more top-level *parameters* have the form *parameter* "="\n*expression*, the function is said to have "default parameter values."\nFor a parameter with a default value, the corresponding *argument* may\nbe omitted from a call, in which case the parameter\'s default value is\nsubstituted. If a parameter has a default value, all following\nparameters must also have a default value --- this is a syntactic\nrestriction that is not expressed by the grammar.\n\n**Default parameter values are evaluated when the function definition\nis executed.** This means that the expression is evaluated once, when\nthe function is defined, and that the same "pre-computed" value is\nused for each call. This is especially important to understand when a\ndefault parameter is a mutable object, such as a list or a dictionary:\nif the function modifies the object (e.g. by appending an item to a\nlist), the default value is in effect modified. This is generally not\nwhat was intended. A way around this is to use "None" as the\ndefault, and explicitly test for it in the body of the function, e.g.:\n\n def whats_on_the_telly(penguin=None):\n if penguin is None:\n penguin = []\n penguin.append("property of the zoo")\n return penguin\n\nFunction call semantics are described in more detail in section\n*Calls*. A function call always assigns values to all parameters\nmentioned in the parameter list, either from position arguments, from\nkeyword arguments, or from default values. If the form\n""*identifier"" is present, it is initialized to a tuple receiving any\nexcess positional parameters, defaulting to the empty tuple. If the\nform ""**identifier"" is present, it is initialized to a new\ndictionary receiving any excess keyword arguments, defaulting to a new\nempty dictionary.\n\nIt is also possible to create anonymous functions (functions not bound\nto a name), for immediate use in expressions. This uses lambda\nexpressions, described in section *Lambdas*. Note that the lambda\nexpression is merely a shorthand for a simplified function definition;\na function defined in a ""def"" statement can be passed around or\nassigned to another name just like a function defined by a lambda\nexpression. The ""def"" form is actually more powerful since it\nallows the execution of multiple statements.\n\n**Programmer\'s note:** Functions are first-class objects. A ""def""\nform executed inside a function definition defines a local function\nthat can be returned or passed around. Free variables used in the\nnested function can access the local variables of the function\ncontaining the def. See section *Naming and binding* for details.\n\n\nClass definitions\n=================\n\nA class definition defines a class object (see section *The standard\ntype hierarchy*):\n\n classdef ::= "class" classname [inheritance] ":" suite\n inheritance ::= "(" [expression_list] ")"\n classname ::= identifier\n\nA class definition is an executable statement. It first evaluates the\ninheritance list, if present. Each item in the inheritance list\nshould evaluate to a class object or class type which allows\nsubclassing. The class\'s suite is then executed in a new execution\nframe (see section *Naming and binding*), using a newly created local\nnamespace and the original global namespace. (Usually, the suite\ncontains only function definitions.) 
When the class\'s suite finishes\nexecution, its execution frame is discarded but its local namespace is\nsaved. [4] A class object is then created using the inheritance list\nfor the base classes and the saved local namespace for the attribute\ndictionary. The class name is bound to this class object in the\noriginal local namespace.\n\n**Programmer\'s note:** Variables defined in the class definition are\nclass variables; they are shared by all instances. To create instance\nvariables, they can be set in a method with "self.name = value". Both\nclass and instance variables are accessible through the notation\n""self.name"", and an instance variable hides a class variable with\nthe same name when accessed in this way. Class variables can be used\nas defaults for instance variables, but using mutable values there can\nlead to unexpected results. For *new-style class*es, descriptors can\nbe used to create instance variables with different implementation\ndetails.\n\nClass definitions, like function definitions, may be wrapped by one or\nmore *decorator* expressions. The evaluation rules for the decorator\nexpressions are the same as for functions. The result must be a class\nobject, which is then bound to the class name.\n\n-[ Footnotes ]-\n\n[1] The exception is propagated to the invocation stack unless\n there is a "finally" clause which happens to raise another\n exception. That new exception causes the old one to be lost.\n\n[2] Currently, control "flows off the end" except in the case of\n an exception or the execution of a "return", "continue", or\n "break" statement.\n\n[3] A string literal appearing as the first statement in the\n function body is transformed into the function\'s "__doc__"\n attribute and therefore the function\'s *docstring*.\n\n[4] A string literal appearing as the first statement in the class\n body is transformed into the namespace\'s "__doc__" item and\n therefore the class\'s *docstring*.\n', + 'context-managers': u'\nWith Statement Context Managers\n*******************************\n\nNew in version 2.5.\n\nA *context manager* is an object that defines the runtime context to\nbe established when executing a "with" statement. The context manager\nhandles the entry into, and the exit from, the desired runtime context\nfor the execution of the block of code. Context managers are normally\ninvoked using the "with" statement (described in section *The with\nstatement*), but can also be used by directly invoking their methods.\n\nTypical uses of context managers include saving and restoring various\nkinds of global state, locking and unlocking resources, closing opened\nfiles, etc.\n\nFor more information on context managers, see *Context Manager Types*.\n\nobject.__enter__(self)\n\n Enter the runtime context related to this object. The "with"\n statement will bind this method\'s return value to the target(s)\n specified in the "as" clause of the statement, if any.\n\nobject.__exit__(self, exc_type, exc_value, traceback)\n\n Exit the runtime context related to this object. The parameters\n describe the exception that caused the context to be exited. If the\n context was exited without an exception, all three arguments will\n be "None".\n\n If an exception is supplied, and the method wishes to suppress the\n exception (i.e., prevent it from being propagated), it should\n return a true value. 
Otherwise, the exception will be processed\n normally upon exit from this method.\n\n Note that "__exit__()" methods should not reraise the passed-in\n exception; this is the caller\'s responsibility.\n\nSee also: **PEP 0343** - The "with" statement\n\n The specification, background, and examples for the Python "with"\n statement.\n', + 'continue': u'\nThe "continue" statement\n************************\n\n continue_stmt ::= "continue"\n\n"continue" may only occur syntactically nested in a "for" or "while"\nloop, but not nested in a function or class definition or "finally"\nclause within that loop. It continues with the next cycle of the\nnearest enclosing loop.\n\nWhen "continue" passes control out of a "try" statement with a\n"finally" clause, that "finally" clause is executed before really\nstarting the next loop cycle.\n', + 'conversions': u'\nArithmetic conversions\n**********************\n\nWhen a description of an arithmetic operator below uses the phrase\n"the numeric arguments are converted to a common type," the arguments\nare coerced using the coercion rules listed at *Coercion rules*. If\nboth arguments are standard numeric types, the following coercions are\napplied:\n\n* If either argument is a complex number, the other is converted to\n complex;\n\n* otherwise, if either argument is a floating point number, the\n other is converted to floating point;\n\n* otherwise, if either argument is a long integer, the other is\n converted to long integer;\n\n* otherwise, both must be plain integers and no conversion is\n necessary.\n\nSome additional rules apply for certain operators (e.g., a string left\nargument to the \'%\' operator). Extensions can define their own\ncoercions.\n', + 'customization': u'\nBasic customization\n*******************\n\nobject.__new__(cls[, ...])\n\n Called to create a new instance of class *cls*. "__new__()" is a\n static method (special-cased so you need not declare it as such)\n that takes the class of which an instance was requested as its\n first argument. The remaining arguments are those passed to the\n object constructor expression (the call to the class). The return\n value of "__new__()" should be the new object instance (usually an\n instance of *cls*).\n\n Typical implementations create a new instance of the class by\n invoking the superclass\'s "__new__()" method using\n "super(currentclass, cls).__new__(cls[, ...])" with appropriate\n arguments and then modifying the newly-created instance as\n necessary before returning it.\n\n If "__new__()" returns an instance of *cls*, then the new\n instance\'s "__init__()" method will be invoked like\n "__init__(self[, ...])", where *self* is the new instance and the\n remaining arguments are the same as were passed to "__new__()".\n\n If "__new__()" does not return an instance of *cls*, then the new\n instance\'s "__init__()" method will not be invoked.\n\n "__new__()" is intended mainly to allow subclasses of immutable\n types (like int, str, or tuple) to customize instance creation. It\n is also commonly overridden in custom metaclasses in order to\n customize class creation.\n\nobject.__init__(self[, ...])\n\n Called when the instance is created. The arguments are those\n passed to the class constructor expression. If a base class has an\n "__init__()" method, the derived class\'s "__init__()" method, if\n any, must explicitly call it to ensure proper initialization of the\n base class part of the instance; for example:\n "BaseClass.__init__(self, [args...])". 
As a special constraint on\n constructors, no value may be returned; doing so will cause a\n "TypeError" to be raised at runtime.\n\nobject.__del__(self)\n\n Called when the instance is about to be destroyed. This is also\n called a destructor. If a base class has a "__del__()" method, the\n derived class\'s "__del__()" method, if any, must explicitly call it\n to ensure proper deletion of the base class part of the instance.\n Note that it is possible (though not recommended!) for the\n "__del__()" method to postpone destruction of the instance by\n creating a new reference to it. It may then be called at a later\n time when this new reference is deleted. It is not guaranteed that\n "__del__()" methods are called for objects that still exist when\n the interpreter exits.\n\n Note: "del x" doesn\'t directly call "x.__del__()" --- the former\n decrements the reference count for "x" by one, and the latter is\n only called when "x"\'s reference count reaches zero. Some common\n situations that may prevent the reference count of an object from\n going to zero include: circular references between objects (e.g.,\n a doubly-linked list or a tree data structure with parent and\n child pointers); a reference to the object on the stack frame of\n a function that caught an exception (the traceback stored in\n "sys.exc_traceback" keeps the stack frame alive); or a reference\n to the object on the stack frame that raised an unhandled\n exception in interactive mode (the traceback stored in\n "sys.last_traceback" keeps the stack frame alive). The first\n situation can only be remedied by explicitly breaking the cycles;\n the latter two situations can be resolved by storing "None" in\n "sys.exc_traceback" or "sys.last_traceback". Circular references\n which are garbage are detected when the option cycle detector is\n enabled (it\'s on by default), but can only be cleaned up if there\n are no Python-level "__del__()" methods involved. Refer to the\n documentation for the "gc" module for more information about how\n "__del__()" methods are handled by the cycle detector,\n particularly the description of the "garbage" value.\n\n Warning: Due to the precarious circumstances under which\n "__del__()" methods are invoked, exceptions that occur during\n their execution are ignored, and a warning is printed to\n "sys.stderr" instead. Also, when "__del__()" is invoked in\n response to a module being deleted (e.g., when execution of the\n program is done), other globals referenced by the "__del__()"\n method may already have been deleted or in the process of being\n torn down (e.g. the import machinery shutting down). For this\n reason, "__del__()" methods should do the absolute minimum needed\n to maintain external invariants. Starting with version 1.5,\n Python guarantees that globals whose name begins with a single\n underscore are deleted from their module before other globals are\n deleted; if no other references to such globals exist, this may\n help in assuring that imported modules are still available at the\n time when the "__del__()" method is called.\n\n See also the *-R* command-line option.\n\nobject.__repr__(self)\n\n Called by the "repr()" built-in function and by string conversions\n (reverse quotes) to compute the "official" string representation of\n an object. If at all possible, this should look like a valid\n Python expression that could be used to recreate an object with the\n same value (given an appropriate environment). 
If this is not\n possible, a string of the form "<...some useful description...>"\n should be returned. The return value must be a string object. If a\n class defines "__repr__()" but not "__str__()", then "__repr__()"\n is also used when an "informal" string representation of instances\n of that class is required.\n\n This is typically used for debugging, so it is important that the\n representation is information-rich and unambiguous.\n\nobject.__str__(self)\n\n Called by the "str()" built-in function and by the "print"\n statement to compute the "informal" string representation of an\n object. This differs from "__repr__()" in that it does not have to\n be a valid Python expression: a more convenient or concise\n representation may be used instead. The return value must be a\n string object.\n\nobject.__lt__(self, other)\nobject.__le__(self, other)\nobject.__eq__(self, other)\nobject.__ne__(self, other)\nobject.__gt__(self, other)\nobject.__ge__(self, other)\n\n New in version 2.1.\n\n These are the so-called "rich comparison" methods, and are called\n for comparison operators in preference to "__cmp__()" below. The\n correspondence between operator symbols and method names is as\n follows: "xy" call "x.__ne__(y)",\n "x>y" calls "x.__gt__(y)", and "x>=y" calls "x.__ge__(y)".\n\n A rich comparison method may return the singleton "NotImplemented"\n if it does not implement the operation for a given pair of\n arguments. By convention, "False" and "True" are returned for a\n successful comparison. However, these methods can return any value,\n so if the comparison operator is used in a Boolean context (e.g.,\n in the condition of an "if" statement), Python will call "bool()"\n on the value to determine if the result is true or false.\n\n There are no implied relationships among the comparison operators.\n The truth of "x==y" does not imply that "x!=y" is false.\n Accordingly, when defining "__eq__()", one should also define\n "__ne__()" so that the operators will behave as expected. See the\n paragraph on "__hash__()" for some important notes on creating\n *hashable* objects which support custom comparison operations and\n are usable as dictionary keys.\n\n There are no swapped-argument versions of these methods (to be used\n when the left argument does not support the operation but the right\n argument does); rather, "__lt__()" and "__gt__()" are each other\'s\n reflection, "__le__()" and "__ge__()" are each other\'s reflection,\n and "__eq__()" and "__ne__()" are their own reflection.\n\n Arguments to rich comparison methods are never coerced.\n\n To automatically generate ordering operations from a single root\n operation, see "functools.total_ordering()".\n\nobject.__cmp__(self, other)\n\n Called by comparison operations if rich comparison (see above) is\n not defined. Should return a negative integer if "self < other",\n zero if "self == other", a positive integer if "self > other". If\n no "__cmp__()", "__eq__()" or "__ne__()" operation is defined,\n class instances are compared by object identity ("address"). See\n also the description of "__hash__()" for some important notes on\n creating *hashable* objects which support custom comparison\n operations and are usable as dictionary keys. 
(Note: the\n restriction that exceptions are not propagated by "__cmp__()" has\n been removed since Python 1.5.)\n\nobject.__rcmp__(self, other)\n\n Changed in version 2.1: No longer supported.\n\nobject.__hash__(self)\n\n Called by built-in function "hash()" and for operations on members\n of hashed collections including "set", "frozenset", and "dict".\n "__hash__()" should return an integer. The only required property\n is that objects which compare equal have the same hash value; it is\n advised to somehow mix together (e.g. using exclusive or) the hash\n values for the components of the object that also play a part in\n comparison of objects.\n\n If a class does not define a "__cmp__()" or "__eq__()" method it\n should not define a "__hash__()" operation either; if it defines\n "__cmp__()" or "__eq__()" but not "__hash__()", its instances will\n not be usable in hashed collections. If a class defines mutable\n objects and implements a "__cmp__()" or "__eq__()" method, it\n should not implement "__hash__()", since hashable collection\n implementations require that a object\'s hash value is immutable (if\n the object\'s hash value changes, it will be in the wrong hash\n bucket).\n\n User-defined classes have "__cmp__()" and "__hash__()" methods by\n default; with them, all objects compare unequal (except with\n themselves) and "x.__hash__()" returns a result derived from\n "id(x)".\n\n Classes which inherit a "__hash__()" method from a parent class but\n change the meaning of "__cmp__()" or "__eq__()" such that the hash\n value returned is no longer appropriate (e.g. by switching to a\n value-based concept of equality instead of the default identity\n based equality) can explicitly flag themselves as being unhashable\n by setting "__hash__ = None" in the class definition. Doing so\n means that not only will instances of the class raise an\n appropriate "TypeError" when a program attempts to retrieve their\n hash value, but they will also be correctly identified as\n unhashable when checking "isinstance(obj, collections.Hashable)"\n (unlike classes which define their own "__hash__()" to explicitly\n raise "TypeError").\n\n Changed in version 2.5: "__hash__()" may now also return a long\n integer object; the 32-bit integer is then derived from the hash of\n that object.\n\n Changed in version 2.6: "__hash__" may now be set to "None" to\n explicitly flag instances of a class as unhashable.\n\nobject.__nonzero__(self)\n\n Called to implement truth value testing and the built-in operation\n "bool()"; should return "False" or "True", or their integer\n equivalents "0" or "1". When this method is not defined,\n "__len__()" is called, if it is defined, and the object is\n considered true if its result is nonzero. If a class defines\n neither "__len__()" nor "__nonzero__()", all its instances are\n considered true.\n\nobject.__unicode__(self)\n\n Called to implement "unicode()" built-in; should return a Unicode\n object. When this method is not defined, string conversion is\n attempted, and the result of string conversion is converted to\n Unicode using the system default encoding.\n', + 'debugger': u'\n"pdb" --- The Python Debugger\n*****************************\n\n**Source code:** Lib/pdb.py\n\n======================================================================\n\nThe module "pdb" defines an interactive source code debugger for\nPython programs. 
It supports setting (conditional) breakpoints and\nsingle stepping at the source line level, inspection of stack frames,\nsource code listing, and evaluation of arbitrary Python code in the\ncontext of any stack frame. It also supports post-mortem debugging\nand can be called under program control.\n\nThe debugger is extensible --- it is actually defined as the class\n"Pdb". This is currently undocumented but easily understood by reading\nthe source. The extension interface uses the modules "bdb" and "cmd".\n\nThe debugger\'s prompt is "(Pdb)". Typical usage to run a program under\ncontrol of the debugger is:\n\n >>> import pdb\n >>> import mymodule\n >>> pdb.run(\'mymodule.test()\')\n > (0)?()\n (Pdb) continue\n > (1)?()\n (Pdb) continue\n NameError: \'spam\'\n > (1)?()\n (Pdb)\n\n"pdb.py" can also be invoked as a script to debug other scripts. For\nexample:\n\n python -m pdb myscript.py\n\nWhen invoked as a script, pdb will automatically enter post-mortem\ndebugging if the program being debugged exits abnormally. After post-\nmortem debugging (or after normal exit of the program), pdb will\nrestart the program. Automatic restarting preserves pdb\'s state (such\nas breakpoints) and in most cases is more useful than quitting the\ndebugger upon program\'s exit.\n\nNew in version 2.4: Restarting post-mortem behavior added.\n\nThe typical usage to break into the debugger from a running program is\nto insert\n\n import pdb; pdb.set_trace()\n\nat the location you want to break into the debugger. You can then\nstep through the code following this statement, and continue running\nwithout the debugger using the "c" command.\n\nThe typical usage to inspect a crashed program is:\n\n >>> import pdb\n >>> import mymodule\n >>> mymodule.test()\n Traceback (most recent call last):\n File "", line 1, in ?\n File "./mymodule.py", line 4, in test\n test2()\n File "./mymodule.py", line 3, in test2\n print spam\n NameError: spam\n >>> pdb.pm()\n > ./mymodule.py(3)test2()\n -> print spam\n (Pdb)\n\nThe module defines the following functions; each enters the debugger\nin a slightly different way:\n\npdb.run(statement[, globals[, locals]])\n\n Execute the *statement* (given as a string) under debugger control.\n The debugger prompt appears before any code is executed; you can\n set breakpoints and type "continue", or you can step through the\n statement using "step" or "next" (all these commands are explained\n below). The optional *globals* and *locals* arguments specify the\n environment in which the code is executed; by default the\n dictionary of the module "__main__" is used. (See the explanation\n of the "exec" statement or the "eval()" built-in function.)\n\npdb.runeval(expression[, globals[, locals]])\n\n Evaluate the *expression* (given as a string) under debugger\n control. When "runeval()" returns, it returns the value of the\n expression. Otherwise this function is similar to "run()".\n\npdb.runcall(function[, argument, ...])\n\n Call the *function* (a function or method object, not a string)\n with the given arguments. When "runcall()" returns, it returns\n whatever the function call returned. The debugger prompt appears\n as soon as the function is entered.\n\npdb.set_trace()\n\n Enter the debugger at the calling stack frame. This is useful to\n hard-code a breakpoint at a given point in a program, even if the\n code is not otherwise being debugged (e.g. when an assertion\n fails).\n\npdb.post_mortem([traceback])\n\n Enter post-mortem debugging of the given *traceback* object. 
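To make those entry points concrete, a small sketch (a hypothetical buggy() function is assumed) of hard-coding a breakpoint versus inspecting a crash after the fact:

   import pdb
   import sys

   def buggy():
       spam = {}
       return spam['missing']            # raises KeyError

   # 1. Hard-code a breakpoint just before a suspect line:
   #    import pdb; pdb.set_trace()
   #
   # 2. Or debug the traceback of an exception that was just caught:
   try:
       buggy()
   except KeyError:
       pdb.post_mortem(sys.exc_info()[2])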
If no\n *traceback* is given, it uses the one of the exception that is\n currently being handled (an exception must be being handled if the\n default is to be used).\n\npdb.pm()\n\n Enter post-mortem debugging of the traceback found in\n "sys.last_traceback".\n\nThe "run*" functions and "set_trace()" are aliases for instantiating\nthe "Pdb" class and calling the method of the same name. If you want\nto access further features, you have to do this yourself:\n\nclass class pdb.Pdb(completekey=\'tab\', stdin=None, stdout=None, skip=None)\n\n "Pdb" is the debugger class.\n\n The *completekey*, *stdin* and *stdout* arguments are passed to the\n underlying "cmd.Cmd" class; see the description there.\n\n The *skip* argument, if given, must be an iterable of glob-style\n module name patterns. The debugger will not step into frames that\n originate in a module that matches one of these patterns. [1]\n\n Example call to enable tracing with *skip*:\n\n import pdb; pdb.Pdb(skip=[\'django.*\']).set_trace()\n\n New in version 2.7: The *skip* argument.\n\n run(statement[, globals[, locals]])\n runeval(expression[, globals[, locals]])\n runcall(function[, argument, ...])\n set_trace()\n\n See the documentation for the functions explained above.\n', + 'del': u'\nThe "del" statement\n*******************\n\n del_stmt ::= "del" target_list\n\nDeletion is recursively defined very similar to the way assignment is\ndefined. Rather than spelling it out in full details, here are some\nhints.\n\nDeletion of a target list recursively deletes each target, from left\nto right.\n\nDeletion of a name removes the binding of that name from the local or\nglobal namespace, depending on whether the name occurs in a "global"\nstatement in the same code block. If the name is unbound, a\n"NameError" exception will be raised.\n\nIt is illegal to delete a name from the local namespace if it occurs\nas a free variable in a nested block.\n\nDeletion of attribute references, subscriptions and slicings is passed\nto the primary object involved; deletion of a slicing is in general\nequivalent to assignment of an empty slice of the right type (but even\nthis is determined by the sliced object).\n', + 'dict': u'\nDictionary displays\n*******************\n\nA dictionary display is a possibly empty series of key/datum pairs\nenclosed in curly braces:\n\n dict_display ::= "{" [key_datum_list | dict_comprehension] "}"\n key_datum_list ::= key_datum ("," key_datum)* [","]\n key_datum ::= expression ":" expression\n dict_comprehension ::= expression ":" expression comp_for\n\nA dictionary display yields a new dictionary object.\n\nIf a comma-separated sequence of key/datum pairs is given, they are\nevaluated from left to right to define the entries of the dictionary:\neach key object is used as a key into the dictionary to store the\ncorresponding datum. This means that you can specify the same key\nmultiple times in the key/datum list, and the final dictionary\'s value\nfor that key will be the last one given.\n\nA dict comprehension, in contrast to list and set comprehensions,\nneeds two expressions separated with a colon followed by the usual\n"for" and "if" clauses. When the comprehension is run, the resulting\nkey and value elements are inserted in the new dictionary in the order\nthey are produced.\n\nRestrictions on the types of the key values are listed earlier in\nsection *The standard type hierarchy*. (To summarize, the key type\nshould be *hashable*, which excludes all mutable objects.) 
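A brief sketch of the display forms described above, including a dict comprehension and the rejection of a mutable key:

   >>> {'x': 1, 'x': 2}                # the same key twice: the last datum wins
   {'x': 2}
   >>> {n: n * n for n in range(4)}    # dict comprehension (2.7+)
   {0: 0, 1: 1, 2: 4, 3: 9}
   >>> {[1, 2]: 'no'}                  # mutable keys are not hashable
   Traceback (most recent call last):
     ...
   TypeError: unhashable type: 'list'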
Clashes\nbetween duplicate keys are not detected; the last datum (textually\nrightmost in the display) stored for a given key value prevails.\n', + 'dynamic-features': u'\nInteraction with dynamic features\n*********************************\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. An error will be reported at compile time.\n\nIf the wild card form of import --- "import *" --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a "SyntaxError".\n\nIf "exec" is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n"SyntaxError" unless the exec explicitly specifies the local namespace\nfor the "exec". (In other words, "exec obj" would be illegal, but\n"exec obj in ns" would be legal.)\n\nThe "eval()", "execfile()", and "input()" functions and the "exec"\nstatement do not have access to the full environment for resolving\nnames. Names may be resolved in the local and global namespaces of\nthe caller. Free variables are not resolved in the nearest enclosing\nnamespace, but in the global namespace. [1] The "exec" statement and\nthe "eval()" and "execfile()" functions have optional arguments to\noverride the global and local namespace. If only one namespace is\nspecified, it is used for both.\n', + 'else': u'\nThe "if" statement\n******************\n\nThe "if" statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the "if" statement is executed or evaluated).\nIf all expressions are false, the suite of the "else" clause, if\npresent, is executed.\n', + 'exceptions': u'\nExceptions\n**********\n\nExceptions are a means of breaking out of the normal flow of control\nof a code block in order to handle errors or other exceptional\nconditions. An exception is *raised* at the point where the error is\ndetected; it may be *handled* by the surrounding code block or by any\ncode block that directly or indirectly invoked the code block where\nthe error occurred.\n\nThe Python interpreter raises an exception when it detects a run-time\nerror (such as division by zero). A Python program can also\nexplicitly raise an exception with the "raise" statement. Exception\nhandlers are specified with the "try" ... "except" statement. The\n"finally" clause of such a statement can be used to specify cleanup\ncode which does not handle the exception, but is executed whether an\nexception occurred or not in the preceding code.\n\nPython uses the "termination" model of error handling: an exception\nhandler can find out what happened and continue execution at an outer\nlevel, but it cannot repair the cause of the error and retry the\nfailing operation (except by re-entering the offending piece of code\nfrom the top).\n\nWhen an exception is not handled at all, the interpreter terminates\nexecution of the program, or returns to its interactive main loop. In\neither case, it prints a stack backtrace, except when the exception is\n"SystemExit".\n\nExceptions are identified by class instances. 
The "except" clause is\nselected depending on the class of the instance: it must reference the\nclass of the instance or a base class thereof. The instance can be\nreceived by the handler and can carry additional information about the\nexceptional condition.\n\nExceptions can also be identified by strings, in which case the\n"except" clause is selected by object identity. An arbitrary value\ncan be raised along with the identifying string which can be passed to\nthe handler.\n\nNote: Messages to exceptions are not part of the Python API. Their\n contents may change from one version of Python to the next without\n warning and should not be relied on by code which will run under\n multiple versions of the interpreter.\n\nSee also the description of the "try" statement in section *The try\nstatement* and "raise" statement in section *The raise statement*.\n\n-[ Footnotes ]-\n\n[1] This limitation occurs because the code that is executed by\n these operations is not available at the time the module is\n compiled.\n', + 'exec': u'\nThe "exec" statement\n********************\n\n exec_stmt ::= "exec" or_expr ["in" expression ["," expression]]\n\nThis statement supports dynamic execution of Python code. The first\nexpression should evaluate to either a Unicode string, a *Latin-1*\nencoded string, an open file object, a code object, or a tuple. If it\nis a string, the string is parsed as a suite of Python statements\nwhich is then executed (unless a syntax error occurs). [1] If it is an\nopen file, the file is parsed until EOF and executed. If it is a code\nobject, it is simply executed. For the interpretation of a tuple, see\nbelow. In all cases, the code that\'s executed is expected to be valid\nas file input (see section *File input*). Be aware that the "return"\nand "yield" statements may not be used outside of function definitions\neven within the context of code passed to the "exec" statement.\n\nIn all cases, if the optional parts are omitted, the code is executed\nin the current scope. If only the first expression after "in" is\nspecified, it should be a dictionary, which will be used for both the\nglobal and the local variables. If two expressions are given, they\nare used for the global and local variables, respectively. If\nprovided, *locals* can be any mapping object. Remember that at module\nlevel, globals and locals are the same dictionary. If two separate\nobjects are given as *globals* and *locals*, the code will be executed\nas if it were embedded in a class definition.\n\nThe first expression may also be a tuple of length 2 or 3. In this\ncase, the optional parts must be omitted. The form "exec(expr,\nglobals)" is equivalent to "exec expr in globals", while the form\n"exec(expr, globals, locals)" is equivalent to "exec expr in globals,\nlocals". The tuple form of "exec" provides compatibility with Python\n3, where "exec" is a function rather than a statement.\n\nChanged in version 2.4: Formerly, *locals* was required to be a\ndictionary.\n\nAs a side effect, an implementation may insert additional keys into\nthe dictionaries given besides those corresponding to variable names\nset by the executed code. For example, the current implementation may\nadd a reference to the dictionary of the built-in module "__builtin__"\nunder the key "__builtins__" (!).\n\n**Programmer\'s hints:** dynamic evaluation of expressions is supported\nby the built-in function "eval()". 
The built-in functions "globals()"\nand "locals()" return the current global and local dictionary,\nrespectively, which may be useful to pass around for use by "exec".\n\n-[ Footnotes ]-\n\n[1] Note that the parser only accepts the Unix-style end of line\n convention. If you are reading the code from a file, make sure to\n use *universal newlines* mode to convert Windows or Mac-style\n newlines.\n', + 'execmodel': u'\nExecution model\n***************\n\n\nNaming and binding\n==================\n\n*Names* refer to objects. Names are introduced by name binding\noperations. Each occurrence of a name in the program text refers to\nthe *binding* of that name established in the innermost function block\ncontaining the use.\n\nA *block* is a piece of Python program text that is executed as a\nunit. The following are blocks: a module, a function body, and a class\ndefinition. Each command typed interactively is a block. A script\nfile (a file given as standard input to the interpreter or specified\non the interpreter command line the first argument) is a code block.\nA script command (a command specified on the interpreter command line\nwith the \'**-c**\' option) is a code block. The file read by the\nbuilt-in function "execfile()" is a code block. The string argument\npassed to the built-in function "eval()" and to the "exec" statement\nis a code block. The expression read and evaluated by the built-in\nfunction "input()" is a code block.\n\nA code block is executed in an *execution frame*. A frame contains\nsome administrative information (used for debugging) and determines\nwhere and how execution continues after the code block\'s execution has\ncompleted.\n\nA *scope* defines the visibility of a name within a block. If a local\nvariable is defined in a block, its scope includes that block. If the\ndefinition occurs in a function block, the scope extends to any blocks\ncontained within the defining one, unless a contained block introduces\na different binding for the name. The scope of names defined in a\nclass block is limited to the class block; it does not extend to the\ncode blocks of methods -- this includes generator expressions since\nthey are implemented using a function scope. This means that the\nfollowing will fail:\n\n class A:\n a = 42\n b = list(a + i for i in range(10))\n\nWhen a name is used in a code block, it is resolved using the nearest\nenclosing scope. The set of all such scopes visible to a code block\nis called the block\'s *environment*.\n\nIf a name is bound in a block, it is a local variable of that block.\nIf a name is bound at the module level, it is a global variable. (The\nvariables of the module code block are local and global.) If a\nvariable is used in a code block but not defined there, it is a *free\nvariable*.\n\nWhen a name is not found at all, a "NameError" exception is raised.\nIf the name refers to a local variable that has not been bound, a\n"UnboundLocalError" exception is raised. "UnboundLocalError" is a\nsubclass of "NameError".\n\nThe following constructs bind names: formal parameters to functions,\n"import" statements, class and function definitions (these bind the\nclass or function name in the defining block), and targets that are\nidentifiers if occurring in an assignment, "for" loop header, in the\nsecond position of an "except" clause header or after "as" in a "with"\nstatement. The "import" statement of the form "from ... import *"\nbinds all names defined in the imported module, except those beginning\nwith an underscore. 
This form may only be used at the module level.\n\nA target occurring in a "del" statement is also considered bound for\nthis purpose (though the actual semantics are to unbind the name). It\nis illegal to unbind a name that is referenced by an enclosing scope;\nthe compiler will report a "SyntaxError".\n\nEach assignment or import statement occurs within a block defined by a\nclass or function definition or at the module level (the top-level\ncode block).\n\nIf a name binding operation occurs anywhere within a code block, all\nuses of the name within the block are treated as references to the\ncurrent block. This can lead to errors when a name is used within a\nblock before it is bound. This rule is subtle. Python lacks\ndeclarations and allows name binding operations to occur anywhere\nwithin a code block. The local variables of a code block can be\ndetermined by scanning the entire text of the block for name binding\noperations.\n\nIf the global statement occurs within a block, all uses of the name\nspecified in the statement refer to the binding of that name in the\ntop-level namespace. Names are resolved in the top-level namespace by\nsearching the global namespace, i.e. the namespace of the module\ncontaining the code block, and the builtins namespace, the namespace\nof the module "__builtin__". The global namespace is searched first.\nIf the name is not found there, the builtins namespace is searched.\nThe global statement must precede all uses of the name.\n\nThe builtins namespace associated with the execution of a code block\nis actually found by looking up the name "__builtins__" in its global\nnamespace; this should be a dictionary or a module (in the latter case\nthe module\'s dictionary is used). By default, when in the "__main__"\nmodule, "__builtins__" is the built-in module "__builtin__" (note: no\n\'s\'); when in any other module, "__builtins__" is an alias for the\ndictionary of the "__builtin__" module itself. "__builtins__" can be\nset to a user-created dictionary to create a weak form of restricted\nexecution.\n\n**CPython implementation detail:** Users should not touch\n"__builtins__"; it is strictly an implementation detail. Users\nwanting to override values in the builtins namespace should "import"\nthe "__builtin__" (no \'s\') module and modify its attributes\nappropriately.\n\nThe namespace for a module is automatically created the first time a\nmodule is imported. The main module for a script is always called\n"__main__".\n\nThe "global" statement has the same scope as a name binding operation\nin the same block. If the nearest enclosing scope for a free variable\ncontains a global statement, the free variable is treated as a global.\n\nA class definition is an executable statement that may use and define\nnames. These references follow the normal rules for name resolution.\nThe namespace of the class definition becomes the attribute dictionary\nof the class. Names defined at the class scope are not visible in\nmethods.\n\n\nInteraction with dynamic features\n---------------------------------\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. 
An error will be reported at compile time.\n\nIf the wild card form of import --- "import *" --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a "SyntaxError".\n\nIf "exec" is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n"SyntaxError" unless the exec explicitly specifies the local namespace\nfor the "exec". (In other words, "exec obj" would be illegal, but\n"exec obj in ns" would be legal.)\n\nThe "eval()", "execfile()", and "input()" functions and the "exec"\nstatement do not have access to the full environment for resolving\nnames. Names may be resolved in the local and global namespaces of\nthe caller. Free variables are not resolved in the nearest enclosing\nnamespace, but in the global namespace. [1] The "exec" statement and\nthe "eval()" and "execfile()" functions have optional arguments to\noverride the global and local namespace. If only one namespace is\nspecified, it is used for both.\n\n\nExceptions\n==========\n\nExceptions are a means of breaking out of the normal flow of control\nof a code block in order to handle errors or other exceptional\nconditions. An exception is *raised* at the point where the error is\ndetected; it may be *handled* by the surrounding code block or by any\ncode block that directly or indirectly invoked the code block where\nthe error occurred.\n\nThe Python interpreter raises an exception when it detects a run-time\nerror (such as division by zero). A Python program can also\nexplicitly raise an exception with the "raise" statement. Exception\nhandlers are specified with the "try" ... "except" statement. The\n"finally" clause of such a statement can be used to specify cleanup\ncode which does not handle the exception, but is executed whether an\nexception occurred or not in the preceding code.\n\nPython uses the "termination" model of error handling: an exception\nhandler can find out what happened and continue execution at an outer\nlevel, but it cannot repair the cause of the error and retry the\nfailing operation (except by re-entering the offending piece of code\nfrom the top).\n\nWhen an exception is not handled at all, the interpreter terminates\nexecution of the program, or returns to its interactive main loop. In\neither case, it prints a stack backtrace, except when the exception is\n"SystemExit".\n\nExceptions are identified by class instances. The "except" clause is\nselected depending on the class of the instance: it must reference the\nclass of the instance or a base class thereof. The instance can be\nreceived by the handler and can carry additional information about the\nexceptional condition.\n\nExceptions can also be identified by strings, in which case the\n"except" clause is selected by object identity. An arbitrary value\ncan be raised along with the identifying string which can be passed to\nthe handler.\n\nNote: Messages to exceptions are not part of the Python API. 
Their\n contents may change from one version of Python to the next without\n warning and should not be relied on by code which will run under\n multiple versions of the interpreter.\n\nSee also the description of the "try" statement in section *The try\nstatement* and "raise" statement in section *The raise statement*.\n\n-[ Footnotes ]-\n\n[1] This limitation occurs because the code that is executed by\n these operations is not available at the time the module is\n compiled.\n', + 'exprlists': u'\nExpression lists\n****************\n\n expression_list ::= expression ( "," expression )* [","]\n\nAn expression list containing at least one comma yields a tuple. The\nlength of the tuple is the number of expressions in the list. The\nexpressions are evaluated from left to right.\n\nThe trailing comma is required only to create a single tuple (a.k.a. a\n*singleton*); it is optional in all other cases. A single expression\nwithout a trailing comma doesn\'t create a tuple, but rather yields the\nvalue of that expression. (To create an empty tuple, use an empty pair\nof parentheses: "()".)\n', + 'floating': u'\nFloating point literals\n***********************\n\nFloating point literals are described by the following lexical\ndefinitions:\n\n floatnumber ::= pointfloat | exponentfloat\n pointfloat ::= [intpart] fraction | intpart "."\n exponentfloat ::= (intpart | pointfloat) exponent\n intpart ::= digit+\n fraction ::= "." digit+\n exponent ::= ("e" | "E") ["+" | "-"] digit+\n\nNote that the integer and exponent parts of floating point numbers can\nlook like octal integers, but are interpreted using radix 10. For\nexample, "077e010" is legal, and denotes the same number as "77e10".\nThe allowed range of floating point literals is implementation-\ndependent. Some examples of floating point literals:\n\n 3.14 10. .001 1e100 3.14e-10 0e0\n\nNote that numeric literals do not include a sign; a phrase like "-1"\nis actually an expression composed of the unary operator "-" and the\nliteral "1".\n', + 'for': u'\nThe "for" statement\n*******************\n\nThe "for" statement is used to iterate over the elements of a sequence\n(such as a string, tuple or list) or other iterable object:\n\n for_stmt ::= "for" target_list "in" expression_list ":" suite\n ["else" ":" suite]\n\nThe expression list is evaluated once; it should yield an iterable\nobject. An iterator is created for the result of the\n"expression_list". The suite is then executed once for each item\nprovided by the iterator, in the order of ascending indices. Each\nitem in turn is assigned to the target list using the standard rules\nfor assignments, and then the suite is executed. When the items are\nexhausted (which is immediately when the sequence is empty), the suite\nin the "else" clause, if present, is executed, and the loop\nterminates.\n\nA "break" statement executed in the first suite terminates the loop\nwithout executing the "else" clause\'s suite. A "continue" statement\nexecuted in the first suite skips the rest of the suite and continues\nwith the next item, or with the "else" clause if there was no next\nitem.\n\nThe suite may assign to the variable(s) in the target list; this does\nnot affect the next item assigned to it.\n\nThe target list is not deleted when the loop is finished, but if the\nsequence is empty, it will not have been assigned to at all by the\nloop. 
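A short sketch of the "break"/"else" interplay described above:

   def find_divisor(n, candidates):
       for d in candidates:
           if n % d == 0:
               print "found divisor", d
               break
       else:
           # reached only when the loop was not broken out of
           print "no divisor found"

   find_divisor(9, [2, 4, 5])          # prints: no divisor found
   find_divisor(9, [2, 3, 5])          # prints: found divisor 3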
Hint: the built-in function "range()" returns a sequence of\nintegers suitable to emulate the effect of Pascal\'s "for i := a to b\ndo"; e.g., "range(3)" returns the list "[0, 1, 2]".\n\nNote: There is a subtlety when the sequence is being modified by the\n loop (this can only occur for mutable sequences, i.e. lists). An\n internal counter is used to keep track of which item is used next,\n and this is incremented on each iteration. When this counter has\n reached the length of the sequence the loop terminates. This means\n that if the suite deletes the current (or a previous) item from the\n sequence, the next item will be skipped (since it gets the index of\n the current item which has already been treated). Likewise, if the\n suite inserts an item in the sequence before the current item, the\n current item will be treated again the next time through the loop.\n This can lead to nasty bugs that can be avoided by making a\n temporary copy using a slice of the whole sequence, e.g.,\n\n for x in a[:]:\n if x < 0: a.remove(x)\n', + 'formatstrings': u'\nFormat String Syntax\n********************\n\nThe "str.format()" method and the "Formatter" class share the same\nsyntax for format strings (although in the case of "Formatter",\nsubclasses can define their own format string syntax).\n\nFormat strings contain "replacement fields" surrounded by curly braces\n"{}". Anything that is not contained in braces is considered literal\ntext, which is copied unchanged to the output. If you need to include\na brace character in the literal text, it can be escaped by doubling:\n"{{" and "}}".\n\nThe grammar for a replacement field is as follows:\n\n replacement_field ::= "{" [field_name] ["!" conversion] [":" format_spec] "}"\n field_name ::= arg_name ("." attribute_name | "[" element_index "]")*\n arg_name ::= [identifier | integer]\n attribute_name ::= identifier\n element_index ::= integer | index_string\n index_string ::= +\n conversion ::= "r" | "s"\n format_spec ::= \n\nIn less formal terms, the replacement field can start with a\n*field_name* that specifies the object whose value is to be formatted\nand inserted into the output instead of the replacement field. The\n*field_name* is optionally followed by a *conversion* field, which is\npreceded by an exclamation point "\'!\'", and a *format_spec*, which is\npreceded by a colon "\':\'". These specify a non-default format for the\nreplacement value.\n\nSee also the *Format Specification Mini-Language* section.\n\nThe *field_name* itself begins with an *arg_name* that is either a\nnumber or a keyword. If it\'s a number, it refers to a positional\nargument, and if it\'s a keyword, it refers to a named keyword\nargument. If the numerical arg_names in a format string are 0, 1, 2,\n... in sequence, they can all be omitted (not just some) and the\nnumbers 0, 1, 2, ... will be automatically inserted in that order.\nBecause *arg_name* is not quote-delimited, it is not possible to\nspecify arbitrary dictionary keys (e.g., the strings "\'10\'" or\n"\':-]\'") within a format string. The *arg_name* can be followed by any\nnumber of index or attribute expressions. 
An expression of the form\n"\'.name\'" selects the named attribute using "getattr()", while an\nexpression of the form "\'[index]\'" does an index lookup using\n"__getitem__()".\n\nChanged in version 2.7: The positional argument specifiers can be\nomitted, so "\'{} {}\'" is equivalent to "\'{0} {1}\'".\n\nSome simple format string examples:\n\n "First, thou shalt count to {0}" # References first positional argument\n "Bring me a {}" # Implicitly references the first positional argument\n "From {} to {}" # Same as "From {0} to {1}"\n "My quest is {name}" # References keyword argument \'name\'\n "Weight in tons {0.weight}" # \'weight\' attribute of first positional arg\n "Units destroyed: {players[0]}" # First element of keyword argument \'players\'.\n\nThe *conversion* field causes a type coercion before formatting.\nNormally, the job of formatting a value is done by the "__format__()"\nmethod of the value itself. However, in some cases it is desirable to\nforce a type to be formatted as a string, overriding its own\ndefinition of formatting. By converting the value to a string before\ncalling "__format__()", the normal formatting logic is bypassed.\n\nTwo conversion flags are currently supported: "\'!s\'" which calls\n"str()" on the value, and "\'!r\'" which calls "repr()".\n\nSome examples:\n\n "Harold\'s a clever {0!s}" # Calls str() on the argument first\n "Bring out the holy {name!r}" # Calls repr() on the argument first\n\nThe *format_spec* field contains a specification of how the value\nshould be presented, including such details as field width, alignment,\npadding, decimal precision and so on. Each value type can define its\nown "formatting mini-language" or interpretation of the *format_spec*.\n\nMost built-in types support a common formatting mini-language, which\nis described in the next section.\n\nA *format_spec* field can also include nested replacement fields\nwithin it. These nested replacement fields can contain only a field\nname; conversion flags and format specifications are not allowed. The\nreplacement fields within the format_spec are substituted before the\n*format_spec* string is interpreted. This allows the formatting of a\nvalue to be dynamically specified.\n\nSee the *Format examples* section for some examples.\n\n\nFormat Specification Mini-Language\n==================================\n\n"Format specifications" are used within replacement fields contained\nwithin a format string to define how individual values are presented\n(see *Format String Syntax*). They can also be passed directly to the\nbuilt-in "format()" function. Each formattable type may define how\nthe format specification is to be interpreted.\n\nMost built-in types implement the following options for format\nspecifications, although some of the formatting options are only\nsupported by the numeric types.\n\nA general convention is that an empty format string ("""") produces\nthe same result as if you had called "str()" on the value. A non-empty\nformat string typically modifies the result.\n\nThe general form of a *standard format specifier* is:\n\n format_spec ::= [[fill]align][sign][#][0][width][,][.precision][type]\n fill ::= \n align ::= "<" | ">" | "=" | "^"\n sign ::= "+" | "-" | " "\n width ::= integer\n precision ::= integer\n type ::= "b" | "c" | "d" | "e" | "E" | "f" | "F" | "g" | "G" | "n" | "o" | "s" | "x" | "X" | "%"\n\nIf a valid *align* value is specified, it can be preceded by a *fill*\ncharacter that can be any character and defaults to a space if\nomitted. 
Note that it is not possible to use "{" and "}" as *fill*\nchar while using the "str.format()" method; this limitation however\ndoesn\'t affect the "format()" function.\n\nThe meaning of the various alignment options is as follows:\n\n +-----------+------------------------------------------------------------+\n | Option | Meaning |\n +===========+============================================================+\n | "\'<\'" | Forces the field to be left-aligned within the available |\n | | space (this is the default for most objects). |\n +-----------+------------------------------------------------------------+\n | "\'>\'" | Forces the field to be right-aligned within the available |\n | | space (this is the default for numbers). |\n +-----------+------------------------------------------------------------+\n | "\'=\'" | Forces the padding to be placed after the sign (if any) |\n | | but before the digits. This is used for printing fields |\n | | in the form \'+000000120\'. This alignment option is only |\n | | valid for numeric types. |\n +-----------+------------------------------------------------------------+\n | "\'^\'" | Forces the field to be centered within the available |\n | | space. |\n +-----------+------------------------------------------------------------+\n\nNote that unless a minimum field width is defined, the field width\nwill always be the same size as the data to fill it, so that the\nalignment option has no meaning in this case.\n\nThe *sign* option is only valid for number types, and can be one of\nthe following:\n\n +-----------+------------------------------------------------------------+\n | Option | Meaning |\n +===========+============================================================+\n | "\'+\'" | indicates that a sign should be used for both positive as |\n | | well as negative numbers. |\n +-----------+------------------------------------------------------------+\n | "\'-\'" | indicates that a sign should be used only for negative |\n | | numbers (this is the default behavior). |\n +-----------+------------------------------------------------------------+\n | space | indicates that a leading space should be used on positive |\n | | numbers, and a minus sign on negative numbers. |\n +-----------+------------------------------------------------------------+\n\nThe "\'#\'" option is only valid for integers, and only for binary,\noctal, or hexadecimal output. If present, it specifies that the\noutput will be prefixed by "\'0b\'", "\'0o\'", or "\'0x\'", respectively.\n\nThe "\',\'" option signals the use of a comma for a thousands separator.\nFor a locale aware separator, use the "\'n\'" integer presentation type\ninstead.\n\nChanged in version 2.7: Added the "\',\'" option (see also **PEP 378**).\n\n*width* is a decimal integer defining the minimum field width. If not\nspecified, then the field width will be determined by the content.\n\nPreceding the *width* field by a zero ("\'0\'") character enables sign-\naware zero-padding for numeric types. This is equivalent to a *fill*\ncharacter of "\'0\'" with an *alignment* type of "\'=\'".\n\nThe *precision* is a decimal number indicating how many digits should\nbe displayed after the decimal point for a floating point value\nformatted with "\'f\'" and "\'F\'", or before and after the decimal point\nfor a floating point value formatted with "\'g\'" or "\'G\'". For non-\nnumber types the field indicates the maximum field size - in other\nwords, how many characters will be used from the field content. 
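Pulling the pieces described so far together, one hedged example of a full standard format specifier (fill, align, sign, width, thousands separator, precision, type), plus precision applied to a string:

   >>> '{0:*>+12,.2f}'.format(98765.4321)
   '**+98,765.43'
   >>> '{:.5}'.format('truncate me')
   'trunc'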
The\n*precision* is not allowed for integer values.\n\nFinally, the *type* determines how the data should be presented.\n\nThe available string presentation types are:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | "\'s\'" | String format. This is the default type for strings and |\n | | may be omitted. |\n +-----------+------------------------------------------------------------+\n | None | The same as "\'s\'". |\n +-----------+------------------------------------------------------------+\n\nThe available integer presentation types are:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | "\'b\'" | Binary format. Outputs the number in base 2. |\n +-----------+------------------------------------------------------------+\n | "\'c\'" | Character. Converts the integer to the corresponding |\n | | unicode character before printing. |\n +-----------+------------------------------------------------------------+\n | "\'d\'" | Decimal Integer. Outputs the number in base 10. |\n +-----------+------------------------------------------------------------+\n | "\'o\'" | Octal format. Outputs the number in base 8. |\n +-----------+------------------------------------------------------------+\n | "\'x\'" | Hex format. Outputs the number in base 16, using lower- |\n | | case letters for the digits above 9. |\n +-----------+------------------------------------------------------------+\n | "\'X\'" | Hex format. Outputs the number in base 16, using upper- |\n | | case letters for the digits above 9. |\n +-----------+------------------------------------------------------------+\n | "\'n\'" | Number. This is the same as "\'d\'", except that it uses the |\n | | current locale setting to insert the appropriate number |\n | | separator characters. |\n +-----------+------------------------------------------------------------+\n | None | The same as "\'d\'". |\n +-----------+------------------------------------------------------------+\n\nIn addition to the above presentation types, integers can be formatted\nwith the floating point presentation types listed below (except "\'n\'"\nand None). When doing so, "float()" is used to convert the integer to\na floating point number before formatting.\n\nThe available presentation types for floating point and decimal values\nare:\n\n +-----------+------------------------------------------------------------+\n | Type | Meaning |\n +===========+============================================================+\n | "\'e\'" | Exponent notation. Prints the number in scientific |\n | | notation using the letter \'e\' to indicate the exponent. |\n | | The default precision is "6". |\n +-----------+------------------------------------------------------------+\n | "\'E\'" | Exponent notation. Same as "\'e\'" except it uses an upper |\n | | case \'E\' as the separator character. |\n +-----------+------------------------------------------------------------+\n | "\'f\'" | Fixed point. Displays the number as a fixed-point number. |\n | | The default precision is "6". |\n +-----------+------------------------------------------------------------+\n | "\'F\'" | Fixed point. Same as "\'f\'". |\n +-----------+------------------------------------------------------------+\n | "\'g\'" | General format. 
For a given precision "p >= 1", this |\n | | rounds the number to "p" significant digits and then |\n | | formats the result in either fixed-point format or in |\n | | scientific notation, depending on its magnitude. The |\n | | precise rules are as follows: suppose that the result |\n | | formatted with presentation type "\'e\'" and precision "p-1" |\n | | would have exponent "exp". Then if "-4 <= exp < p", the |\n | | number is formatted with presentation type "\'f\'" and |\n | | precision "p-1-exp". Otherwise, the number is formatted |\n | | with presentation type "\'e\'" and precision "p-1". In both |\n | | cases insignificant trailing zeros are removed from the |\n | | significand, and the decimal point is also removed if |\n | | there are no remaining digits following it. Positive and |\n | | negative infinity, positive and negative zero, and nans, |\n | | are formatted as "inf", "-inf", "0", "-0" and "nan" |\n | | respectively, regardless of the precision. A precision of |\n | | "0" is treated as equivalent to a precision of "1". The |\n | | default precision is "6". |\n +-----------+------------------------------------------------------------+\n | "\'G\'" | General format. Same as "\'g\'" except switches to "\'E\'" if |\n | | the number gets too large. The representations of infinity |\n | | and NaN are uppercased, too. |\n +-----------+------------------------------------------------------------+\n | "\'n\'" | Number. This is the same as "\'g\'", except that it uses the |\n | | current locale setting to insert the appropriate number |\n | | separator characters. |\n +-----------+------------------------------------------------------------+\n | "\'%\'" | Percentage. Multiplies the number by 100 and displays in |\n | | fixed ("\'f\'") format, followed by a percent sign. |\n +-----------+------------------------------------------------------------+\n | None | The same as "\'g\'". |\n +-----------+------------------------------------------------------------+\n\n\nFormat examples\n===============\n\nThis section contains examples of the new format syntax and comparison\nwith the old "%"-formatting.\n\nIn most of the cases the syntax is similar to the old "%"-formatting,\nwith the addition of the "{}" and with ":" used instead of "%". For\nexample, "\'%03.2f\'" can be translated to "\'{:03.2f}\'".\n\nThe new format syntax also supports new and different options, shown\nin the follow examples.\n\nAccessing arguments by position:\n\n >>> \'{0}, {1}, {2}\'.format(\'a\', \'b\', \'c\')\n \'a, b, c\'\n >>> \'{}, {}, {}\'.format(\'a\', \'b\', \'c\') # 2.7+ only\n \'a, b, c\'\n >>> \'{2}, {1}, {0}\'.format(\'a\', \'b\', \'c\')\n \'c, b, a\'\n >>> \'{2}, {1}, {0}\'.format(*\'abc\') # unpacking argument sequence\n \'c, b, a\'\n >>> \'{0}{1}{0}\'.format(\'abra\', \'cad\') # arguments\' indices can be repeated\n \'abracadabra\'\n\nAccessing arguments by name:\n\n >>> \'Coordinates: {latitude}, {longitude}\'.format(latitude=\'37.24N\', longitude=\'-115.81W\')\n \'Coordinates: 37.24N, -115.81W\'\n >>> coord = {\'latitude\': \'37.24N\', \'longitude\': \'-115.81W\'}\n >>> \'Coordinates: {latitude}, {longitude}\'.format(**coord)\n \'Coordinates: 37.24N, -115.81W\'\n\nAccessing arguments\' attributes:\n\n >>> c = 3-5j\n >>> (\'The complex number {0} is formed from the real part {0.real} \'\n ... \'and the imaginary part {0.imag}.\').format(c)\n \'The complex number (3-5j) is formed from the real part 3.0 and the imaginary part -5.0.\'\n >>> class Point(object):\n ... def __init__(self, x, y):\n ... 
self.x, self.y = x, y\n ... def __str__(self):\n ... return \'Point({self.x}, {self.y})\'.format(self=self)\n ...\n >>> str(Point(4, 2))\n \'Point(4, 2)\'\n\nAccessing arguments\' items:\n\n >>> coord = (3, 5)\n >>> \'X: {0[0]}; Y: {0[1]}\'.format(coord)\n \'X: 3; Y: 5\'\n\nReplacing "%s" and "%r":\n\n >>> "repr() shows quotes: {!r}; str() doesn\'t: {!s}".format(\'test1\', \'test2\')\n "repr() shows quotes: \'test1\'; str() doesn\'t: test2"\n\nAligning the text and specifying a width:\n\n >>> \'{:<30}\'.format(\'left aligned\')\n \'left aligned \'\n >>> \'{:>30}\'.format(\'right aligned\')\n \' right aligned\'\n >>> \'{:^30}\'.format(\'centered\')\n \' centered \'\n >>> \'{:*^30}\'.format(\'centered\') # use \'*\' as a fill char\n \'***********centered***********\'\n\nReplacing "%+f", "%-f", and "% f" and specifying a sign:\n\n >>> \'{:+f}; {:+f}\'.format(3.14, -3.14) # show it always\n \'+3.140000; -3.140000\'\n >>> \'{: f}; {: f}\'.format(3.14, -3.14) # show a space for positive numbers\n \' 3.140000; -3.140000\'\n >>> \'{:-f}; {:-f}\'.format(3.14, -3.14) # show only the minus -- same as \'{:f}; {:f}\'\n \'3.140000; -3.140000\'\n\nReplacing "%x" and "%o" and converting the value to different bases:\n\n >>> # format also supports binary numbers\n >>> "int: {0:d}; hex: {0:x}; oct: {0:o}; bin: {0:b}".format(42)\n \'int: 42; hex: 2a; oct: 52; bin: 101010\'\n >>> # with 0x, 0o, or 0b as prefix:\n >>> "int: {0:d}; hex: {0:#x}; oct: {0:#o}; bin: {0:#b}".format(42)\n \'int: 42; hex: 0x2a; oct: 0o52; bin: 0b101010\'\n\nUsing the comma as a thousands separator:\n\n >>> \'{:,}\'.format(1234567890)\n \'1,234,567,890\'\n\nExpressing a percentage:\n\n >>> points = 19.5\n >>> total = 22\n >>> \'Correct answers: {:.2%}\'.format(points/total)\n \'Correct answers: 88.64%\'\n\nUsing type-specific formatting:\n\n >>> import datetime\n >>> d = datetime.datetime(2010, 7, 4, 12, 15, 58)\n >>> \'{:%Y-%m-%d %H:%M:%S}\'.format(d)\n \'2010-07-04 12:15:58\'\n\nNesting arguments and more complex examples:\n\n >>> for align, text in zip(\'<^>\', [\'left\', \'center\', \'right\']):\n ... \'{0:{fill}{align}16}\'.format(text, fill=align, align=align)\n ...\n \'left<<<<<<<<<<<<\'\n \'^^^^^center^^^^^\'\n \'>>>>>>>>>>>right\'\n >>>\n >>> octets = [192, 168, 0, 1]\n >>> \'{:02X}{:02X}{:02X}{:02X}\'.format(*octets)\n \'C0A80001\'\n >>> int(_, 16)\n 3232235521\n >>>\n >>> width = 5\n >>> for num in range(5,12):\n ... for base in \'dXob\':\n ... print \'{0:{width}{base}}\'.format(num, base=base, width=width),\n ... print\n ...\n 5 5 5 101\n 6 6 6 110\n 7 7 7 111\n 8 8 10 1000\n 9 9 11 1001\n 10 A 12 1010\n 11 B 13 1011\n', + 'function': u'\nFunction definitions\n********************\n\nA function definition defines a user-defined function object (see\nsection *The standard type hierarchy*):\n\n decorated ::= decorators (classdef | funcdef)\n decorators ::= decorator+\n decorator ::= "@" dotted_name ["(" [argument_list [","]] ")"] NEWLINE\n funcdef ::= "def" funcname "(" [parameter_list] ")" ":" suite\n dotted_name ::= identifier ("." identifier)*\n parameter_list ::= (defparameter ",")*\n ( "*" identifier ["," "**" identifier]\n | "**" identifier\n | defparameter [","] )\n defparameter ::= parameter ["=" expression]\n sublist ::= parameter ("," parameter)* [","]\n parameter ::= identifier | "(" sublist ")"\n funcname ::= identifier\n\nA function definition is an executable statement. 
Its execution binds\nthe function name in the current local namespace to a function object\n(a wrapper around the executable code for the function). This\nfunction object contains a reference to the current global namespace\nas the global namespace to be used when the function is called.\n\nThe function definition does not execute the function body; this gets\nexecuted only when the function is called. [3]\n\nA function definition may be wrapped by one or more *decorator*\nexpressions. Decorator expressions are evaluated when the function is\ndefined, in the scope that contains the function definition. The\nresult must be a callable, which is invoked with the function object\nas the only argument. The returned value is bound to the function name\ninstead of the function object. Multiple decorators are applied in\nnested fashion. For example, the following code:\n\n @f1(arg)\n @f2\n def func(): pass\n\nis equivalent to:\n\n def func(): pass\n func = f1(arg)(f2(func))\n\nWhen one or more top-level *parameters* have the form *parameter* "="\n*expression*, the function is said to have "default parameter values."\nFor a parameter with a default value, the corresponding *argument* may\nbe omitted from a call, in which case the parameter\'s default value is\nsubstituted. If a parameter has a default value, all following\nparameters must also have a default value --- this is a syntactic\nrestriction that is not expressed by the grammar.\n\n**Default parameter values are evaluated when the function definition\nis executed.** This means that the expression is evaluated once, when\nthe function is defined, and that the same "pre-computed" value is\nused for each call. This is especially important to understand when a\ndefault parameter is a mutable object, such as a list or a dictionary:\nif the function modifies the object (e.g. by appending an item to a\nlist), the default value is in effect modified. This is generally not\nwhat was intended. A way around this is to use "None" as the\ndefault, and explicitly test for it in the body of the function, e.g.:\n\n def whats_on_the_telly(penguin=None):\n if penguin is None:\n penguin = []\n penguin.append("property of the zoo")\n return penguin\n\nFunction call semantics are described in more detail in section\n*Calls*. A function call always assigns values to all parameters\nmentioned in the parameter list, either from position arguments, from\nkeyword arguments, or from default values. If the form\n""*identifier"" is present, it is initialized to a tuple receiving any\nexcess positional parameters, defaulting to the empty tuple. If the\nform ""**identifier"" is present, it is initialized to a new\ndictionary receiving any excess keyword arguments, defaulting to a new\nempty dictionary.\n\nIt is also possible to create anonymous functions (functions not bound\nto a name), for immediate use in expressions. This uses lambda\nexpressions, described in section *Lambdas*. Note that the lambda\nexpression is merely a shorthand for a simplified function definition;\na function defined in a ""def"" statement can be passed around or\nassigned to another name just like a function defined by a lambda\nexpression. The ""def"" form is actually more powerful since it\nallows the execution of multiple statements.\n\n**Programmer\'s note:** Functions are first-class objects. A ""def""\nform executed inside a function definition defines a local function\nthat can be returned or passed around. 
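A tiny sketch of such a locally defined function being returned from its enclosing function:

   def make_adder(n):
       def add(x):
           return x + n                # n is a free variable of add()
       return add

   add3 = make_adder(3)
   print add3(4)                       # 7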
Free variables used in the\nnested function can access the local variables of the function\ncontaining the def. See section *Naming and binding* for details.\n', + 'global': u'\nThe "global" statement\n**********************\n\n global_stmt ::= "global" identifier ("," identifier)*\n\nThe "global" statement is a declaration which holds for the entire\ncurrent code block. It means that the listed identifiers are to be\ninterpreted as globals. It would be impossible to assign to a global\nvariable without "global", although free variables may refer to\nglobals without being declared global.\n\nNames listed in a "global" statement must not be used in the same code\nblock textually preceding that "global" statement.\n\nNames listed in a "global" statement must not be defined as formal\nparameters or in a "for" loop control target, "class" definition,\nfunction definition, or "import" statement.\n\n**CPython implementation detail:** The current implementation does not\nenforce the latter two restrictions, but programs should not abuse\nthis freedom, as future implementations may enforce them or silently\nchange the meaning of the program.\n\n**Programmer\'s note:** the "global" is a directive to the parser. It\napplies only to code parsed at the same time as the "global"\nstatement. In particular, a "global" statement contained in an "exec"\nstatement does not affect the code block *containing* the "exec"\nstatement, and code contained in an "exec" statement is unaffected by\n"global" statements in the code containing the "exec" statement. The\nsame applies to the "eval()", "execfile()" and "compile()" functions.\n', + 'id-classes': u'\nReserved classes of identifiers\n*******************************\n\nCertain classes of identifiers (besides keywords) have special\nmeanings. These classes are identified by the patterns of leading and\ntrailing underscore characters:\n\n"_*"\n Not imported by "from module import *". The special identifier "_"\n is used in the interactive interpreter to store the result of the\n last evaluation; it is stored in the "__builtin__" module. When\n not in interactive mode, "_" has no special meaning and is not\n defined. See section *The import statement*.\n\n Note: The name "_" is often used in conjunction with\n internationalization; refer to the documentation for the\n "gettext" module for more information on this convention.\n\n"__*__"\n System-defined names. These names are defined by the interpreter\n and its implementation (including the standard library). Current\n system names are discussed in the *Special method names* section\n and elsewhere. More will likely be defined in future versions of\n Python. *Any* use of "__*__" names, in any context, that does not\n follow explicitly documented use, is subject to breakage without\n warning.\n\n"__*"\n Class-private names. Names in this category, when used within the\n context of a class definition, are re-written to use a mangled form\n to help avoid name clashes between "private" attributes of base and\n derived classes. See section *Identifiers (Names)*.\n', + 'identifiers': u'\nIdentifiers and keywords\n************************\n\nIdentifiers (also referred to as *names*) are described by the\nfollowing lexical definitions:\n\n identifier ::= (letter|"_") (letter | digit | "_")*\n letter ::= lowercase | uppercase\n lowercase ::= "a"..."z"\n uppercase ::= "A"..."Z"\n digit ::= "0"..."9"\n\nIdentifiers are unlimited in length. 
Case is significant.\n\n\nKeywords\n========\n\nThe following identifiers are used as reserved words, or *keywords* of\nthe language, and cannot be used as ordinary identifiers. They must\nbe spelled exactly as written here:\n\n and del from not while\n as elif global or with\n assert else if pass yield\n break except import print\n class exec in raise\n continue finally is return\n def for lambda try\n\nChanged in version 2.4: "None" became a constant and is now recognized\nby the compiler as a name for the built-in object "None". Although it\nis not a keyword, you cannot assign a different object to it.\n\nChanged in version 2.5: Using "as" and "with" as identifiers triggers\na warning. To use them as keywords, enable the "with_statement"\nfuture feature .\n\nChanged in version 2.6: "as" and "with" are full keywords.\n\n\nReserved classes of identifiers\n===============================\n\nCertain classes of identifiers (besides keywords) have special\nmeanings. These classes are identified by the patterns of leading and\ntrailing underscore characters:\n\n"_*"\n Not imported by "from module import *". The special identifier "_"\n is used in the interactive interpreter to store the result of the\n last evaluation; it is stored in the "__builtin__" module. When\n not in interactive mode, "_" has no special meaning and is not\n defined. See section *The import statement*.\n\n Note: The name "_" is often used in conjunction with\n internationalization; refer to the documentation for the\n "gettext" module for more information on this convention.\n\n"__*__"\n System-defined names. These names are defined by the interpreter\n and its implementation (including the standard library). Current\n system names are discussed in the *Special method names* section\n and elsewhere. More will likely be defined in future versions of\n Python. *Any* use of "__*__" names, in any context, that does not\n follow explicitly documented use, is subject to breakage without\n warning.\n\n"__*"\n Class-private names. Names in this category, when used within the\n context of a class definition, are re-written to use a mangled form\n to help avoid name clashes between "private" attributes of base and\n derived classes. See section *Identifiers (Names)*.\n', + 'if': u'\nThe "if" statement\n******************\n\nThe "if" statement is used for conditional execution:\n\n if_stmt ::= "if" expression ":" suite\n ( "elif" expression ":" suite )*\n ["else" ":" suite]\n\nIt selects exactly one of the suites by evaluating the expressions one\nby one until one is found to be true (see section *Boolean operations*\nfor the definition of true and false); then that suite is executed\n(and no other part of the "if" statement is executed or evaluated).\nIf all expressions are false, the suite of the "else" clause, if\npresent, is executed.\n', + 'imaginary': u'\nImaginary literals\n******************\n\nImaginary literals are described by the following lexical definitions:\n\n imagnumber ::= (floatnumber | intpart) ("j" | "J")\n\nAn imaginary literal yields a complex number with a real part of 0.0.\nComplex numbers are represented as a pair of floating point numbers\nand have the same restrictions on their range. To create a complex\nnumber with a nonzero real part, add a floating point number to it,\ne.g., "(3+4j)". 
Some examples of imaginary literals:\n\n 3.14j 10.j 10j .001j 1e100j 3.14e-10j\n', + 'import': u'\nThe "import" statement\n**********************\n\n import_stmt ::= "import" module ["as" name] ( "," module ["as" name] )*\n | "from" relative_module "import" identifier ["as" name]\n ( "," identifier ["as" name] )*\n | "from" relative_module "import" "(" identifier ["as" name]\n ( "," identifier ["as" name] )* [","] ")"\n | "from" module "import" "*"\n module ::= (identifier ".")* identifier\n relative_module ::= "."* module | "."+\n name ::= identifier\n\nImport statements are executed in two steps: (1) find a module, and\ninitialize it if necessary; (2) define a name or names in the local\nnamespace (of the scope where the "import" statement occurs). The\nstatement comes in two forms differing on whether it uses the "from"\nkeyword. The first form (without "from") repeats these steps for each\nidentifier in the list. The form with "from" performs step (1) once,\nand then performs step (2) repeatedly.\n\nTo understand how step (1) occurs, one must first understand how\nPython handles hierarchical naming of modules. To help organize\nmodules and provide a hierarchy in naming, Python has a concept of\npackages. A package can contain other packages and modules while\nmodules cannot contain other modules or packages. From a file system\nperspective, packages are directories and modules are files.\n\nOnce the name of the module is known (unless otherwise specified, the\nterm "module" will refer to both packages and modules), searching for\nthe module or package can begin. The first place checked is\n"sys.modules", the cache of all modules that have been imported\npreviously. If the module is found there then it is used in step (2)\nof import.\n\nIf the module is not found in the cache, then "sys.meta_path" is\nsearched (the specification for "sys.meta_path" can be found in **PEP\n302**). The object is a list of *finder* objects which are queried in\norder as to whether they know how to load the module by calling their\n"find_module()" method with the name of the module. If the module\nhappens to be contained within a package (as denoted by the existence\nof a dot in the name), then a second argument to "find_module()" is\ngiven as the value of the "__path__" attribute from the parent package\n(everything up to the last dot in the name of the module being\nimported). If a finder can find the module it returns a *loader*\n(discussed later) or returns "None".\n\nIf none of the finders on "sys.meta_path" are able to find the module\nthen some implicitly defined finders are queried. Implementations of\nPython vary in what implicit meta path finders are defined. The one\nthey all do define, though, is one that handles "sys.path_hooks",\n"sys.path_importer_cache", and "sys.path".\n\nThe implicit finder searches for the requested module in the "paths"\nspecified in one of two places ("paths" do not have to be file system\npaths). If the module being imported is supposed to be contained\nwithin a package then the second argument passed to "find_module()",\n"__path__" on the parent package, is used as the source of paths. If\nthe module is not contained in a package then "sys.path" is used as\nthe source of paths.\n\nOnce the source of paths is chosen it is iterated over to find a\nfinder that can handle that path. The dict at\n"sys.path_importer_cache" caches finders for paths and is checked for\na finder. 
If the path does not have a finder cached then\n"sys.path_hooks" is searched by calling each object in the list with a\nsingle argument of the path, returning a finder or raises\n"ImportError". If a finder is returned then it is cached in\n"sys.path_importer_cache" and then used for that path entry. If no\nfinder can be found but the path exists then a value of "None" is\nstored in "sys.path_importer_cache" to signify that an implicit, file-\nbased finder that handles modules stored as individual files should be\nused for that path. If the path does not exist then a finder which\nalways returns "None" is placed in the cache for the path.\n\nIf no finder can find the module then "ImportError" is raised.\nOtherwise some finder returned a loader whose "load_module()" method\nis called with the name of the module to load (see **PEP 302** for the\noriginal definition of loaders). A loader has several responsibilities\nto perform on a module it loads. First, if the module already exists\nin "sys.modules" (a possibility if the loader is called outside of the\nimport machinery) then it is to use that module for initialization and\nnot a new module. But if the module does not exist in "sys.modules"\nthen it is to be added to that dict before initialization begins. If\nan error occurs during loading of the module and it was added to\n"sys.modules" it is to be removed from the dict. If an error occurs\nbut the module was already in "sys.modules" it is left in the dict.\n\nThe loader must set several attributes on the module. "__name__" is to\nbe set to the name of the module. "__file__" is to be the "path" to\nthe file unless the module is built-in (and thus listed in\n"sys.builtin_module_names") in which case the attribute is not set. If\nwhat is being imported is a package then "__path__" is to be set to a\nlist of paths to be searched when looking for modules and packages\ncontained within the package being imported. "__package__" is optional\nbut should be set to the name of package that contains the module or\npackage (the empty string is used for module not contained in a\npackage). "__loader__" is also optional but should be set to the\nloader object that is loading the module.\n\nIf an error occurs during loading then the loader raises "ImportError"\nif some other exception is not already being propagated. Otherwise the\nloader returns the module that was loaded and initialized.\n\nWhen step (1) finishes without raising an exception, step (2) can\nbegin.\n\nThe first form of "import" statement binds the module name in the\nlocal namespace to the module object, and then goes on to import the\nnext identifier, if any. If the module name is followed by "as", the\nname following "as" is used as the local name for the module.\n\nThe "from" form does not bind the module name: it goes through the\nlist of identifiers, looks each one of them up in the module found in\nstep (1), and binds the name in the local namespace to the object thus\nfound. As with the first form of "import", an alternate local name\ncan be supplied by specifying ""as" localname". If a name is not\nfound, "ImportError" is raised. If the list of identifiers is\nreplaced by a star ("\'*\'"), all public names defined in the module are\nbound in the local namespace of the "import" statement..\n\nThe *public names* defined by a module are determined by checking the\nmodule\'s namespace for a variable named "__all__"; if defined, it must\nbe a sequence of strings which are names defined or imported by that\nmodule. 
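# A rough sketch, under stated assumptions, of the finder/loader protocol
# summarized above (PEP 302 style): find_module() returns a loader or None,
# and load_module() reuses or registers the module in sys.modules and sets
# attributes such as __file__ and __loader__.  The module name
# "virtual_hello" and its "greeting" attribute are made up for illustration.
import imp
import sys

class HelloFinder(object):
    def find_module(self, fullname, path=None):
        if fullname == 'virtual_hello':
            return self               # this object also acts as the loader
        return None

    def load_module(self, fullname):
        if fullname in sys.modules:   # reuse an existing module if present
            return sys.modules[fullname]
        mod = imp.new_module(fullname)
        mod.__file__ = '<virtual>'
        mod.__loader__ = self
        sys.modules[fullname] = mod   # register before initialization
        mod.greeting = 'hello'
        return mod

sys.meta_path.append(HelloFinder())
import virtual_hello
print virtual_hello.greeting          # -> hello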
The names given in "__all__" are all considered public and\nare required to exist. If "__all__" is not defined, the set of public\nnames includes all names found in the module\'s namespace which do not\nbegin with an underscore character ("\'_\'"). "__all__" should contain\nthe entire public API. It is intended to avoid accidentally exporting\nitems that are not part of the API (such as library modules which were\nimported and used within the module).\n\nThe "from" form with "*" may only occur in a module scope. If the\nwild card form of import --- "import *" --- is used in a function and\nthe function contains or is a nested block with free variables, the\ncompiler will raise a "SyntaxError".\n\nWhen specifying what module to import you do not have to specify the\nabsolute name of the module. When a module or package is contained\nwithin another package it is possible to make a relative import within\nthe same top package without having to mention the package name. By\nusing leading dots in the specified module or package after "from" you\ncan specify how high to traverse up the current package hierarchy\nwithout specifying exact names. One leading dot means the current\npackage where the module making the import exists. Two dots means up\none package level. Three dots is up two levels, etc. So if you execute\n"from . import mod" from a module in the "pkg" package then you will\nend up importing "pkg.mod". If you execute "from ..subpkg2 import mod"\nfrom within "pkg.subpkg1" you will import "pkg.subpkg2.mod". The\nspecification for relative imports is contained within **PEP 328**.\n\n"importlib.import_module()" is provided to support applications that\ndetermine which modules need to be loaded dynamically.\n\n\nFuture statements\n=================\n\nA *future statement* is a directive to the compiler that a particular\nmodule should be compiled using syntax or semantics that will be\navailable in a specified future release of Python. The future\nstatement is intended to ease migration to future versions of Python\nthat introduce incompatible changes to the language. It allows use of\nthe new features on a per-module basis before the release in which the\nfeature becomes standard.\n\n future_statement ::= "from" "__future__" "import" feature ["as" name]\n ("," feature ["as" name])*\n | "from" "__future__" "import" "(" feature ["as" name]\n ("," feature ["as" name])* [","] ")"\n feature ::= identifier\n name ::= identifier\n\nA future statement must appear near the top of the module. The only\nlines that can appear before a future statement are:\n\n* the module docstring (if any),\n\n* comments,\n\n* blank lines, and\n\n* other future statements.\n\nThe features recognized by Python 2.6 are "unicode_literals",\n"print_function", "absolute_import", "division", "generators",\n"nested_scopes" and "with_statement". "generators", "with_statement",\n"nested_scopes" are redundant in Python version 2.6 and above because\nthey are always enabled.\n\nA future statement is recognized and treated specially at compile\ntime: Changes to the semantics of core constructs are often\nimplemented by generating different code. It may even be the case\nthat a new feature introduces new incompatible syntax (such as a new\nreserved word), in which case the compiler may need to parse the\nmodule differently. 
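# A small sketch of a future statement as described above: enabling the
# "division" feature changes what "/" does for this module only.
from __future__ import division

print 1 / 2      # -> 0.5 with the future import (0 without it)
print 1 // 2     # -> 0, floor division either way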
Such decisions cannot be pushed off until\nruntime.\n\nFor any given release, the compiler knows which feature names have\nbeen defined, and raises a compile-time error if a future statement\ncontains a feature not known to it.\n\nThe direct runtime semantics are the same as for any import statement:\nthere is a standard module "__future__", described later, and it will\nbe imported in the usual way at the time the future statement is\nexecuted.\n\nThe interesting runtime semantics depend on the specific feature\nenabled by the future statement.\n\nNote that there is nothing special about the statement:\n\n import __future__ [as name]\n\nThat is not a future statement; it\'s an ordinary import statement with\nno special semantics or syntax restrictions.\n\nCode compiled by an "exec" statement or calls to the built-in\nfunctions "compile()" and "execfile()" that occur in a module "M"\ncontaining a future statement will, by default, use the new syntax or\nsemantics associated with the future statement. This can, starting\nwith Python 2.2 be controlled by optional arguments to "compile()" ---\nsee the documentation of that function for details.\n\nA future statement typed at an interactive interpreter prompt will\ntake effect for the rest of the interpreter session. If an\ninterpreter is started with the *-i* option, is passed a script name\nto execute, and the script includes a future statement, it will be in\neffect in the interactive session started after the script is\nexecuted.\n\nSee also: **PEP 236** - Back to the __future__\n\n The original proposal for the __future__ mechanism.\n', + 'in': u'\nComparisons\n***********\n\nUnlike C, all comparison operations in Python have the same priority,\nwhich is lower than that of any arithmetic, shifting or bitwise\noperation. Also unlike C, expressions like "a < b < c" have the\ninterpretation that is conventional in mathematics:\n\n comparison ::= or_expr ( comp_operator or_expr )*\n comp_operator ::= "<" | ">" | "==" | ">=" | "<=" | "<>" | "!="\n | "is" ["not"] | ["not"] "in"\n\nComparisons yield boolean values: "True" or "False".\n\nComparisons can be chained arbitrarily, e.g., "x < y <= z" is\nequivalent to "x < y and y <= z", except that "y" is evaluated only\nonce (but in both cases "z" is not evaluated at all when "x < y" is\nfound to be false).\n\nFormally, if *a*, *b*, *c*, ..., *y*, *z* are expressions and *op1*,\n*op2*, ..., *opN* are comparison operators, then "a op1 b op2 c ... y\nopN z" is equivalent to "a op1 b and b op2 c and ... y opN z", except\nthat each expression is evaluated at most once.\n\nNote that "a op1 b op2 c" doesn\'t imply any kind of comparison between\n*a* and *c*, so that, e.g., "x < y > z" is perfectly legal (though\nperhaps not pretty).\n\nThe forms "<>" and "!=" are equivalent; for consistency with C, "!="\nis preferred; where "!=" is mentioned below "<>" is also accepted.\nThe "<>" spelling is considered obsolescent.\n\nThe operators "<", ">", "==", ">=", "<=", and "!=" compare the values\nof two objects. The objects need not have the same type. If both are\nnumbers, they are converted to a common type. Otherwise, objects of\ndifferent types *always* compare unequal, and are ordered consistently\nbut arbitrarily. 
You can control comparison behavior of objects of\nnon-built-in types by defining a "__cmp__" method or rich comparison\nmethods like "__gt__", described in section *Special method names*.\n\n(This unusual definition of comparison was used to simplify the\ndefinition of operations like sorting and the "in" and "not in"\noperators. In the future, the comparison rules for objects of\ndifferent types are likely to change.)\n\nComparison of objects of the same type depends on the type:\n\n* Numbers are compared arithmetically.\n\n* Strings are compared lexicographically using the numeric\n equivalents (the result of the built-in function "ord()") of their\n characters. Unicode and 8-bit strings are fully interoperable in\n this behavior. [4]\n\n* Tuples and lists are compared lexicographically using comparison\n of corresponding elements. This means that to compare equal, each\n element must compare equal and the two sequences must be of the same\n type and have the same length.\n\n If not equal, the sequences are ordered the same as their first\n differing elements. For example, "cmp([1,2,x], [1,2,y])" returns\n the same as "cmp(x,y)". If the corresponding element does not\n exist, the shorter sequence is ordered first (for example, "[1,2] <\n [1,2,3]").\n\n* Mappings (dictionaries) compare equal if and only if their sorted\n (key, value) lists compare equal. [5] Outcomes other than equality\n are resolved consistently, but are not otherwise defined. [6]\n\n* Most other objects of built-in types compare unequal unless they\n are the same object; the choice whether one object is considered\n smaller or larger than another one is made arbitrarily but\n consistently within one execution of a program.\n\nThe operators "in" and "not in" test for collection membership. "x in\ns" evaluates to true if *x* is a member of the collection *s*, and\nfalse otherwise. "x not in s" returns the negation of "x in s". The\ncollection membership test has traditionally been bound to sequences;\nan object is a member of a collection if the collection is a sequence\nand contains an element equal to that object. However, it make sense\nfor many other object types to support membership tests without being\na sequence. In particular, dictionaries (for keys) and sets support\nmembership testing.\n\nFor the list and tuple types, "x in y" is true if and only if there\nexists an index *i* such that "x == y[i]" is true.\n\nFor the Unicode and string types, "x in y" is true if and only if *x*\nis a substring of *y*. An equivalent test is "y.find(x) != -1".\nNote, *x* and *y* need not be the same type; consequently, "u\'ab\' in\n\'abc\'" will return "True". Empty strings are always considered to be a\nsubstring of any other string, so """ in "abc"" will return "True".\n\nChanged in version 2.3: Previously, *x* was required to be a string of\nlength "1".\n\nFor user-defined classes which define the "__contains__()" method, "x\nin y" is true if and only if "y.__contains__(x)" is true.\n\nFor user-defined classes which do not define "__contains__()" but do\ndefine "__iter__()", "x in y" is true if some value "z" with "x == z"\nis produced while iterating over "y". If an exception is raised\nduring the iteration, it is as if "in" raised that exception.\n\nLastly, the old-style iteration protocol is tried: if a class defines\n"__getitem__()", "x in y" is true if and only if there is a non-\nnegative integer index *i* such that "x == y[i]", and all lower\ninteger indices do not raise "IndexError" exception. 
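# A hedged sketch of the membership-test hooks described above: a class
# defining __contains__() answers "in" directly, while one defining only
# __getitem__() falls back to the old sequence iteration protocol.  Both
# classes are invented for illustration.
class EvenNumbers(object):
    def __contains__(self, item):
        return item % 2 == 0

class Countdown(object):
    def __getitem__(self, index):
        if index > 2:
            raise IndexError(index)   # ends the implicit iteration
        return 3 - index

print 4 in EvenNumbers()     # -> True  (via __contains__)
print 2 in Countdown()       # -> True  (via the __getitem__ fallback)
print 7 in Countdown()       # -> False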
(If any other\nexception is raised, it is as if "in" raised that exception).\n\nThe operator "not in" is defined to have the inverse true value of\n"in".\n\nThe operators "is" and "is not" test for object identity: "x is y" is\ntrue if and only if *x* and *y* are the same object. "x is not y"\nyields the inverse truth value. [7]\n', + 'integers': u'\nInteger and long integer literals\n*********************************\n\nInteger and long integer literals are described by the following\nlexical definitions:\n\n longinteger ::= integer ("l" | "L")\n integer ::= decimalinteger | octinteger | hexinteger | bininteger\n decimalinteger ::= nonzerodigit digit* | "0"\n octinteger ::= "0" ("o" | "O") octdigit+ | "0" octdigit+\n hexinteger ::= "0" ("x" | "X") hexdigit+\n bininteger ::= "0" ("b" | "B") bindigit+\n nonzerodigit ::= "1"..."9"\n octdigit ::= "0"..."7"\n bindigit ::= "0" | "1"\n hexdigit ::= digit | "a"..."f" | "A"..."F"\n\nAlthough both lower case "\'l\'" and upper case "\'L\'" are allowed as\nsuffix for long integers, it is strongly recommended to always use\n"\'L\'", since the letter "\'l\'" looks too much like the digit "\'1\'".\n\nPlain integer literals that are above the largest representable plain\ninteger (e.g., 2147483647 when using 32-bit arithmetic) are accepted\nas if they were long integers instead. [1] There is no limit for long\ninteger literals apart from what can be stored in available memory.\n\nSome examples of plain integer literals (first row) and long integer\nliterals (second and third rows):\n\n 7 2147483647 0177\n 3L 79228162514264337593543950336L 0377L 0x100000000L\n 79228162514264337593543950336 0xdeadbeef\n', + 'lambda': u'\nLambdas\n*******\n\n lambda_expr ::= "lambda" [parameter_list]: expression\n old_lambda_expr ::= "lambda" [parameter_list]: old_expression\n\nLambda expressions (sometimes called lambda forms) have the same\nsyntactic position as expressions. They are a shorthand to create\nanonymous functions; the expression "lambda arguments: expression"\nyields a function object. The unnamed object behaves like a function\nobject defined with\n\n def name(arguments):\n return expression\n\nSee section *Function definitions* for the syntax of parameter lists.\nNote that functions created with lambda expressions cannot contain\nstatements.\n', + 'lists': u'\nList displays\n*************\n\nA list display is a possibly empty series of expressions enclosed in\nsquare brackets:\n\n list_display ::= "[" [expression_list | list_comprehension] "]"\n list_comprehension ::= expression list_for\n list_for ::= "for" target_list "in" old_expression_list [list_iter]\n old_expression_list ::= old_expression [("," old_expression)+ [","]]\n old_expression ::= or_test | old_lambda_expr\n list_iter ::= list_for | list_if\n list_if ::= "if" old_expression [list_iter]\n\nA list display yields a new list object. Its contents are specified\nby providing either a list of expressions or a list comprehension.\nWhen a comma-separated list of expressions is supplied, its elements\nare evaluated from left to right and placed into the list object in\nthat order. When a list comprehension is supplied, it consists of a\nsingle expression followed by at least one "for" clause and zero or\nmore "for" or "if" clauses. 
In this case, the elements of the new\nlist are those that would be produced by considering each of the "for"\nor "if" clauses a block, nesting from left to right, and evaluating\nthe expression to produce a list element each time the innermost block\nis reached [1].\n', + 'naming': u'\nNaming and binding\n******************\n\n*Names* refer to objects. Names are introduced by name binding\noperations. Each occurrence of a name in the program text refers to\nthe *binding* of that name established in the innermost function block\ncontaining the use.\n\nA *block* is a piece of Python program text that is executed as a\nunit. The following are blocks: a module, a function body, and a class\ndefinition. Each command typed interactively is a block. A script\nfile (a file given as standard input to the interpreter or specified\non the interpreter command line the first argument) is a code block.\nA script command (a command specified on the interpreter command line\nwith the \'**-c**\' option) is a code block. The file read by the\nbuilt-in function "execfile()" is a code block. The string argument\npassed to the built-in function "eval()" and to the "exec" statement\nis a code block. The expression read and evaluated by the built-in\nfunction "input()" is a code block.\n\nA code block is executed in an *execution frame*. A frame contains\nsome administrative information (used for debugging) and determines\nwhere and how execution continues after the code block\'s execution has\ncompleted.\n\nA *scope* defines the visibility of a name within a block. If a local\nvariable is defined in a block, its scope includes that block. If the\ndefinition occurs in a function block, the scope extends to any blocks\ncontained within the defining one, unless a contained block introduces\na different binding for the name. The scope of names defined in a\nclass block is limited to the class block; it does not extend to the\ncode blocks of methods -- this includes generator expressions since\nthey are implemented using a function scope. This means that the\nfollowing will fail:\n\n class A:\n a = 42\n b = list(a + i for i in range(10))\n\nWhen a name is used in a code block, it is resolved using the nearest\nenclosing scope. The set of all such scopes visible to a code block\nis called the block\'s *environment*.\n\nIf a name is bound in a block, it is a local variable of that block.\nIf a name is bound at the module level, it is a global variable. (The\nvariables of the module code block are local and global.) If a\nvariable is used in a code block but not defined there, it is a *free\nvariable*.\n\nWhen a name is not found at all, a "NameError" exception is raised.\nIf the name refers to a local variable that has not been bound, a\n"UnboundLocalError" exception is raised. "UnboundLocalError" is a\nsubclass of "NameError".\n\nThe following constructs bind names: formal parameters to functions,\n"import" statements, class and function definitions (these bind the\nclass or function name in the defining block), and targets that are\nidentifiers if occurring in an assignment, "for" loop header, in the\nsecond position of an "except" clause header or after "as" in a "with"\nstatement. The "import" statement of the form "from ... import *"\nbinds all names defined in the imported module, except those beginning\nwith an underscore. This form may only be used at the module level.\n\nA target occurring in a "del" statement is also considered bound for\nthis purpose (though the actual semantics are to unbind the name). 
It\nis illegal to unbind a name that is referenced by an enclosing scope;\nthe compiler will report a "SyntaxError".\n\nEach assignment or import statement occurs within a block defined by a\nclass or function definition or at the module level (the top-level\ncode block).\n\nIf a name binding operation occurs anywhere within a code block, all\nuses of the name within the block are treated as references to the\ncurrent block. This can lead to errors when a name is used within a\nblock before it is bound. This rule is subtle. Python lacks\ndeclarations and allows name binding operations to occur anywhere\nwithin a code block. The local variables of a code block can be\ndetermined by scanning the entire text of the block for name binding\noperations.\n\nIf the global statement occurs within a block, all uses of the name\nspecified in the statement refer to the binding of that name in the\ntop-level namespace. Names are resolved in the top-level namespace by\nsearching the global namespace, i.e. the namespace of the module\ncontaining the code block, and the builtins namespace, the namespace\nof the module "__builtin__". The global namespace is searched first.\nIf the name is not found there, the builtins namespace is searched.\nThe global statement must precede all uses of the name.\n\nThe builtins namespace associated with the execution of a code block\nis actually found by looking up the name "__builtins__" in its global\nnamespace; this should be a dictionary or a module (in the latter case\nthe module\'s dictionary is used). By default, when in the "__main__"\nmodule, "__builtins__" is the built-in module "__builtin__" (note: no\n\'s\'); when in any other module, "__builtins__" is an alias for the\ndictionary of the "__builtin__" module itself. "__builtins__" can be\nset to a user-created dictionary to create a weak form of restricted\nexecution.\n\n**CPython implementation detail:** Users should not touch\n"__builtins__"; it is strictly an implementation detail. Users\nwanting to override values in the builtins namespace should "import"\nthe "__builtin__" (no \'s\') module and modify its attributes\nappropriately.\n\nThe namespace for a module is automatically created the first time a\nmodule is imported. The main module for a script is always called\n"__main__".\n\nThe "global" statement has the same scope as a name binding operation\nin the same block. If the nearest enclosing scope for a free variable\ncontains a global statement, the free variable is treated as a global.\n\nA class definition is an executable statement that may use and define\nnames. These references follow the normal rules for name resolution.\nThe namespace of the class definition becomes the attribute dictionary\nof the class. Names defined at the class scope are not visible in\nmethods.\n\n\nInteraction with dynamic features\n=================================\n\nThere are several cases where Python statements are illegal when used\nin conjunction with nested scopes that contain free variables.\n\nIf a variable is referenced in an enclosing scope, it is illegal to\ndelete the name. 
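# A short sketch of the local-binding rule described in the "naming" entry
# above: because "x" is assigned somewhere in f(), every use of "x" inside
# f() is treated as the local name, so reading it before the assignment
# raises UnboundLocalError.
x = 10

def f():
    print x        # UnboundLocalError: used before the local binding below
    x = 20

try:
    f()
except UnboundLocalError as exc:
    print exc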
An error will be reported at compile time.\n\nIf the wild card form of import --- "import *" --- is used in a\nfunction and the function contains or is a nested block with free\nvariables, the compiler will raise a "SyntaxError".\n\nIf "exec" is used in a function and the function contains or is a\nnested block with free variables, the compiler will raise a\n"SyntaxError" unless the exec explicitly specifies the local namespace\nfor the "exec". (In other words, "exec obj" would be illegal, but\n"exec obj in ns" would be legal.)\n\nThe "eval()", "execfile()", and "input()" functions and the "exec"\nstatement do not have access to the full environment for resolving\nnames. Names may be resolved in the local and global namespaces of\nthe caller. Free variables are not resolved in the nearest enclosing\nnamespace, but in the global namespace. [1] The "exec" statement and\nthe "eval()" and "execfile()" functions have optional arguments to\noverride the global and local namespace. If only one namespace is\nspecified, it is used for both.\n', + 'numbers': u'\nNumeric literals\n****************\n\nThere are four types of numeric literals: plain integers, long\nintegers, floating point numbers, and imaginary numbers. There are no\ncomplex literals (complex numbers can be formed by adding a real\nnumber and an imaginary number).\n\nNote that numeric literals do not include a sign; a phrase like "-1"\nis actually an expression composed of the unary operator \'"-"\' and the\nliteral "1".\n', + 'numeric-types': u'\nEmulating numeric types\n***********************\n\nThe following methods can be defined to emulate numeric objects.\nMethods corresponding to operations that are not supported by the\nparticular kind of number implemented (e.g., bitwise operations for\nnon-integral numbers) should be left undefined.\n\nobject.__add__(self, other)\nobject.__sub__(self, other)\nobject.__mul__(self, other)\nobject.__floordiv__(self, other)\nobject.__mod__(self, other)\nobject.__divmod__(self, other)\nobject.__pow__(self, other[, modulo])\nobject.__lshift__(self, other)\nobject.__rshift__(self, other)\nobject.__and__(self, other)\nobject.__xor__(self, other)\nobject.__or__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations ("+", "-", "*", "//", "%", "divmod()", "pow()", "**",\n "<<", ">>", "&", "^", "|"). For instance, to evaluate the\n expression "x + y", where *x* is an instance of a class that has an\n "__add__()" method, "x.__add__(y)" is called. The "__divmod__()"\n method should be the equivalent to using "__floordiv__()" and\n "__mod__()"; it should not be related to "__truediv__()" (described\n below). Note that "__pow__()" should be defined to accept an\n optional third argument if the ternary version of the built-in\n "pow()" function is to be supported.\n\n If one of those methods does not support the operation with the\n supplied arguments, it should return "NotImplemented".\n\nobject.__div__(self, other)\nobject.__truediv__(self, other)\n\n The division operator ("/") is implemented by these methods. The\n "__truediv__()" method is used when "__future__.division" is in\n effect, otherwise "__div__()" is used. 
If only one of these two\n methods is defined, the object will not support division in the\n alternate context; "TypeError" will be raised instead.\n\nobject.__radd__(self, other)\nobject.__rsub__(self, other)\nobject.__rmul__(self, other)\nobject.__rdiv__(self, other)\nobject.__rtruediv__(self, other)\nobject.__rfloordiv__(self, other)\nobject.__rmod__(self, other)\nobject.__rdivmod__(self, other)\nobject.__rpow__(self, other)\nobject.__rlshift__(self, other)\nobject.__rrshift__(self, other)\nobject.__rand__(self, other)\nobject.__rxor__(self, other)\nobject.__ror__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations ("+", "-", "*", "/", "%", "divmod()", "pow()", "**",\n "<<", ">>", "&", "^", "|") with reflected (swapped) operands.\n These functions are only called if the left operand does not\n support the corresponding operation and the operands are of\n different types. [2] For instance, to evaluate the expression "x -\n y", where *y* is an instance of a class that has an "__rsub__()"\n method, "y.__rsub__(x)" is called if "x.__sub__(y)" returns\n *NotImplemented*.\n\n Note that ternary "pow()" will not try calling "__rpow__()" (the\n coercion rules would become too complicated).\n\n Note: If the right operand\'s type is a subclass of the left\n operand\'s type and that subclass provides the reflected method\n for the operation, this method will be called before the left\n operand\'s non-reflected method. This behavior allows subclasses\n to override their ancestors\' operations.\n\nobject.__iadd__(self, other)\nobject.__isub__(self, other)\nobject.__imul__(self, other)\nobject.__idiv__(self, other)\nobject.__itruediv__(self, other)\nobject.__ifloordiv__(self, other)\nobject.__imod__(self, other)\nobject.__ipow__(self, other[, modulo])\nobject.__ilshift__(self, other)\nobject.__irshift__(self, other)\nobject.__iand__(self, other)\nobject.__ixor__(self, other)\nobject.__ior__(self, other)\n\n These methods are called to implement the augmented arithmetic\n assignments ("+=", "-=", "*=", "/=", "//=", "%=", "**=", "<<=",\n ">>=", "&=", "^=", "|="). These methods should attempt to do the\n operation in-place (modifying *self*) and return the result (which\n could be, but does not have to be, *self*). If a specific method\n is not defined, the augmented assignment falls back to the normal\n methods. For instance, to execute the statement "x += y", where\n *x* is an instance of a class that has an "__iadd__()" method,\n "x.__iadd__(y)" is called. If *x* is an instance of a class that\n does not define a "__iadd__()" method, "x.__add__(y)" and\n "y.__radd__(x)" are considered, as with the evaluation of "x + y".\n\nobject.__neg__(self)\nobject.__pos__(self)\nobject.__abs__(self)\nobject.__invert__(self)\n\n Called to implement the unary arithmetic operations ("-", "+",\n "abs()" and "~").\n\nobject.__complex__(self)\nobject.__int__(self)\nobject.__long__(self)\nobject.__float__(self)\n\n Called to implement the built-in functions "complex()", "int()",\n "long()", and "float()". Should return a value of the appropriate\n type.\n\nobject.__oct__(self)\nobject.__hex__(self)\n\n Called to implement the built-in functions "oct()" and "hex()".\n Should return a string value.\n\nobject.__index__(self)\n\n Called to implement "operator.index()". Also called whenever\n Python needs an integer object (such as in slicing). 
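# A minimal sketch of the binary/reflected method protocol described above:
# __add__() returns NotImplemented for operands it does not understand, which
# makes Python try the other operand's __radd__().  The Seconds class is
# made up for illustration.
class Seconds(object):
    def __init__(self, value):
        self.value = value

    def __add__(self, other):
        if isinstance(other, Seconds):
            return Seconds(self.value + other.value)
        if isinstance(other, (int, long, float)):
            return Seconds(self.value + other)
        return NotImplemented        # let the other operand have a try

    __radd__ = __add__               # addition is symmetric here

print (Seconds(30) + 15).value       # -> 45, via __add__
print (15 + Seconds(30)).value       # -> 45, via __radd__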
Must return\n an integer (int or long).\n\n New in version 2.5.\n\nobject.__coerce__(self, other)\n\n Called to implement "mixed-mode" numeric arithmetic. Should either\n return a 2-tuple containing *self* and *other* converted to a\n common numeric type, or "None" if conversion is impossible. When\n the common type would be the type of "other", it is sufficient to\n return "None", since the interpreter will also ask the other object\n to attempt a coercion (but sometimes, if the implementation of the\n other type cannot be changed, it is useful to do the conversion to\n the other type here). A return value of "NotImplemented" is\n equivalent to returning "None".\n', + 'objects': u'\nObjects, values and types\n*************************\n\n*Objects* are Python\'s abstraction for data. All data in a Python\nprogram is represented by objects or by relations between objects. (In\na sense, and in conformance to Von Neumann\'s model of a "stored\nprogram computer," code is also represented by objects.)\n\nEvery object has an identity, a type and a value. An object\'s\n*identity* never changes once it has been created; you may think of it\nas the object\'s address in memory. The \'"is"\' operator compares the\nidentity of two objects; the "id()" function returns an integer\nrepresenting its identity (currently implemented as its address). An\nobject\'s *type* is also unchangeable. [1] An object\'s type determines\nthe operations that the object supports (e.g., "does it have a\nlength?") and also defines the possible values for objects of that\ntype. The "type()" function returns an object\'s type (which is an\nobject itself). The *value* of some objects can change. Objects\nwhose value can change are said to be *mutable*; objects whose value\nis unchangeable once they are created are called *immutable*. (The\nvalue of an immutable container object that contains a reference to a\nmutable object can change when the latter\'s value is changed; however\nthe container is still considered immutable, because the collection of\nobjects it contains cannot be changed. So, immutability is not\nstrictly the same as having an unchangeable value, it is more subtle.)\nAn object\'s mutability is determined by its type; for instance,\nnumbers, strings and tuples are immutable, while dictionaries and\nlists are mutable.\n\nObjects are never explicitly destroyed; however, when they become\nunreachable they may be garbage-collected. An implementation is\nallowed to postpone garbage collection or omit it altogether --- it is\na matter of implementation quality how garbage collection is\nimplemented, as long as no objects are collected that are still\nreachable.\n\n**CPython implementation detail:** CPython currently uses a reference-\ncounting scheme with (optional) delayed detection of cyclically linked\ngarbage, which collects most objects as soon as they become\nunreachable, but is not guaranteed to collect garbage containing\ncircular references. See the documentation of the "gc" module for\ninformation on controlling the collection of cyclic garbage. Other\nimplementations act differently and CPython may change. 
Do not depend\non immediate finalization of objects when they become unreachable (ex:\nalways close files).\n\nNote that the use of the implementation\'s tracing or debugging\nfacilities may keep objects alive that would normally be collectable.\nAlso note that catching an exception with a \'"try"..."except"\'\nstatement may keep objects alive.\n\nSome objects contain references to "external" resources such as open\nfiles or windows. It is understood that these resources are freed\nwhen the object is garbage-collected, but since garbage collection is\nnot guaranteed to happen, such objects also provide an explicit way to\nrelease the external resource, usually a "close()" method. Programs\nare strongly recommended to explicitly close such objects. The\n\'"try"..."finally"\' statement provides a convenient way to do this.\n\nSome objects contain references to other objects; these are called\n*containers*. Examples of containers are tuples, lists and\ndictionaries. The references are part of a container\'s value. In\nmost cases, when we talk about the value of a container, we imply the\nvalues, not the identities of the contained objects; however, when we\ntalk about the mutability of a container, only the identities of the\nimmediately contained objects are implied. So, if an immutable\ncontainer (like a tuple) contains a reference to a mutable object, its\nvalue changes if that mutable object is changed.\n\nTypes affect almost all aspects of object behavior. Even the\nimportance of object identity is affected in some sense: for immutable\ntypes, operations that compute new values may actually return a\nreference to any existing object with the same type and value, while\nfor mutable objects this is not allowed. E.g., after "a = 1; b = 1",\n"a" and "b" may or may not refer to the same object with the value\none, depending on the implementation, but after "c = []; d = []", "c"\nand "d" are guaranteed to refer to two different, unique, newly\ncreated empty lists. (Note that "c = d = []" assigns the same object\nto both "c" and "d".)\n', + 'operator-summary': u'\nOperator precedence\n*******************\n\nThe following table summarizes the operator precedences in Python,\nfrom lowest precedence (least binding) to highest precedence (most\nbinding). Operators in the same box have the same precedence. Unless\nthe syntax is explicitly given, operators are binary. 
Operators in\nthe same box group left to right (except for comparisons, including\ntests, which all have the same precedence and chain from left to right\n--- see section *Comparisons* --- and exponentiation, which groups\nfrom right to left).\n\n+-------------------------------------------------+---------------------------------------+\n| Operator | Description |\n+=================================================+=======================================+\n| "lambda" | Lambda expression |\n+-------------------------------------------------+---------------------------------------+\n| "if" -- "else" | Conditional expression |\n+-------------------------------------------------+---------------------------------------+\n| "or" | Boolean OR |\n+-------------------------------------------------+---------------------------------------+\n| "and" | Boolean AND |\n+-------------------------------------------------+---------------------------------------+\n| "not" "x" | Boolean NOT |\n+-------------------------------------------------+---------------------------------------+\n| "in", "not in", "is", "is not", "<", "<=", ">", | Comparisons, including membership |\n| ">=", "<>", "!=", "==" | tests and identity tests |\n+-------------------------------------------------+---------------------------------------+\n| "|" | Bitwise OR |\n+-------------------------------------------------+---------------------------------------+\n| "^" | Bitwise XOR |\n+-------------------------------------------------+---------------------------------------+\n| "&" | Bitwise AND |\n+-------------------------------------------------+---------------------------------------+\n| "<<", ">>" | Shifts |\n+-------------------------------------------------+---------------------------------------+\n| "+", "-" | Addition and subtraction |\n+-------------------------------------------------+---------------------------------------+\n| "*", "/", "//", "%" | Multiplication, division, remainder |\n| | [8] |\n+-------------------------------------------------+---------------------------------------+\n| "+x", "-x", "~x" | Positive, negative, bitwise NOT |\n+-------------------------------------------------+---------------------------------------+\n| "**" | Exponentiation [9] |\n+-------------------------------------------------+---------------------------------------+\n| "x[index]", "x[index:index]", | Subscription, slicing, call, |\n| "x(arguments...)", "x.attribute" | attribute reference |\n+-------------------------------------------------+---------------------------------------+\n| "(expressions...)", "[expressions...]", "{key: | Binding or tuple display, list |\n| value...}", "`expressions...`" | display, dictionary display, string |\n| | conversion |\n+-------------------------------------------------+---------------------------------------+\n\n-[ Footnotes ]-\n\n[1] In Python 2.3 and later releases, a list comprehension "leaks"\n the control variables of each "for" it contains into the\n containing scope. However, this behavior is deprecated, and\n relying on it will not work in Python 3.\n\n[2] While "abs(x%y) < abs(y)" is true mathematically, for floats\n it may not be true numerically due to roundoff. For example, and\n assuming a platform on which a Python float is an IEEE 754 double-\n precision number, in order that "-1e-100 % 1e100" have the same\n sign as "1e100", the computed result is "-1e-100 + 1e100", which\n is numerically exactly equal to "1e100". 
The function\n "math.fmod()" returns a result whose sign matches the sign of the\n first argument instead, and so returns "-1e-100" in this case.\n Which approach is more appropriate depends on the application.\n\n[3] If x is very close to an exact integer multiple of y, it\'s\n possible for "floor(x/y)" to be one larger than "(x-x%y)/y" due to\n rounding. In such cases, Python returns the latter result, in\n order to preserve that "divmod(x,y)[0] * y + x % y" be very close\n to "x".\n\n[4] While comparisons between unicode strings make sense at the\n byte level, they may be counter-intuitive to users. For example,\n the strings "u"\\u00C7"" and "u"\\u0043\\u0327"" compare differently,\n even though they both represent the same unicode character (LATIN\n CAPITAL LETTER C WITH CEDILLA). To compare strings in a human\n recognizable way, compare using "unicodedata.normalize()".\n\n[5] The implementation computes this efficiently, without\n constructing lists or sorting.\n\n[6] Earlier versions of Python used lexicographic comparison of\n the sorted (key, value) lists, but this was very expensive for the\n common case of comparing for equality. An even earlier version of\n Python compared dictionaries by identity only, but this caused\n surprises because people expected to be able to test a dictionary\n for emptiness by comparing it to "{}".\n\n[7] Due to automatic garbage-collection, free lists, and the\n dynamic nature of descriptors, you may notice seemingly unusual\n behaviour in certain uses of the "is" operator, like those\n involving comparisons between instance methods, or constants.\n Check their documentation for more info.\n\n[8] The "%" operator is also used for string formatting; the same\n precedence applies.\n\n[9] The power operator "**" binds less tightly than an arithmetic\n or bitwise unary operator on its right, that is, "2**-1" is "0.5".\n', + 'pass': u'\nThe "pass" statement\n********************\n\n pass_stmt ::= "pass"\n\n"pass" is a null operation --- when it is executed, nothing happens.\nIt is useful as a placeholder when a statement is required\nsyntactically, but no code needs to be executed, for example:\n\n def f(arg): pass # a function that does nothing (yet)\n\n class C: pass # a class with no methods (yet)\n', + 'power': u'\nThe power operator\n******************\n\nThe power operator binds more tightly than unary operators on its\nleft; it binds less tightly than unary operators on its right. The\nsyntax is:\n\n power ::= primary ["**" u_expr]\n\nThus, in an unparenthesized sequence of power and unary operators, the\noperators are evaluated from right to left (this does not constrain\nthe evaluation order for the operands): "-1**2" results in "-1".\n\nThe power operator has the same semantics as the built-in "pow()"\nfunction, when called with two arguments: it yields its left argument\nraised to the power of its right argument. The numeric arguments are\nfirst converted to a common type. The result type is that of the\narguments after coercion.\n\nWith mixed operand types, the coercion rules for binary arithmetic\noperators apply. For int and long int operands, the result has the\nsame type as the operands (after coercion) unless the second argument\nis negative; in that case, all arguments are converted to float and a\nfloat result is delivered. For example, "10**2" returns "100", but\n"10**-2" returns "0.01". 
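# A few concrete cases of the power-operator rules described above
# (right-to-left binding, float result for a negative exponent).
print 2 ** 3        # -> 8
print 10 ** -2      # -> 0.01, a float because the exponent is negative
print -1 ** 2       # -> -1, since "**" binds tighter than unary minus
print (-1) ** 2     # -> 1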
(This last feature was added in Python 2.2.\nIn Python 2.1 and before, if both arguments were of integer types and\nthe second argument was negative, an exception was raised).\n\nRaising "0.0" to a negative power results in a "ZeroDivisionError".\nRaising a negative number to a fractional power results in a\n"ValueError".\n', + 'print': u'\nThe "print" statement\n*********************\n\n print_stmt ::= "print" ([expression ("," expression)* [","]]\n | ">>" expression [("," expression)+ [","]])\n\n"print" evaluates each expression in turn and writes the resulting\nobject to standard output (see below). If an object is not a string,\nit is first converted to a string using the rules for string\nconversions. The (resulting or original) string is then written. A\nspace is written before each object is (converted and) written, unless\nthe output system believes it is positioned at the beginning of a\nline. This is the case (1) when no characters have yet been written\nto standard output, (2) when the last character written to standard\noutput is a whitespace character except "\' \'", or (3) when the last\nwrite operation on standard output was not a "print" statement. (In\nsome cases it may be functional to write an empty string to standard\noutput for this reason.)\n\nNote: Objects which act like file objects but which are not the\n built-in file objects often do not properly emulate this aspect of\n the file object\'s behavior, so it is best not to rely on this.\n\nA "\'\\n\'" character is written at the end, unless the "print" statement\nends with a comma. This is the only action if the statement contains\njust the keyword "print".\n\nStandard output is defined as the file object named "stdout" in the\nbuilt-in module "sys". If no such object exists, or if it does not\nhave a "write()" method, a "RuntimeError" exception is raised.\n\n"print" also has an extended form, defined by the second portion of\nthe syntax described above. This form is sometimes referred to as\n""print" chevron." In this form, the first expression after the ">>"\nmust evaluate to a "file-like" object, specifically an object that has\na "write()" method as described above. With this extended form, the\nsubsequent expressions are printed to this file object. If the first\nexpression evaluates to "None", then "sys.stdout" is used as the file\nfor output.\n', + 'raise': u'\nThe "raise" statement\n*********************\n\n raise_stmt ::= "raise" [expression ["," expression ["," expression]]]\n\nIf no expressions are present, "raise" re-raises the last exception\nthat was active in the current scope. If no exception is active in\nthe current scope, a "TypeError" exception is raised indicating that\nthis is an error (if running under IDLE, a "Queue.Empty" exception is\nraised instead).\n\nOtherwise, "raise" evaluates the expressions to get three objects,\nusing "None" as the value of omitted expressions. The first two\nobjects are used to determine the *type* and *value* of the exception.\n\nIf the first object is an instance, the type of the exception is the\nclass of the instance, the instance itself is the value, and the\nsecond object must be "None".\n\nIf the first object is a class, it becomes the type of the exception.\nThe second object is used to determine the exception value: If it is\nan instance of the class, the instance becomes the exception value. 
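# A brief sketch of the extended ("chevron") form of the "print" statement
# described above, writing to an explicit file-like object; StringIO is used
# here only as a convenient write() target.
from StringIO import StringIO

buf = StringIO()
print >> buf, "hello", "world"     # written to buf, not sys.stdout
print >> None, "back to stdout"    # None means sys.stdout
print buf.getvalue()               # buf now holds "hello world\n"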
If\nthe second object is a tuple, it is used as the argument list for the\nclass constructor; if it is "None", an empty argument list is used,\nand any other object is treated as a single argument to the\nconstructor. The instance so created by calling the constructor is\nused as the exception value.\n\nIf a third object is present and not "None", it must be a traceback\nobject (see section *The standard type hierarchy*), and it is\nsubstituted instead of the current location as the place where the\nexception occurred. If the third object is present and not a\ntraceback object or "None", a "TypeError" exception is raised. The\nthree-expression form of "raise" is useful to re-raise an exception\ntransparently in an except clause, but "raise" with no expressions\nshould be preferred if the exception to be re-raised was the most\nrecently active exception in the current scope.\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information about handling exceptions is in section\n*The try statement*.\n', + 'return': u'\nThe "return" statement\n**********************\n\n return_stmt ::= "return" [expression_list]\n\n"return" may only occur syntactically nested in a function definition,\nnot within a nested class definition.\n\nIf an expression list is present, it is evaluated, else "None" is\nsubstituted.\n\n"return" leaves the current function call with the expression list (or\n"None") as return value.\n\nWhen "return" passes control out of a "try" statement with a "finally"\nclause, that "finally" clause is executed before really leaving the\nfunction.\n\nIn a generator function, the "return" statement is not allowed to\ninclude an "expression_list". In that context, a bare "return"\nindicates that the generator is done and will cause "StopIteration" to\nbe raised.\n', + 'sequence-types': u'\nEmulating container types\n*************************\n\nThe following methods can be defined to implement container objects.\nContainers usually are sequences (such as lists or tuples) or mappings\n(like dictionaries), but can represent other containers as well. The\nfirst set of methods is used either to emulate a sequence or to\nemulate a mapping; the difference is that for a sequence, the\nallowable keys should be the integers *k* for which "0 <= k < N" where\n*N* is the length of the sequence, or slice objects, which define a\nrange of items. (For backwards compatibility, the method\n"__getslice__()" (see below) can also be defined to handle simple, but\nnot extended slices.) It is also recommended that mappings provide the\nmethods "keys()", "values()", "items()", "has_key()", "get()",\n"clear()", "setdefault()", "iterkeys()", "itervalues()",\n"iteritems()", "pop()", "popitem()", "copy()", and "update()" behaving\nsimilar to those for Python\'s standard dictionary objects. The\n"UserDict" module provides a "DictMixin" class to help create those\nmethods from a base set of "__getitem__()", "__setitem__()",\n"__delitem__()", and "keys()". Mutable sequences should provide\nmethods "append()", "count()", "index()", "extend()", "insert()",\n"pop()", "remove()", "reverse()" and "sort()", like Python standard\nlist objects. Finally, sequence types should implement addition\n(meaning concatenation) and multiplication (meaning repetition) by\ndefining the methods "__add__()", "__radd__()", "__iadd__()",\n"__mul__()", "__rmul__()" and "__imul__()" described below; they\nshould not define "__coerce__()" or other numerical operators. 
It is\nrecommended that both mappings and sequences implement the\n"__contains__()" method to allow efficient use of the "in" operator;\nfor mappings, "in" should be equivalent of "has_key()"; for sequences,\nit should search through the values. It is further recommended that\nboth mappings and sequences implement the "__iter__()" method to allow\nefficient iteration through the container; for mappings, "__iter__()"\nshould be the same as "iterkeys()"; for sequences, it should iterate\nthrough the values.\n\nobject.__len__(self)\n\n Called to implement the built-in function "len()". Should return\n the length of the object, an integer ">=" 0. Also, an object that\n doesn\'t define a "__nonzero__()" method and whose "__len__()"\n method returns zero is considered to be false in a Boolean context.\n\nobject.__getitem__(self, key)\n\n Called to implement evaluation of "self[key]". For sequence types,\n the accepted keys should be integers and slice objects. Note that\n the special interpretation of negative indexes (if the class wishes\n to emulate a sequence type) is up to the "__getitem__()" method. If\n *key* is of an inappropriate type, "TypeError" may be raised; if of\n a value outside the set of indexes for the sequence (after any\n special interpretation of negative values), "IndexError" should be\n raised. For mapping types, if *key* is missing (not in the\n container), "KeyError" should be raised.\n\n Note: "for" loops expect that an "IndexError" will be raised for\n illegal indexes to allow proper detection of the end of the\n sequence.\n\nobject.__setitem__(self, key, value)\n\n Called to implement assignment to "self[key]". Same note as for\n "__getitem__()". This should only be implemented for mappings if\n the objects support changes to the values for keys, or if new keys\n can be added, or for sequences if elements can be replaced. The\n same exceptions should be raised for improper *key* values as for\n the "__getitem__()" method.\n\nobject.__delitem__(self, key)\n\n Called to implement deletion of "self[key]". Same note as for\n "__getitem__()". This should only be implemented for mappings if\n the objects support removal of keys, or for sequences if elements\n can be removed from the sequence. The same exceptions should be\n raised for improper *key* values as for the "__getitem__()" method.\n\nobject.__iter__(self)\n\n This method is called when an iterator is required for a container.\n This method should return a new iterator object that can iterate\n over all the objects in the container. For mappings, it should\n iterate over the keys of the container, and should also be made\n available as the method "iterkeys()".\n\n Iterator objects also need to implement this method; they are\n required to return themselves. For more information on iterator\n objects, see *Iterator Types*.\n\nobject.__reversed__(self)\n\n Called (if present) by the "reversed()" built-in to implement\n reverse iteration. It should return a new iterator object that\n iterates over all the objects in the container in reverse order.\n\n If the "__reversed__()" method is not provided, the "reversed()"\n built-in will fall back to using the sequence protocol ("__len__()"\n and "__getitem__()"). 
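# A compact sketch of the sequence protocol described above: with only
# __len__() and __getitem__(), instances work with len(), indexing, "in",
# iteration and reversed().  The Range3 class is invented for illustration.
class Range3(object):
    def __len__(self):
        return 3

    def __getitem__(self, index):
        if not 0 <= index < 3:
            raise IndexError(index)
        return index * 10

r = Range3()
print len(r)             # -> 3
print list(r)            # -> [0, 10, 20]
print 20 in r            # -> True
print list(reversed(r))  # -> [20, 10, 0]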
Objects that support the sequence protocol\n should only provide "__reversed__()" if they can provide an\n implementation that is more efficient than the one provided by\n "reversed()".\n\n New in version 2.6.\n\nThe membership test operators ("in" and "not in") are normally\nimplemented as an iteration through a sequence. However, container\nobjects can supply the following special method with a more efficient\nimplementation, which also does not require the object be a sequence.\n\nobject.__contains__(self, item)\n\n Called to implement membership test operators. Should return true\n if *item* is in *self*, false otherwise. For mapping objects, this\n should consider the keys of the mapping rather than the values or\n the key-item pairs.\n\n For objects that don\'t define "__contains__()", the membership test\n first tries iteration via "__iter__()", then the old sequence\n iteration protocol via "__getitem__()", see *this section in the\n language reference*.\n', + 'shifting': u'\nShifting operations\n*******************\n\nThe shifting operations have lower priority than the arithmetic\noperations:\n\n shift_expr ::= a_expr | shift_expr ( "<<" | ">>" ) a_expr\n\nThese operators accept plain or long integers as arguments. The\narguments are converted to a common type. They shift the first\nargument to the left or right by the number of bits given by the\nsecond argument.\n\nA right shift by *n* bits is defined as division by "pow(2, n)". A\nleft shift by *n* bits is defined as multiplication with "pow(2, n)".\nNegative shift counts raise a "ValueError" exception.\n\nNote: In the current implementation, the right-hand operand is\n required to be at most "sys.maxsize". If the right-hand operand is\n larger than "sys.maxsize" an "OverflowError" exception is raised.\n', + 'slicings': u'\nSlicings\n********\n\nA slicing selects a range of items in a sequence object (e.g., a\nstring, tuple or list). Slicings may be used as expressions or as\ntargets in assignment or "del" statements. The syntax for a slicing:\n\n slicing ::= simple_slicing | extended_slicing\n simple_slicing ::= primary "[" short_slice "]"\n extended_slicing ::= primary "[" slice_list "]"\n slice_list ::= slice_item ("," slice_item)* [","]\n slice_item ::= expression | proper_slice | ellipsis\n proper_slice ::= short_slice | long_slice\n short_slice ::= [lower_bound] ":" [upper_bound]\n long_slice ::= short_slice ":" [stride]\n lower_bound ::= expression\n upper_bound ::= expression\n stride ::= expression\n ellipsis ::= "..."\n\nThere is ambiguity in the formal syntax here: anything that looks like\nan expression list also looks like a slice list, so any subscription\ncan be interpreted as a slicing. Rather than further complicating the\nsyntax, this is disambiguated by defining that in this case the\ninterpretation as a subscription takes priority over the\ninterpretation as a slicing (this is the case if the slice list\ncontains no proper slice nor ellipses). Similarly, when the slice\nlist has exactly one short slice and no trailing comma, the\ninterpretation as a simple slicing takes priority over that as an\nextended slicing.\n\nThe semantics for a simple slicing are as follows. The primary must\nevaluate to a sequence object. The lower and upper bound expressions,\nif present, must evaluate to plain integers; defaults are zero and the\n"sys.maxint", respectively. If either bound is negative, the\nsequence\'s length is added to it. 
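# A handful of simple-slicing cases matching the semantics described above
# (defaults for missing bounds, negative bounds, harmless out-of-range bounds).
s = "abcdef"
print s[1:4]      # -> "bcd"
print s[:3]       # -> "abc"   (missing lower bound defaults to 0)
print s[-2:]      # -> "ef"    (negative bound: the length is added to it)
print s[2:100]    # -> "cdef"  (out-of-range upper bound is not an error)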
The slicing now selects all items\nwith index *k* such that "i <= k < j" where *i* and *j* are the\nspecified lower and upper bounds. This may be an empty sequence. It\nis not an error if *i* or *j* lie outside the range of valid indexes\n(such items don\'t exist so they aren\'t selected).\n\nThe semantics for an extended slicing are as follows. The primary\nmust evaluate to a mapping object, and it is indexed with a key that\nis constructed from the slice list, as follows. If the slice list\ncontains at least one comma, the key is a tuple containing the\nconversion of the slice items; otherwise, the conversion of the lone\nslice item is the key. The conversion of a slice item that is an\nexpression is that expression. The conversion of an ellipsis slice\nitem is the built-in "Ellipsis" object. The conversion of a proper\nslice is a slice object (see section *The standard type hierarchy*)\nwhose "start", "stop" and "step" attributes are the values of the\nexpressions given as lower bound, upper bound and stride,\nrespectively, substituting "None" for missing expressions.\n', + 'specialattrs': u'\nSpecial Attributes\n******************\n\nThe implementation adds a few special read-only attributes to several\nobject types, where they are relevant. Some of these are not reported\nby the "dir()" built-in function.\n\nobject.__dict__\n\n A dictionary or other mapping object used to store an object\'s\n (writable) attributes.\n\nobject.__methods__\n\n Deprecated since version 2.2: Use the built-in function "dir()" to\n get a list of an object\'s attributes. This attribute is no longer\n available.\n\nobject.__members__\n\n Deprecated since version 2.2: Use the built-in function "dir()" to\n get a list of an object\'s attributes. This attribute is no longer\n available.\n\ninstance.__class__\n\n The class to which a class instance belongs.\n\nclass.__bases__\n\n The tuple of base classes of a class object.\n\nclass.__name__\n\n The name of the class or type.\n\nThe following attributes are only supported by *new-style class*es.\n\nclass.__mro__\n\n This attribute is a tuple of classes that are considered when\n looking for base classes during method resolution.\n\nclass.mro()\n\n This method can be overridden by a metaclass to customize the\n method resolution order for its instances. It is called at class\n instantiation, and its result is stored in "__mro__".\n\nclass.__subclasses__()\n\n Each new-style class keeps a list of weak references to its\n immediate subclasses. This method returns a list of all those\n references still alive. Example:\n\n >>> int.__subclasses__()\n []\n\n-[ Footnotes ]-\n\n[1] Additional information on these special methods may be found\n in the Python Reference Manual (*Basic customization*).\n\n[2] As a consequence, the list "[1, 2]" is considered equal to\n "[1.0, 2.0]", and similarly for tuples.\n\n[3] They must have since the parser can\'t tell the type of the\n operands.\n\n[4] Cased characters are those with general category property\n being one of "Lu" (Letter, uppercase), "Ll" (Letter, lowercase),\n or "Lt" (Letter, titlecase).\n\n[5] To format only a tuple you should therefore provide a\n singleton tuple whose only element is the tuple to be formatted.\n\n[6] The advantage of leaving the newline on is that returning an\n empty string is then an unambiguous EOF indication. 
It is also\n possible (in cases where it might matter, for example, if you want\n to make an exact copy of a file while scanning its lines) to tell\n whether the last line of a file ended in a newline or not (yes\n this happens!).\n', + 'specialnames': u'\nSpecial method names\n********************\n\nA class can implement certain operations that are invoked by special\nsyntax (such as arithmetic operations or subscripting and slicing) by\ndefining methods with special names. This is Python\'s approach to\n*operator overloading*, allowing classes to define their own behavior\nwith respect to language operators. For instance, if a class defines\na method named "__getitem__()", and "x" is an instance of this class,\nthen "x[i]" is roughly equivalent to "x.__getitem__(i)" for old-style\nclasses and "type(x).__getitem__(x, i)" for new-style classes. Except\nwhere mentioned, attempts to execute an operation raise an exception\nwhen no appropriate method is defined (typically "AttributeError" or\n"TypeError").\n\nWhen implementing a class that emulates any built-in type, it is\nimportant that the emulation only be implemented to the degree that it\nmakes sense for the object being modelled. For example, some\nsequences may work well with retrieval of individual elements, but\nextracting a slice may not make sense. (One example of this is the\n"NodeList" interface in the W3C\'s Document Object Model.)\n\n\nBasic customization\n===================\n\nobject.__new__(cls[, ...])\n\n Called to create a new instance of class *cls*. "__new__()" is a\n static method (special-cased so you need not declare it as such)\n that takes the class of which an instance was requested as its\n first argument. The remaining arguments are those passed to the\n object constructor expression (the call to the class). The return\n value of "__new__()" should be the new object instance (usually an\n instance of *cls*).\n\n Typical implementations create a new instance of the class by\n invoking the superclass\'s "__new__()" method using\n "super(currentclass, cls).__new__(cls[, ...])" with appropriate\n arguments and then modifying the newly-created instance as\n necessary before returning it.\n\n If "__new__()" returns an instance of *cls*, then the new\n instance\'s "__init__()" method will be invoked like\n "__init__(self[, ...])", where *self* is the new instance and the\n remaining arguments are the same as were passed to "__new__()".\n\n If "__new__()" does not return an instance of *cls*, then the new\n instance\'s "__init__()" method will not be invoked.\n\n "__new__()" is intended mainly to allow subclasses of immutable\n types (like int, str, or tuple) to customize instance creation. It\n is also commonly overridden in custom metaclasses in order to\n customize class creation.\n\nobject.__init__(self[, ...])\n\n Called when the instance is created. The arguments are those\n passed to the class constructor expression. If a base class has an\n "__init__()" method, the derived class\'s "__init__()" method, if\n any, must explicitly call it to ensure proper initialization of the\n base class part of the instance; for example:\n "BaseClass.__init__(self, [args...])". As a special constraint on\n constructors, no value may be returned; doing so will cause a\n "TypeError" to be raised at runtime.\n\nobject.__del__(self)\n\n Called when the instance is about to be destroyed. This is also\n called a destructor. 
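As a brief, hedged sketch of the point above that "__new__()" mainly serves subclasses of immutable types (the `Inches` class is made up for this example), the value is chosen in "__new__()" because an "int" instance cannot be changed afterwards in "__init__()":

    class Inches(int):
        """int subclass whose value is fixed in __new__()."""

        def __new__(cls, feet):
            # The immutable value must be chosen before the instance
            # exists, so the conversion happens here, not in __init__().
            return super(Inches, cls).__new__(cls, feet * 12)

    length = Inches(3)
    assert isinstance(length, int)
    assert length == 36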
If a base class has a "__del__()" method, the\n derived class\'s "__del__()" method, if any, must explicitly call it\n to ensure proper deletion of the base class part of the instance.\n Note that it is possible (though not recommended!) for the\n "__del__()" method to postpone destruction of the instance by\n creating a new reference to it. It may then be called at a later\n time when this new reference is deleted. It is not guaranteed that\n "__del__()" methods are called for objects that still exist when\n the interpreter exits.\n\n Note: "del x" doesn\'t directly call "x.__del__()" --- the former\n decrements the reference count for "x" by one, and the latter is\n only called when "x"\'s reference count reaches zero. Some common\n situations that may prevent the reference count of an object from\n going to zero include: circular references between objects (e.g.,\n a doubly-linked list or a tree data structure with parent and\n child pointers); a reference to the object on the stack frame of\n a function that caught an exception (the traceback stored in\n "sys.exc_traceback" keeps the stack frame alive); or a reference\n to the object on the stack frame that raised an unhandled\n exception in interactive mode (the traceback stored in\n "sys.last_traceback" keeps the stack frame alive). The first\n situation can only be remedied by explicitly breaking the cycles;\n the latter two situations can be resolved by storing "None" in\n "sys.exc_traceback" or "sys.last_traceback". Circular references\n which are garbage are detected when the option cycle detector is\n enabled (it\'s on by default), but can only be cleaned up if there\n are no Python-level "__del__()" methods involved. Refer to the\n documentation for the "gc" module for more information about how\n "__del__()" methods are handled by the cycle detector,\n particularly the description of the "garbage" value.\n\n Warning: Due to the precarious circumstances under which\n "__del__()" methods are invoked, exceptions that occur during\n their execution are ignored, and a warning is printed to\n "sys.stderr" instead. Also, when "__del__()" is invoked in\n response to a module being deleted (e.g., when execution of the\n program is done), other globals referenced by the "__del__()"\n method may already have been deleted or in the process of being\n torn down (e.g. the import machinery shutting down). For this\n reason, "__del__()" methods should do the absolute minimum needed\n to maintain external invariants. Starting with version 1.5,\n Python guarantees that globals whose name begins with a single\n underscore are deleted from their module before other globals are\n deleted; if no other references to such globals exist, this may\n help in assuring that imported modules are still available at the\n time when the "__del__()" method is called.\n\n See also the *-R* command-line option.\n\nobject.__repr__(self)\n\n Called by the "repr()" built-in function and by string conversions\n (reverse quotes) to compute the "official" string representation of\n an object. If at all possible, this should look like a valid\n Python expression that could be used to recreate an object with the\n same value (given an appropriate environment). If this is not\n possible, a string of the form "<...some useful description...>"\n should be returned. The return value must be a string object. 
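A minimal sketch of the "__repr__()" convention described above (the `Point` class is invented for the example): the representation reads like an expression that recreates the object, and, as noted below, it also serves as the informal representation when no "__str__()" is defined.

    class Point(object):
        def __init__(self, x, y):
            self.x, self.y = x, y

        def __repr__(self):
            # Looks like a valid expression that recreates the object.
            return 'Point(%r, %r)' % (self.x, self.y)

    p = Point(2, 5)
    assert repr(p) == 'Point(2, 5)'
    assert str(p) == repr(p)          # no __str__(), so __repr__() is reused
    assert eval(repr(p)).x == 2       # round-trips in this simple case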
If a\n class defines "__repr__()" but not "__str__()", then "__repr__()"\n is also used when an "informal" string representation of instances\n of that class is required.\n\n This is typically used for debugging, so it is important that the\n representation is information-rich and unambiguous.\n\nobject.__str__(self)\n\n Called by the "str()" built-in function and by the "print"\n statement to compute the "informal" string representation of an\n object. This differs from "__repr__()" in that it does not have to\n be a valid Python expression: a more convenient or concise\n representation may be used instead. The return value must be a\n string object.\n\nobject.__lt__(self, other)\nobject.__le__(self, other)\nobject.__eq__(self, other)\nobject.__ne__(self, other)\nobject.__gt__(self, other)\nobject.__ge__(self, other)\n\n New in version 2.1.\n\n These are the so-called "rich comparison" methods, and are called\n for comparison operators in preference to "__cmp__()" below. The\n correspondence between operator symbols and method names is as\n follows: "xy" call "x.__ne__(y)",\n "x>y" calls "x.__gt__(y)", and "x>=y" calls "x.__ge__(y)".\n\n A rich comparison method may return the singleton "NotImplemented"\n if it does not implement the operation for a given pair of\n arguments. By convention, "False" and "True" are returned for a\n successful comparison. However, these methods can return any value,\n so if the comparison operator is used in a Boolean context (e.g.,\n in the condition of an "if" statement), Python will call "bool()"\n on the value to determine if the result is true or false.\n\n There are no implied relationships among the comparison operators.\n The truth of "x==y" does not imply that "x!=y" is false.\n Accordingly, when defining "__eq__()", one should also define\n "__ne__()" so that the operators will behave as expected. See the\n paragraph on "__hash__()" for some important notes on creating\n *hashable* objects which support custom comparison operations and\n are usable as dictionary keys.\n\n There are no swapped-argument versions of these methods (to be used\n when the left argument does not support the operation but the right\n argument does); rather, "__lt__()" and "__gt__()" are each other\'s\n reflection, "__le__()" and "__ge__()" are each other\'s reflection,\n and "__eq__()" and "__ne__()" are their own reflection.\n\n Arguments to rich comparison methods are never coerced.\n\n To automatically generate ordering operations from a single root\n operation, see "functools.total_ordering()".\n\nobject.__cmp__(self, other)\n\n Called by comparison operations if rich comparison (see above) is\n not defined. Should return a negative integer if "self < other",\n zero if "self == other", a positive integer if "self > other". If\n no "__cmp__()", "__eq__()" or "__ne__()" operation is defined,\n class instances are compared by object identity ("address"). See\n also the description of "__hash__()" for some important notes on\n creating *hashable* objects which support custom comparison\n operations and are usable as dictionary keys. (Note: the\n restriction that exceptions are not propagated by "__cmp__()" has\n been removed since Python 1.5.)\n\nobject.__rcmp__(self, other)\n\n Changed in version 2.1: No longer supported.\n\nobject.__hash__(self)\n\n Called by built-in function "hash()" and for operations on members\n of hashed collections including "set", "frozenset", and "dict".\n "__hash__()" should return an integer. 
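To make the interaction between the rich comparison methods and "__hash__()" concrete, here is a hedged sketch (the `Version` class is invented for this example): "__eq__()" and "__lt__()" return "NotImplemented" for foreign types, "__ne__()" is defined alongside "__eq__()" as recommended above, "functools.total_ordering()" supplies the remaining order methods, and the hash is derived from the same key used for comparison.

    import functools

    @functools.total_ordering
    class Version(object):
        def __init__(self, major, minor):
            self._key = (major, minor)

        def __eq__(self, other):
            if not isinstance(other, Version):
                return NotImplemented
            return self._key == other._key

        def __ne__(self, other):
            result = self.__eq__(other)
            return result if result is NotImplemented else not result

        def __lt__(self, other):
            if not isinstance(other, Version):
                return NotImplemented
            return self._key < other._key

        def __hash__(self):
            # Objects that compare equal must hash equal, so hash the
            # same key that the comparisons use.
            return hash(self._key)

    assert Version(2, 7) == Version(2, 7)
    assert Version(2, 6) < Version(2, 7) <= Version(3, 0)
    assert len({Version(2, 7), Version(2, 7)}) == 1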
The only required property\n is that objects which compare equal have the same hash value; it is\n advised to somehow mix together (e.g. using exclusive or) the hash\n values for the components of the object that also play a part in\n comparison of objects.\n\n If a class does not define a "__cmp__()" or "__eq__()" method it\n should not define a "__hash__()" operation either; if it defines\n "__cmp__()" or "__eq__()" but not "__hash__()", its instances will\n not be usable in hashed collections. If a class defines mutable\n objects and implements a "__cmp__()" or "__eq__()" method, it\n should not implement "__hash__()", since hashable collection\n implementations require that a object\'s hash value is immutable (if\n the object\'s hash value changes, it will be in the wrong hash\n bucket).\n\n User-defined classes have "__cmp__()" and "__hash__()" methods by\n default; with them, all objects compare unequal (except with\n themselves) and "x.__hash__()" returns a result derived from\n "id(x)".\n\n Classes which inherit a "__hash__()" method from a parent class but\n change the meaning of "__cmp__()" or "__eq__()" such that the hash\n value returned is no longer appropriate (e.g. by switching to a\n value-based concept of equality instead of the default identity\n based equality) can explicitly flag themselves as being unhashable\n by setting "__hash__ = None" in the class definition. Doing so\n means that not only will instances of the class raise an\n appropriate "TypeError" when a program attempts to retrieve their\n hash value, but they will also be correctly identified as\n unhashable when checking "isinstance(obj, collections.Hashable)"\n (unlike classes which define their own "__hash__()" to explicitly\n raise "TypeError").\n\n Changed in version 2.5: "__hash__()" may now also return a long\n integer object; the 32-bit integer is then derived from the hash of\n that object.\n\n Changed in version 2.6: "__hash__" may now be set to "None" to\n explicitly flag instances of a class as unhashable.\n\nobject.__nonzero__(self)\n\n Called to implement truth value testing and the built-in operation\n "bool()"; should return "False" or "True", or their integer\n equivalents "0" or "1". When this method is not defined,\n "__len__()" is called, if it is defined, and the object is\n considered true if its result is nonzero. If a class defines\n neither "__len__()" nor "__nonzero__()", all its instances are\n considered true.\n\nobject.__unicode__(self)\n\n Called to implement "unicode()" built-in; should return a Unicode\n object. When this method is not defined, string conversion is\n attempted, and the result of string conversion is converted to\n Unicode using the system default encoding.\n\n\nCustomizing attribute access\n============================\n\nThe following methods can be defined to customize the meaning of\nattribute access (use of, assignment to, or deletion of "x.name") for\nclass instances.\n\nobject.__getattr__(self, name)\n\n Called when an attribute lookup has not found the attribute in the\n usual places (i.e. it is not an instance attribute nor is it found\n in the class tree for "self"). "name" is the attribute name. This\n method should return the (computed) attribute value or raise an\n "AttributeError" exception.\n\n Note that if the attribute is found through the normal mechanism,\n "__getattr__()" is not called. (This is an intentional asymmetry\n between "__getattr__()" and "__setattr__()".) 
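The asymmetry just mentioned, and the "__setattr__()" recursion pitfall described below, can be sketched with an invented `Record` class (all names here are for illustration only): "__getattr__()" is consulted only for missing attributes, while writes go through "self.__dict__" to avoid re-entering "__setattr__()".

    class Record(object):
        def __init__(self, **fields):
            # Write through __dict__ directly; ordinary attribute
            # assignment here would call __setattr__() recursively.
            self.__dict__['_fields'] = dict(fields)

        def __getattr__(self, name):
            # Only called when normal lookup has already failed.
            try:
                return self._fields[name]
            except KeyError:
                raise AttributeError(name)

        def __setattr__(self, name, value):
            self._fields[name] = value

    r = Record(host='example.org')
    assert r.host == 'example.org'      # served by __getattr__()
    r.port = 8080                       # routed through __setattr__()
    assert r._fields['port'] == 8080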
This is done both for\n efficiency reasons and because otherwise "__getattr__()" would have\n no way to access other attributes of the instance. Note that at\n least for instance variables, you can fake total control by not\n inserting any values in the instance attribute dictionary (but\n instead inserting them in another object). See the\n "__getattribute__()" method below for a way to actually get total\n control in new-style classes.\n\nobject.__setattr__(self, name, value)\n\n Called when an attribute assignment is attempted. This is called\n instead of the normal mechanism (i.e. store the value in the\n instance dictionary). *name* is the attribute name, *value* is the\n value to be assigned to it.\n\n If "__setattr__()" wants to assign to an instance attribute, it\n should not simply execute "self.name = value" --- this would cause\n a recursive call to itself. Instead, it should insert the value in\n the dictionary of instance attributes, e.g., "self.__dict__[name] =\n value". For new-style classes, rather than accessing the instance\n dictionary, it should call the base class method with the same\n name, for example, "object.__setattr__(self, name, value)".\n\nobject.__delattr__(self, name)\n\n Like "__setattr__()" but for attribute deletion instead of\n assignment. This should only be implemented if "del obj.name" is\n meaningful for the object.\n\n\nMore attribute access for new-style classes\n-------------------------------------------\n\nThe following methods only apply to new-style classes.\n\nobject.__getattribute__(self, name)\n\n Called unconditionally to implement attribute accesses for\n instances of the class. If the class also defines "__getattr__()",\n the latter will not be called unless "__getattribute__()" either\n calls it explicitly or raises an "AttributeError". This method\n should return the (computed) attribute value or raise an\n "AttributeError" exception. In order to avoid infinite recursion in\n this method, its implementation should always call the base class\n method with the same name to access any attributes it needs, for\n example, "object.__getattribute__(self, name)".\n\n Note: This method may still be bypassed when looking up special\n methods as the result of implicit invocation via language syntax\n or built-in functions. See *Special method lookup for new-style\n classes*.\n\n\nImplementing Descriptors\n------------------------\n\nThe following methods only apply when an instance of the class\ncontaining the method (a so-called *descriptor* class) appears in an\n*owner* class (the descriptor must be in either the owner\'s class\ndictionary or in the class dictionary for one of its parents). In the\nexamples below, "the attribute" refers to the attribute whose name is\nthe key of the property in the owner class\' "__dict__".\n\nobject.__get__(self, instance, owner)\n\n Called to get the attribute of the owner class (class attribute\n access) or of an instance of that class (instance attribute\n access). *owner* is always the owner class, while *instance* is the\n instance that the attribute was accessed through, or "None" when\n the attribute is accessed through the *owner*. 
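A hedged sketch of the descriptor protocol being described here (the `Positive` and `Account` names are invented): because the descriptor defines both "__get__()" and "__set__()" it is a data descriptor, and attribute access on `Account` instances is routed through it.

    class Positive(object):
        """Data descriptor that only accepts values greater than zero."""

        def __init__(self, name):
            self.name = name                 # key used in the instance __dict__

        def __get__(self, instance, owner):
            if instance is None:
                return self                  # accessed on the owner class itself
            return instance.__dict__[self.name]

        def __set__(self, instance, value):
            if value <= 0:
                raise ValueError('%s must be positive' % self.name)
            instance.__dict__[self.name] = value

    class Account(object):
        balance = Positive('balance')

    a = Account()
    a.balance = 10
    assert a.balance == 10
    assert isinstance(Account.balance, Positive)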
This method should\n return the (computed) attribute value or raise an "AttributeError"\n exception.\n\nobject.__set__(self, instance, value)\n\n Called to set the attribute on an instance *instance* of the owner\n class to a new value, *value*.\n\nobject.__delete__(self, instance)\n\n Called to delete the attribute on an instance *instance* of the\n owner class.\n\n\nInvoking Descriptors\n--------------------\n\nIn general, a descriptor is an object attribute with "binding\nbehavior", one whose attribute access has been overridden by methods\nin the descriptor protocol: "__get__()", "__set__()", and\n"__delete__()". If any of those methods are defined for an object, it\nis said to be a descriptor.\n\nThe default behavior for attribute access is to get, set, or delete\nthe attribute from an object\'s dictionary. For instance, "a.x" has a\nlookup chain starting with "a.__dict__[\'x\']", then\n"type(a).__dict__[\'x\']", and continuing through the base classes of\n"type(a)" excluding metaclasses.\n\nHowever, if the looked-up value is an object defining one of the\ndescriptor methods, then Python may override the default behavior and\ninvoke the descriptor method instead. Where this occurs in the\nprecedence chain depends on which descriptor methods were defined and\nhow they were called. Note that descriptors are only invoked for new\nstyle objects or classes (ones that subclass "object()" or "type()").\n\nThe starting point for descriptor invocation is a binding, "a.x". How\nthe arguments are assembled depends on "a":\n\nDirect Call\n The simplest and least common call is when user code directly\n invokes a descriptor method: "x.__get__(a)".\n\nInstance Binding\n If binding to a new-style object instance, "a.x" is transformed\n into the call: "type(a).__dict__[\'x\'].__get__(a, type(a))".\n\nClass Binding\n If binding to a new-style class, "A.x" is transformed into the\n call: "A.__dict__[\'x\'].__get__(None, A)".\n\nSuper Binding\n If "a" is an instance of "super", then the binding "super(B,\n obj).m()" searches "obj.__class__.__mro__" for the base class "A"\n immediately preceding "B" and then invokes the descriptor with the\n call: "A.__dict__[\'m\'].__get__(obj, obj.__class__)".\n\nFor instance bindings, the precedence of descriptor invocation depends\non the which descriptor methods are defined. A descriptor can define\nany combination of "__get__()", "__set__()" and "__delete__()". If it\ndoes not define "__get__()", then accessing the attribute will return\nthe descriptor object itself unless there is a value in the object\'s\ninstance dictionary. If the descriptor defines "__set__()" and/or\n"__delete__()", it is a data descriptor; if it defines neither, it is\na non-data descriptor. Normally, data descriptors define both\n"__get__()" and "__set__()", while non-data descriptors have just the\n"__get__()" method. Data descriptors with "__set__()" and "__get__()"\ndefined always override a redefinition in an instance dictionary. In\ncontrast, non-data descriptors can be overridden by instances.\n\nPython methods (including "staticmethod()" and "classmethod()") are\nimplemented as non-data descriptors. Accordingly, instances can\nredefine and override methods. 
This allows individual instances to\nacquire behaviors that differ from other instances of the same class.\n\nThe "property()" function is implemented as a data descriptor.\nAccordingly, instances cannot override the behavior of a property.\n\n\n__slots__\n---------\n\nBy default, instances of both old and new-style classes have a\ndictionary for attribute storage. This wastes space for objects\nhaving very few instance variables. The space consumption can become\nacute when creating large numbers of instances.\n\nThe default can be overridden by defining *__slots__* in a new-style\nclass definition. The *__slots__* declaration takes a sequence of\ninstance variables and reserves just enough space in each instance to\nhold a value for each variable. Space is saved because *__dict__* is\nnot created for each instance.\n\n__slots__\n\n This class variable can be assigned a string, iterable, or sequence\n of strings with variable names used by instances. If defined in a\n new-style class, *__slots__* reserves space for the declared\n variables and prevents the automatic creation of *__dict__* and\n *__weakref__* for each instance.\n\n New in version 2.2.\n\nNotes on using *__slots__*\n\n* When inheriting from a class without *__slots__*, the *__dict__*\n attribute of that class will always be accessible, so a *__slots__*\n definition in the subclass is meaningless.\n\n* Without a *__dict__* variable, instances cannot be assigned new\n variables not listed in the *__slots__* definition. Attempts to\n assign to an unlisted variable name raises "AttributeError". If\n dynamic assignment of new variables is desired, then add\n "\'__dict__\'" to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding "\'__dict__\'" to the\n *__slots__* declaration would not enable the assignment of new\n attributes not specifically listed in the sequence of instance\n variable names.\n\n* Without a *__weakref__* variable for each instance, classes\n defining *__slots__* do not support weak references to its\n instances. If weak reference support is needed, then add\n "\'__weakref__\'" to the sequence of strings in the *__slots__*\n declaration.\n\n Changed in version 2.3: Previously, adding "\'__weakref__\'" to the\n *__slots__* declaration would not enable support for weak\n references.\n\n* *__slots__* are implemented at the class level by creating\n descriptors (*Implementing Descriptors*) for each variable name. As\n a result, class attributes cannot be used to set default values for\n instance variables defined by *__slots__*; otherwise, the class\n attribute would overwrite the descriptor assignment.\n\n* The action of a *__slots__* declaration is limited to the class\n where it is defined. As a result, subclasses will have a *__dict__*\n unless they also define *__slots__* (which must only contain names\n of any *additional* slots).\n\n* If a class defines a slot also defined in a base class, the\n instance variable defined by the base class slot is inaccessible\n (except by retrieving its descriptor directly from the base class).\n This renders the meaning of the program undefined. In the future, a\n check may be added to prevent this.\n\n* Nonempty *__slots__* does not work for classes derived from\n "variable-length" built-in types such as "long", "str" and "tuple".\n\n* Any non-string iterable may be assigned to *__slots__*. 
Mappings\n may also be used; however, in the future, special meaning may be\n assigned to the values corresponding to each key.\n\n* *__class__* assignment works only if both classes have the same\n *__slots__*.\n\n Changed in version 2.6: Previously, *__class__* assignment raised an\n error if either new or old class had *__slots__*.\n\n\nCustomizing class creation\n==========================\n\nBy default, new-style classes are constructed using "type()". A class\ndefinition is read into a separate namespace and the value of class\nname is bound to the result of "type(name, bases, dict)".\n\nWhen the class definition is read, if *__metaclass__* is defined then\nthe callable assigned to it will be called instead of "type()". This\nallows classes or functions to be written which monitor or alter the\nclass creation process:\n\n* Modifying the class dictionary prior to the class being created.\n\n* Returning an instance of another class -- essentially performing\n the role of a factory function.\n\nThese steps will have to be performed in the metaclass\'s "__new__()"\nmethod -- "type.__new__()" can then be called from this method to\ncreate a class with different properties. This example adds a new\nelement to the class dictionary before creating the class:\n\n class metacls(type):\n def __new__(mcs, name, bases, dict):\n dict[\'foo\'] = \'metacls was here\'\n return type.__new__(mcs, name, bases, dict)\n\nYou can of course also override other class methods (or add new\nmethods); for example defining a custom "__call__()" method in the\nmetaclass allows custom behavior when the class is called, e.g. not\nalways creating a new instance.\n\n__metaclass__\n\n This variable can be any callable accepting arguments for "name",\n "bases", and "dict". Upon class creation, the callable is used\n instead of the built-in "type()".\n\n New in version 2.2.\n\nThe appropriate metaclass is determined by the following precedence\nrules:\n\n* If "dict[\'__metaclass__\']" exists, it is used.\n\n* Otherwise, if there is at least one base class, its metaclass is\n used (this looks for a *__class__* attribute first and if not found,\n uses its type).\n\n* Otherwise, if a global variable named __metaclass__ exists, it is\n used.\n\n* Otherwise, the old-style, classic metaclass (types.ClassType) is\n used.\n\nThe potential uses for metaclasses are boundless. Some ideas that have\nbeen explored including logging, interface checking, automatic\ndelegation, automatic property creation, proxies, frameworks, and\nautomatic resource locking/synchronization.\n\n\nCustomizing instance and subclass checks\n========================================\n\nNew in version 2.6.\n\nThe following methods are used to override the default behavior of the\n"isinstance()" and "issubclass()" built-in functions.\n\nIn particular, the metaclass "abc.ABCMeta" implements these methods in\norder to allow the addition of Abstract Base Classes (ABCs) as\n"virtual base classes" to any class or type (including built-in\ntypes), including other ABCs.\n\nclass.__instancecheck__(self, instance)\n\n Return true if *instance* should be considered a (direct or\n indirect) instance of *class*. If defined, called to implement\n "isinstance(instance, class)".\n\nclass.__subclasscheck__(self, subclass)\n\n Return true if *subclass* should be considered a (direct or\n indirect) subclass of *class*. If defined, called to implement\n "issubclass(subclass, class)".\n\nNote that these methods are looked up on the type (metaclass) of a\nclass. 
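As a hedged sketch of these hooks in practice (the class names are invented for the example), "abc.ABCMeta" uses "__instancecheck__()" and "__subclasscheck__()" so that a registered class is reported as a virtual subclass even though it does not inherit from the ABC; note the Python 2 "__metaclass__" spelling discussed above.

    import abc

    class Serializer(object):
        __metaclass__ = abc.ABCMeta          # ABCMeta supplies the check hooks

    class JSONSerializer(object):            # not a real subclass of Serializer
        def dump(self, obj):
            return '{}'

    Serializer.register(JSONSerializer)

    assert issubclass(JSONSerializer, Serializer)
    assert isinstance(JSONSerializer(), Serializer)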
They cannot be defined as class methods in the actual class.\nThis is consistent with the lookup of special methods that are called\non instances, only in this case the instance is itself a class.\n\nSee also: **PEP 3119** - Introducing Abstract Base Classes\n\n Includes the specification for customizing "isinstance()" and\n "issubclass()" behavior through "__instancecheck__()" and\n "__subclasscheck__()", with motivation for this functionality in\n the context of adding Abstract Base Classes (see the "abc"\n module) to the language.\n\n\nEmulating callable objects\n==========================\n\nobject.__call__(self[, args...])\n\n Called when the instance is "called" as a function; if this method\n is defined, "x(arg1, arg2, ...)" is a shorthand for\n "x.__call__(arg1, arg2, ...)".\n\n\nEmulating container types\n=========================\n\nThe following methods can be defined to implement container objects.\nContainers usually are sequences (such as lists or tuples) or mappings\n(like dictionaries), but can represent other containers as well. The\nfirst set of methods is used either to emulate a sequence or to\nemulate a mapping; the difference is that for a sequence, the\nallowable keys should be the integers *k* for which "0 <= k < N" where\n*N* is the length of the sequence, or slice objects, which define a\nrange of items. (For backwards compatibility, the method\n"__getslice__()" (see below) can also be defined to handle simple, but\nnot extended slices.) It is also recommended that mappings provide the\nmethods "keys()", "values()", "items()", "has_key()", "get()",\n"clear()", "setdefault()", "iterkeys()", "itervalues()",\n"iteritems()", "pop()", "popitem()", "copy()", and "update()" behaving\nsimilar to those for Python\'s standard dictionary objects. The\n"UserDict" module provides a "DictMixin" class to help create those\nmethods from a base set of "__getitem__()", "__setitem__()",\n"__delitem__()", and "keys()". Mutable sequences should provide\nmethods "append()", "count()", "index()", "extend()", "insert()",\n"pop()", "remove()", "reverse()" and "sort()", like Python standard\nlist objects. Finally, sequence types should implement addition\n(meaning concatenation) and multiplication (meaning repetition) by\ndefining the methods "__add__()", "__radd__()", "__iadd__()",\n"__mul__()", "__rmul__()" and "__imul__()" described below; they\nshould not define "__coerce__()" or other numerical operators. It is\nrecommended that both mappings and sequences implement the\n"__contains__()" method to allow efficient use of the "in" operator;\nfor mappings, "in" should be equivalent of "has_key()"; for sequences,\nit should search through the values. It is further recommended that\nboth mappings and sequences implement the "__iter__()" method to allow\nefficient iteration through the container; for mappings, "__iter__()"\nshould be the same as "iterkeys()"; for sequences, it should iterate\nthrough the values.\n\nobject.__len__(self)\n\n Called to implement the built-in function "len()". Should return\n the length of the object, an integer ">=" 0. Also, an object that\n doesn\'t define a "__nonzero__()" method and whose "__len__()"\n method returns zero is considered to be false in a Boolean context.\n\nobject.__getitem__(self, key)\n\n Called to implement evaluation of "self[key]". For sequence types,\n the accepted keys should be integers and slice objects. 
Note that\n the special interpretation of negative indexes (if the class wishes\n to emulate a sequence type) is up to the "__getitem__()" method. If\n *key* is of an inappropriate type, "TypeError" may be raised; if of\n a value outside the set of indexes for the sequence (after any\n special interpretation of negative values), "IndexError" should be\n raised. For mapping types, if *key* is missing (not in the\n container), "KeyError" should be raised.\n\n Note: "for" loops expect that an "IndexError" will be raised for\n illegal indexes to allow proper detection of the end of the\n sequence.\n\nobject.__setitem__(self, key, value)\n\n Called to implement assignment to "self[key]". Same note as for\n "__getitem__()". This should only be implemented for mappings if\n the objects support changes to the values for keys, or if new keys\n can be added, or for sequences if elements can be replaced. The\n same exceptions should be raised for improper *key* values as for\n the "__getitem__()" method.\n\nobject.__delitem__(self, key)\n\n Called to implement deletion of "self[key]". Same note as for\n "__getitem__()". This should only be implemented for mappings if\n the objects support removal of keys, or for sequences if elements\n can be removed from the sequence. The same exceptions should be\n raised for improper *key* values as for the "__getitem__()" method.\n\nobject.__iter__(self)\n\n This method is called when an iterator is required for a container.\n This method should return a new iterator object that can iterate\n over all the objects in the container. For mappings, it should\n iterate over the keys of the container, and should also be made\n available as the method "iterkeys()".\n\n Iterator objects also need to implement this method; they are\n required to return themselves. For more information on iterator\n objects, see *Iterator Types*.\n\nobject.__reversed__(self)\n\n Called (if present) by the "reversed()" built-in to implement\n reverse iteration. It should return a new iterator object that\n iterates over all the objects in the container in reverse order.\n\n If the "__reversed__()" method is not provided, the "reversed()"\n built-in will fall back to using the sequence protocol ("__len__()"\n and "__getitem__()"). Objects that support the sequence protocol\n should only provide "__reversed__()" if they can provide an\n implementation that is more efficient than the one provided by\n "reversed()".\n\n New in version 2.6.\n\nThe membership test operators ("in" and "not in") are normally\nimplemented as an iteration through a sequence. However, container\nobjects can supply the following special method with a more efficient\nimplementation, which also does not require the object be a sequence.\n\nobject.__contains__(self, item)\n\n Called to implement membership test operators. Should return true\n if *item* is in *self*, false otherwise. For mapping objects, this\n should consider the keys of the mapping rather than the values or\n the key-item pairs.\n\n For objects that don\'t define "__contains__()", the membership test\n first tries iteration via "__iter__()", then the old sequence\n iteration protocol via "__getitem__()", see *this section in the\n language reference*.\n\n\nAdditional methods for emulation of sequence types\n==================================================\n\nThe following optional methods can be defined to further emulate\nsequence objects. 
Immutable sequences methods should at most only\ndefine "__getslice__()"; mutable sequences might define all three\nmethods.\n\nobject.__getslice__(self, i, j)\n\n Deprecated since version 2.0: Support slice objects as parameters\n to the "__getitem__()" method. (However, built-in types in CPython\n currently still implement "__getslice__()". Therefore, you have to\n override it in derived classes when implementing slicing.)\n\n Called to implement evaluation of "self[i:j]". The returned object\n should be of the same type as *self*. Note that missing *i* or *j*\n in the slice expression are replaced by zero or "sys.maxint",\n respectively. If negative indexes are used in the slice, the\n length of the sequence is added to that index. If the instance does\n not implement the "__len__()" method, an "AttributeError" is\n raised. No guarantee is made that indexes adjusted this way are not\n still negative. Indexes which are greater than the length of the\n sequence are not modified. If no "__getslice__()" is found, a slice\n object is created instead, and passed to "__getitem__()" instead.\n\nobject.__setslice__(self, i, j, sequence)\n\n Called to implement assignment to "self[i:j]". Same notes for *i*\n and *j* as for "__getslice__()".\n\n This method is deprecated. If no "__setslice__()" is found, or for\n extended slicing of the form "self[i:j:k]", a slice object is\n created, and passed to "__setitem__()", instead of "__setslice__()"\n being called.\n\nobject.__delslice__(self, i, j)\n\n Called to implement deletion of "self[i:j]". Same notes for *i* and\n *j* as for "__getslice__()". This method is deprecated. If no\n "__delslice__()" is found, or for extended slicing of the form\n "self[i:j:k]", a slice object is created, and passed to\n "__delitem__()", instead of "__delslice__()" being called.\n\nNotice that these methods are only invoked when a single slice with a\nsingle colon is used, and the slice method is available. For slice\noperations involving extended slice notation, or in absence of the\nslice methods, "__getitem__()", "__setitem__()" or "__delitem__()" is\ncalled with a slice object as argument.\n\nThe following example demonstrate how to make your program or module\ncompatible with earlier versions of Python (assuming that methods\n"__getitem__()", "__setitem__()" and "__delitem__()" support slice\nobjects as arguments):\n\n class MyClass:\n ...\n def __getitem__(self, index):\n ...\n def __setitem__(self, index, value):\n ...\n def __delitem__(self, index):\n ...\n\n if sys.version_info < (2, 0):\n # They won\'t be defined if version is at least 2.0 final\n\n def __getslice__(self, i, j):\n return self[max(0, i):max(0, j):]\n def __setslice__(self, i, j, seq):\n self[max(0, i):max(0, j):] = seq\n def __delslice__(self, i, j):\n del self[max(0, i):max(0, j):]\n ...\n\nNote the calls to "max()"; these are necessary because of the handling\nof negative indices before the "__*slice__()" methods are called.\nWhen negative indexes are used, the "__*item__()" methods receive them\nas provided, but the "__*slice__()" methods get a "cooked" form of the\nindex values. For each negative index value, the length of the\nsequence is added to the index before calling the method (which may\nstill result in a negative index); this is the customary handling of\nnegative indexes by the built-in sequence types, and the "__*item__()"\nmethods are expected to do this as well. 
However, since they should\nalready be doing that, negative indexes cannot be passed in; they must\nbe constrained to the bounds of the sequence before being passed to\nthe "__*item__()" methods. Calling "max(0, i)" conveniently returns\nthe proper value.\n\n\nEmulating numeric types\n=======================\n\nThe following methods can be defined to emulate numeric objects.\nMethods corresponding to operations that are not supported by the\nparticular kind of number implemented (e.g., bitwise operations for\nnon-integral numbers) should be left undefined.\n\nobject.__add__(self, other)\nobject.__sub__(self, other)\nobject.__mul__(self, other)\nobject.__floordiv__(self, other)\nobject.__mod__(self, other)\nobject.__divmod__(self, other)\nobject.__pow__(self, other[, modulo])\nobject.__lshift__(self, other)\nobject.__rshift__(self, other)\nobject.__and__(self, other)\nobject.__xor__(self, other)\nobject.__or__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations ("+", "-", "*", "//", "%", "divmod()", "pow()", "**",\n "<<", ">>", "&", "^", "|"). For instance, to evaluate the\n expression "x + y", where *x* is an instance of a class that has an\n "__add__()" method, "x.__add__(y)" is called. The "__divmod__()"\n method should be the equivalent to using "__floordiv__()" and\n "__mod__()"; it should not be related to "__truediv__()" (described\n below). Note that "__pow__()" should be defined to accept an\n optional third argument if the ternary version of the built-in\n "pow()" function is to be supported.\n\n If one of those methods does not support the operation with the\n supplied arguments, it should return "NotImplemented".\n\nobject.__div__(self, other)\nobject.__truediv__(self, other)\n\n The division operator ("/") is implemented by these methods. The\n "__truediv__()" method is used when "__future__.division" is in\n effect, otherwise "__div__()" is used. If only one of these two\n methods is defined, the object will not support division in the\n alternate context; "TypeError" will be raised instead.\n\nobject.__radd__(self, other)\nobject.__rsub__(self, other)\nobject.__rmul__(self, other)\nobject.__rdiv__(self, other)\nobject.__rtruediv__(self, other)\nobject.__rfloordiv__(self, other)\nobject.__rmod__(self, other)\nobject.__rdivmod__(self, other)\nobject.__rpow__(self, other)\nobject.__rlshift__(self, other)\nobject.__rrshift__(self, other)\nobject.__rand__(self, other)\nobject.__rxor__(self, other)\nobject.__ror__(self, other)\n\n These methods are called to implement the binary arithmetic\n operations ("+", "-", "*", "/", "%", "divmod()", "pow()", "**",\n "<<", ">>", "&", "^", "|") with reflected (swapped) operands.\n These functions are only called if the left operand does not\n support the corresponding operation and the operands are of\n different types. [2] For instance, to evaluate the expression "x -\n y", where *y* is an instance of a class that has an "__rsub__()"\n method, "y.__rsub__(x)" is called if "x.__sub__(y)" returns\n *NotImplemented*.\n\n Note that ternary "pow()" will not try calling "__rpow__()" (the\n coercion rules would become too complicated).\n\n Note: If the right operand\'s type is a subclass of the left\n operand\'s type and that subclass provides the reflected method\n for the operation, this method will be called before the left\n operand\'s non-reflected method. 
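A minimal sketch of the reflected-operand machinery described above (the `Seconds` class is invented for this example): "__add__()" returns "NotImplemented" for operands it does not understand, which gives the other operand's reflected method a chance to run.

    class Seconds(object):
        def __init__(self, n):
            self.n = n

        def __add__(self, other):
            if isinstance(other, Seconds):
                return Seconds(self.n + other.n)
            if isinstance(other, (int, long)):
                return Seconds(self.n + other)
            return NotImplemented            # let the other operand try

        __radd__ = __add__                   # addition is symmetric here

    assert (Seconds(30) + 15).n == 45
    # int.__add__() returns NotImplemented for Seconds, so __radd__() runs.
    assert (15 + Seconds(30)).n == 45
    assert (Seconds(1) + Seconds(2)).n == 3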
This behavior allows subclasses\n to override their ancestors\' operations.\n\nobject.__iadd__(self, other)\nobject.__isub__(self, other)\nobject.__imul__(self, other)\nobject.__idiv__(self, other)\nobject.__itruediv__(self, other)\nobject.__ifloordiv__(self, other)\nobject.__imod__(self, other)\nobject.__ipow__(self, other[, modulo])\nobject.__ilshift__(self, other)\nobject.__irshift__(self, other)\nobject.__iand__(self, other)\nobject.__ixor__(self, other)\nobject.__ior__(self, other)\n\n These methods are called to implement the augmented arithmetic\n assignments ("+=", "-=", "*=", "/=", "//=", "%=", "**=", "<<=",\n ">>=", "&=", "^=", "|="). These methods should attempt to do the\n operation in-place (modifying *self*) and return the result (which\n could be, but does not have to be, *self*). If a specific method\n is not defined, the augmented assignment falls back to the normal\n methods. For instance, to execute the statement "x += y", where\n *x* is an instance of a class that has an "__iadd__()" method,\n "x.__iadd__(y)" is called. If *x* is an instance of a class that\n does not define a "__iadd__()" method, "x.__add__(y)" and\n "y.__radd__(x)" are considered, as with the evaluation of "x + y".\n\nobject.__neg__(self)\nobject.__pos__(self)\nobject.__abs__(self)\nobject.__invert__(self)\n\n Called to implement the unary arithmetic operations ("-", "+",\n "abs()" and "~").\n\nobject.__complex__(self)\nobject.__int__(self)\nobject.__long__(self)\nobject.__float__(self)\n\n Called to implement the built-in functions "complex()", "int()",\n "long()", and "float()". Should return a value of the appropriate\n type.\n\nobject.__oct__(self)\nobject.__hex__(self)\n\n Called to implement the built-in functions "oct()" and "hex()".\n Should return a string value.\n\nobject.__index__(self)\n\n Called to implement "operator.index()". Also called whenever\n Python needs an integer object (such as in slicing). Must return\n an integer (int or long).\n\n New in version 2.5.\n\nobject.__coerce__(self, other)\n\n Called to implement "mixed-mode" numeric arithmetic. Should either\n return a 2-tuple containing *self* and *other* converted to a\n common numeric type, or "None" if conversion is impossible. When\n the common type would be the type of "other", it is sufficient to\n return "None", since the interpreter will also ask the other object\n to attempt a coercion (but sometimes, if the implementation of the\n other type cannot be changed, it is useful to do the conversion to\n the other type here). A return value of "NotImplemented" is\n equivalent to returning "None".\n\n\nCoercion rules\n==============\n\nThis section used to document the rules for coercion. As the language\nhas evolved, the coercion rules have become hard to document\nprecisely; documenting what one version of one particular\nimplementation does is undesirable. Instead, here are some informal\nguidelines regarding coercion. In Python 3, coercion will not be\nsupported.\n\n* If the left operand of a % operator is a string or Unicode object,\n no coercion takes place and the string formatting operation is\n invoked instead.\n\n* It is no longer recommended to define a coercion operation. 
Mixed-\n mode operations on types that don\'t define coercion pass the\n original arguments to the operation.\n\n* New-style classes (those derived from "object") never invoke the\n "__coerce__()" method in response to a binary operator; the only\n time "__coerce__()" is invoked is when the built-in function\n "coerce()" is called.\n\n* For most intents and purposes, an operator that returns\n "NotImplemented" is treated the same as one that is not implemented\n at all.\n\n* Below, "__op__()" and "__rop__()" are used to signify the generic\n method names corresponding to an operator; "__iop__()" is used for\n the corresponding in-place operator. For example, for the operator\n \'"+"\', "__add__()" and "__radd__()" are used for the left and right\n variant of the binary operator, and "__iadd__()" for the in-place\n variant.\n\n* For objects *x* and *y*, first "x.__op__(y)" is tried. If this is\n not implemented or returns "NotImplemented", "y.__rop__(x)" is\n tried. If this is also not implemented or returns "NotImplemented",\n a "TypeError" exception is raised. But see the following exception:\n\n* Exception to the previous item: if the left operand is an instance\n of a built-in type or a new-style class, and the right operand is an\n instance of a proper subclass of that type or class and overrides\n the base\'s "__rop__()" method, the right operand\'s "__rop__()"\n method is tried *before* the left operand\'s "__op__()" method.\n\n This is done so that a subclass can completely override binary\n operators. Otherwise, the left operand\'s "__op__()" method would\n always accept the right operand: when an instance of a given class\n is expected, an instance of a subclass of that class is always\n acceptable.\n\n* When either operand type defines a coercion, this coercion is\n called before that type\'s "__op__()" or "__rop__()" method is\n called, but no sooner. If the coercion returns an object of a\n different type for the operand whose coercion is invoked, part of\n the process is redone using the new object.\n\n* When an in-place operator (like \'"+="\') is used, if the left\n operand implements "__iop__()", it is invoked without any coercion.\n When the operation falls back to "__op__()" and/or "__rop__()", the\n normal coercion rules apply.\n\n* In "x + y", if *x* is a sequence that implements sequence\n concatenation, sequence concatenation is invoked.\n\n* In "x * y", if one operand is a sequence that implements sequence\n repetition, and the other is an integer ("int" or "long"), sequence\n repetition is invoked.\n\n* Rich comparisons (implemented by methods "__eq__()" and so on)\n never use coercion. Three-way comparison (implemented by\n "__cmp__()") does use coercion under the same conditions as other\n binary operations use it.\n\n* In the current implementation, the built-in numeric types "int",\n "long", "float", and "complex" do not use coercion. All these types\n implement a "__coerce__()" method, for use by the built-in\n "coerce()" function.\n\n Changed in version 2.7: The complex type no longer makes implicit\n calls to the "__coerce__()" method for mixed-type binary arithmetic\n operations.\n\n\nWith Statement Context Managers\n===============================\n\nNew in version 2.5.\n\nA *context manager* is an object that defines the runtime context to\nbe established when executing a "with" statement. The context manager\nhandles the entry into, and the exit from, the desired runtime context\nfor the execution of the block of code. 
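A small, hedged sketch of the protocol about to be described (the `Timed` class is invented for this example): "__enter__()" returns the object bound by the "as" clause, and "__exit__()" returns a false value so that exceptions are not suppressed.

    import time

    class Timed(object):
        def __enter__(self):
            self.start = time.time()
            return self                      # bound to the "as" target

        def __exit__(self, exc_type, exc_value, traceback):
            self.elapsed = time.time() - self.start
            return False                     # false value: do not suppress exceptions

    with Timed() as t:
        sum(range(1000))

    assert t.elapsed >= 0.0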
Context managers are normally\ninvoked using the "with" statement (described in section *The with\nstatement*), but can also be used by directly invoking their methods.\n\nTypical uses of context managers include saving and restoring various\nkinds of global state, locking and unlocking resources, closing opened\nfiles, etc.\n\nFor more information on context managers, see *Context Manager Types*.\n\nobject.__enter__(self)\n\n Enter the runtime context related to this object. The "with"\n statement will bind this method\'s return value to the target(s)\n specified in the "as" clause of the statement, if any.\n\nobject.__exit__(self, exc_type, exc_value, traceback)\n\n Exit the runtime context related to this object. The parameters\n describe the exception that caused the context to be exited. If the\n context was exited without an exception, all three arguments will\n be "None".\n\n If an exception is supplied, and the method wishes to suppress the\n exception (i.e., prevent it from being propagated), it should\n return a true value. Otherwise, the exception will be processed\n normally upon exit from this method.\n\n Note that "__exit__()" methods should not reraise the passed-in\n exception; this is the caller\'s responsibility.\n\nSee also: **PEP 0343** - The "with" statement\n\n The specification, background, and examples for the Python "with"\n statement.\n\n\nSpecial method lookup for old-style classes\n===========================================\n\nFor old-style classes, special methods are always looked up in exactly\nthe same way as any other method or attribute. This is the case\nregardless of whether the method is being looked up explicitly as in\n"x.__getitem__(i)" or implicitly as in "x[i]".\n\nThis behaviour means that special methods may exhibit different\nbehaviour for different instances of a single old-style class if the\nappropriate special attributes are set differently:\n\n >>> class C:\n ... pass\n ...\n >>> c1 = C()\n >>> c2 = C()\n >>> c1.__len__ = lambda: 5\n >>> c2.__len__ = lambda: 9\n >>> len(c1)\n 5\n >>> len(c2)\n 9\n\n\nSpecial method lookup for new-style classes\n===========================================\n\nFor new-style classes, implicit invocations of special methods are\nonly guaranteed to work correctly if defined on an object\'s type, not\nin the object\'s instance dictionary. That behaviour is the reason why\nthe following code raises an exception (unlike the equivalent example\nwith old-style classes):\n\n >>> class C(object):\n ... pass\n ...\n >>> c = C()\n >>> c.__len__ = lambda: 5\n >>> len(c)\n Traceback (most recent call last):\n File "", line 1, in \n TypeError: object of type \'C\' has no len()\n\nThe rationale behind this behaviour lies with a number of special\nmethods such as "__hash__()" and "__repr__()" that are implemented by\nall objects, including type objects. 
If the implicit lookup of these\nmethods used the conventional lookup process, they would fail when\ninvoked on the type object itself:\n\n >>> 1 .__hash__() == hash(1)\n True\n >>> int.__hash__() == hash(int)\n Traceback (most recent call last):\n File "", line 1, in \n TypeError: descriptor \'__hash__\' of \'int\' object needs an argument\n\nIncorrectly attempting to invoke an unbound method of a class in this\nway is sometimes referred to as \'metaclass confusion\', and is avoided\nby bypassing the instance when looking up special methods:\n\n >>> type(1).__hash__(1) == hash(1)\n True\n >>> type(int).__hash__(int) == hash(int)\n True\n\nIn addition to bypassing any instance attributes in the interest of\ncorrectness, implicit special method lookup generally also bypasses\nthe "__getattribute__()" method even of the object\'s metaclass:\n\n >>> class Meta(type):\n ... def __getattribute__(*args):\n ... print "Metaclass getattribute invoked"\n ... return type.__getattribute__(*args)\n ...\n >>> class C(object):\n ... __metaclass__ = Meta\n ... def __len__(self):\n ... return 10\n ... def __getattribute__(*args):\n ... print "Class getattribute invoked"\n ... return object.__getattribute__(*args)\n ...\n >>> c = C()\n >>> c.__len__() # Explicit lookup via instance\n Class getattribute invoked\n 10\n >>> type(c).__len__(c) # Explicit lookup via type\n Metaclass getattribute invoked\n 10\n >>> len(c) # Implicit lookup\n 10\n\nBypassing the "__getattribute__()" machinery in this fashion provides\nsignificant scope for speed optimisations within the interpreter, at\nthe cost of some flexibility in the handling of special methods (the\nspecial method *must* be set on the class object itself in order to be\nconsistently invoked by the interpreter).\n\n-[ Footnotes ]-\n\n[1] It *is* possible in some cases to change an object\'s type,\n under certain controlled conditions. It generally isn\'t a good\n idea though, since it can lead to some very strange behaviour if\n it is handled incorrectly.\n\n[2] For operands of the same type, it is assumed that if the non-\n reflected method (such as "__add__()") fails the operation is not\n supported, which is why the reflected method is not called.\n', + 'string-methods': u'\nString Methods\n**************\n\nBelow are listed the string methods which both 8-bit strings and\nUnicode objects support. Some of them are also available on\n"bytearray" objects.\n\nIn addition, Python\'s strings support the sequence type methods\ndescribed in the *Sequence Types --- str, unicode, list, tuple,\nbytearray, buffer, xrange* section. To output formatted strings use\ntemplate strings or the "%" operator described in the *String\nFormatting Operations* section. Also, see the "re" module for string\nfunctions based on regular expressions.\n\nstr.capitalize()\n\n Return a copy of the string with its first character capitalized\n and the rest lowercased.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.center(width[, fillchar])\n\n Return centered in a string of length *width*. Padding is done\n using the specified *fillchar* (default is a space).\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.count(sub[, start[, end]])\n\n Return the number of non-overlapping occurrences of substring *sub*\n in the range [*start*, *end*]. 
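A few interactive examples of the string methods introduced above; the results shown follow directly from the descriptions of "capitalize()", "center()" and "count()".

    >>> 'monty python'.capitalize()
    'Monty python'
    >>> 'py'.center(6, '-')
    '--py--'
    >>> 'banana'.count('an')
    2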
Optional arguments *start* and\n *end* are interpreted as in slice notation.\n\nstr.decode([encoding[, errors]])\n\n Decodes the string using the codec registered for *encoding*.\n *encoding* defaults to the default string encoding. *errors* may\n be given to set a different error handling scheme. The default is\n "\'strict\'", meaning that encoding errors raise "UnicodeError".\n Other possible values are "\'ignore\'", "\'replace\'" and any other\n name registered via "codecs.register_error()", see section *Codec\n Base Classes*.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for other error handling schemes\n added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.encode([encoding[, errors]])\n\n Return an encoded version of the string. Default encoding is the\n current default string encoding. *errors* may be given to set a\n different error handling scheme. The default for *errors* is\n "\'strict\'", meaning that encoding errors raise a "UnicodeError".\n Other possible values are "\'ignore\'", "\'replace\'",\n "\'xmlcharrefreplace\'", "\'backslashreplace\'" and any other name\n registered via "codecs.register_error()", see section *Codec Base\n Classes*. For a list of possible encodings, see section *Standard\n Encodings*.\n\n New in version 2.0.\n\n Changed in version 2.3: Support for "\'xmlcharrefreplace\'" and\n "\'backslashreplace\'" and other error handling schemes added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.endswith(suffix[, start[, end]])\n\n Return "True" if the string ends with the specified *suffix*,\n otherwise return "False". *suffix* can also be a tuple of suffixes\n to look for. With optional *start*, test beginning at that\n position. With optional *end*, stop comparing at that position.\n\n Changed in version 2.5: Accept tuples as *suffix*.\n\nstr.expandtabs([tabsize])\n\n Return a copy of the string where all tab characters are replaced\n by one or more spaces, depending on the current column and the\n given tab size. Tab positions occur every *tabsize* characters\n (default is 8, giving tab positions at columns 0, 8, 16 and so on).\n To expand the string, the current column is set to zero and the\n string is examined character by character. If the character is a\n tab ("\\t"), one or more space characters are inserted in the result\n until the current column is equal to the next tab position. (The\n tab character itself is not copied.) If the character is a newline\n ("\\n") or return ("\\r"), it is copied and the current column is\n reset to zero. Any other character is copied unchanged and the\n current column is incremented by one regardless of how the\n character is represented when printed.\n\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs()\n \'01 012 0123 01234\'\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs(4)\n \'01 012 0123 01234\'\n\nstr.find(sub[, start[, end]])\n\n Return the lowest index in the string where substring *sub* is\n found, such that *sub* is contained in the slice "s[start:end]".\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return "-1" if *sub* is not found.\n\n Note: The "find()" method should be used only if you need to know\n the position of *sub*. To check if *sub* is a substring or not,\n use the "in" operator:\n\n >>> \'Py\' in \'Python\'\n True\n\nstr.format(*args, **kwargs)\n\n Perform a string formatting operation. The string on which this\n method is called can contain literal text or replacement fields\n delimited by braces "{}". 
Each replacement field contains either\n the numeric index of a positional argument, or the name of a\n keyword argument. Returns a copy of the string where each\n replacement field is replaced with the string value of the\n corresponding argument.\n\n >>> "The sum of 1 + 2 is {0}".format(1+2)\n \'The sum of 1 + 2 is 3\'\n\n See *Format String Syntax* for a description of the various\n formatting options that can be specified in format strings.\n\n This method of string formatting is the new standard in Python 3,\n and should be preferred to the "%" formatting described in *String\n Formatting Operations* in new code.\n\n New in version 2.6.\n\nstr.index(sub[, start[, end]])\n\n Like "find()", but raise "ValueError" when the substring is not\n found.\n\nstr.isalnum()\n\n Return true if all characters in the string are alphanumeric and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isalpha()\n\n Return true if all characters in the string are alphabetic and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isdigit()\n\n Return true if all characters in the string are digits and there is\n at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.islower()\n\n Return true if all cased characters [4] in the string are lowercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isspace()\n\n Return true if there are only whitespace characters in the string\n and there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.istitle()\n\n Return true if the string is a titlecased string and there is at\n least one character, for example uppercase characters may only\n follow uncased characters and lowercase characters only cased ones.\n Return false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isupper()\n\n Return true if all cased characters [4] in the string are uppercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.join(iterable)\n\n Return a string which is the concatenation of the strings in the\n *iterable* *iterable*. The separator between elements is the\n string providing this method.\n\nstr.ljust(width[, fillchar])\n\n Return the string left justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to "len(s)".\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.lower()\n\n Return a copy of the string with all the cased characters [4]\n converted to lowercase.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.lstrip([chars])\n\n Return a copy of the string with leading characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or "None", the *chars* argument defaults to\n removing whitespace. 
The *chars* argument is not a prefix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.lstrip()\n \'spacious \'\n >>> \'www.example.com\'.lstrip(\'cmowz.\')\n \'example.com\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.partition(sep)\n\n Split the string at the first occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing the string itself, followed by\n two empty strings.\n\n New in version 2.5.\n\nstr.replace(old, new[, count])\n\n Return a copy of the string with all occurrences of substring *old*\n replaced by *new*. If the optional argument *count* is given, only\n the first *count* occurrences are replaced.\n\nstr.rfind(sub[, start[, end]])\n\n Return the highest index in the string where substring *sub* is\n found, such that *sub* is contained within "s[start:end]".\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return "-1" on failure.\n\nstr.rindex(sub[, start[, end]])\n\n Like "rfind()" but raises "ValueError" when the substring *sub* is\n not found.\n\nstr.rjust(width[, fillchar])\n\n Return the string right justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to "len(s)".\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.rpartition(sep)\n\n Split the string at the last occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing two empty strings, followed by\n the string itself.\n\n New in version 2.5.\n\nstr.rsplit([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit* splits\n are done, the *rightmost* ones. If *sep* is not specified or\n "None", any whitespace string is a separator. Except for splitting\n from the right, "rsplit()" behaves like "split()" which is\n described in detail below.\n\n New in version 2.4.\n\nstr.rstrip([chars])\n\n Return a copy of the string with trailing characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or "None", the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a suffix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.rstrip()\n \' spacious\'\n >>> \'mississippi\'.rstrip(\'ipz\')\n \'mississ\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.split([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit*\n splits are done (thus, the list will have at most "maxsplit+1"\n elements). If *maxsplit* is not specified or "-1", then there is\n no limit on the number of splits (all possible splits are made).\n\n If *sep* is given, consecutive delimiters are not grouped together\n and are deemed to delimit empty strings (for example,\n "\'1,,2\'.split(\',\')" returns "[\'1\', \'\', \'2\']"). The *sep* argument\n may consist of multiple characters (for example,\n "\'1<>2<>3\'.split(\'<>\')" returns "[\'1\', \'2\', \'3\']"). 
Splitting an\n empty string with a specified separator returns "[\'\']".\n\n If *sep* is not specified or is "None", a different splitting\n algorithm is applied: runs of consecutive whitespace are regarded\n as a single separator, and the result will contain no empty strings\n at the start or end if the string has leading or trailing\n whitespace. Consequently, splitting an empty string or a string\n consisting of just whitespace with a "None" separator returns "[]".\n\n For example, "\' 1 2 3 \'.split()" returns "[\'1\', \'2\', \'3\']", and\n "\' 1 2 3 \'.split(None, 1)" returns "[\'1\', \'2 3 \']".\n\nstr.splitlines([keepends])\n\n Return a list of the lines in the string, breaking at line\n boundaries. This method uses the *universal newlines* approach to\n splitting lines. Line breaks are not included in the resulting list\n unless *keepends* is given and true.\n\n For example, "\'ab c\\n\\nde fg\\rkl\\r\\n\'.splitlines()" returns "[\'ab\n c\', \'\', \'de fg\', \'kl\']", while the same call with\n "splitlines(True)" returns "[\'ab c\\n\', \'\\n\', \'de fg\\r\', \'kl\\r\\n\']".\n\n Unlike "split()" when a delimiter string *sep* is given, this\n method returns an empty list for the empty string, and a terminal\n line break does not result in an extra line.\n\nstr.startswith(prefix[, start[, end]])\n\n Return "True" if string starts with the *prefix*, otherwise return\n "False". *prefix* can also be a tuple of prefixes to look for.\n With optional *start*, test string beginning at that position.\n With optional *end*, stop comparing string at that position.\n\n Changed in version 2.5: Accept tuples as *prefix*.\n\nstr.strip([chars])\n\n Return a copy of the string with the leading and trailing\n characters removed. The *chars* argument is a string specifying the\n set of characters to be removed. If omitted or "None", the *chars*\n argument defaults to removing whitespace. The *chars* argument is\n not a prefix or suffix; rather, all combinations of its values are\n stripped:\n\n >>> \' spacious \'.strip()\n \'spacious\'\n >>> \'www.example.com\'.strip(\'cmowz.\')\n \'example\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.swapcase()\n\n Return a copy of the string with uppercase characters converted to\n lowercase and vice versa.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.title()\n\n Return a titlecased version of the string where words start with an\n uppercase character and the remaining characters are lowercase.\n\n The algorithm uses a simple language-independent definition of a\n word as groups of consecutive letters. The definition works in\n many contexts but it means that apostrophes in contractions and\n possessives form word boundaries, which may not be the desired\n result:\n\n >>> "they\'re bill\'s friends from the UK".title()\n "They\'Re Bill\'S Friends From The Uk"\n\n A workaround for apostrophes can be constructed using regular\n expressions:\n\n >>> import re\n >>> def titlecase(s):\n ... return re.sub(r"[A-Za-z]+(\'[A-Za-z]+)?",\n ... lambda mo: mo.group(0)[0].upper() +\n ... mo.group(0)[1:].lower(),\n ... 
s)\n ...\n >>> titlecase("they\'re bill\'s friends.")\n "They\'re Bill\'s Friends."\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.translate(table[, deletechars])\n\n Return a copy of the string where all characters occurring in the\n optional argument *deletechars* are removed, and the remaining\n characters have been mapped through the given translation table,\n which must be a string of length 256.\n\n You can use the "maketrans()" helper function in the "string"\n module to create a translation table. For string objects, set the\n *table* argument to "None" for translations that only delete\n characters:\n\n >>> \'read this short text\'.translate(None, \'aeiou\')\n \'rd ths shrt txt\'\n\n New in version 2.6: Support for a "None" *table* argument.\n\n For Unicode objects, the "translate()" method does not accept the\n optional *deletechars* argument. Instead, it returns a copy of the\n *s* where all characters have been mapped through the given\n translation table which must be a mapping of Unicode ordinals to\n Unicode ordinals, Unicode strings or "None". Unmapped characters\n are left untouched. Characters mapped to "None" are deleted. Note,\n a more flexible approach is to create a custom character mapping\n codec using the "codecs" module (see "encodings.cp1251" for an\n example).\n\nstr.upper()\n\n Return a copy of the string with all the cased characters [4]\n converted to uppercase. Note that "str.upper().isupper()" might be\n "False" if "s" contains uncased characters or if the Unicode\n category of the resulting character(s) is not "Lu" (Letter,\n uppercase), but e.g. "Lt" (Letter, titlecase).\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.zfill(width)\n\n Return the numeric string left filled with zeros in a string of\n length *width*. A sign prefix is handled correctly. The original\n string is returned if *width* is less than or equal to "len(s)".\n\n New in version 2.2.2.\n\nThe following methods are present only on unicode objects:\n\nunicode.isnumeric()\n\n Return "True" if there are only numeric characters in S, "False"\n otherwise. Numeric characters include digit characters, and all\n characters that have the Unicode numeric value property, e.g.\n U+2155, VULGAR FRACTION ONE FIFTH.\n\nunicode.isdecimal()\n\n Return "True" if there are only decimal characters in S, "False"\n otherwise. Decimal characters include digit characters, and all\n characters that can be used to form decimal-radix numbers, e.g.\n U+0660, ARABIC-INDIC DIGIT ZERO.\n', + 'strings': u'\nString literals\n***************\n\nString literals are described by the following lexical definitions:\n\n stringliteral ::= [stringprefix](shortstring | longstring)\n stringprefix ::= "r" | "u" | "ur" | "R" | "U" | "UR" | "Ur" | "uR"\n | "b" | "B" | "br" | "Br" | "bR" | "BR"\n shortstring ::= "\'" shortstringitem* "\'" | \'"\' shortstringitem* \'"\'\n longstring ::= "\'\'\'" longstringitem* "\'\'\'"\n | \'"""\' longstringitem* \'"""\'\n shortstringitem ::= shortstringchar | escapeseq\n longstringitem ::= longstringchar | escapeseq\n shortstringchar ::= \n longstringchar ::= \n escapeseq ::= "\\" \n\nOne syntactic restriction not indicated by these productions is that\nwhitespace is not allowed between the "stringprefix" and the rest of\nthe string literal. 
The source character set is defined by the\nencoding declaration; it is ASCII if no encoding declaration is given\nin the source file; see section *Encoding declarations*.\n\nIn plain English: String literals can be enclosed in matching single\nquotes ("\'") or double quotes ("""). They can also be enclosed in\nmatching groups of three single or double quotes (these are generally\nreferred to as *triple-quoted strings*). The backslash ("\\")\ncharacter is used to escape characters that otherwise have a special\nmeaning, such as newline, backslash itself, or the quote character.\nString literals may optionally be prefixed with a letter "\'r\'" or\n"\'R\'"; such strings are called *raw strings* and use different rules\nfor interpreting backslash escape sequences. A prefix of "\'u\'" or\n"\'U\'" makes the string a Unicode string. Unicode strings use the\nUnicode character set as defined by the Unicode Consortium and ISO\n10646. Some additional escape sequences, described below, are\navailable in Unicode strings. A prefix of "\'b\'" or "\'B\'" is ignored in\nPython 2; it indicates that the literal should become a bytes literal\nin Python 3 (e.g. when code is automatically converted with 2to3). A\n"\'u\'" or "\'b\'" prefix may be followed by an "\'r\'" prefix.\n\nIn triple-quoted strings, unescaped newlines and quotes are allowed\n(and are retained), except that three unescaped quotes in a row\nterminate the string. (A "quote" is the character used to open the\nstring, i.e. either "\'" or """.)\n\nUnless an "\'r\'" or "\'R\'" prefix is present, escape sequences in\nstrings are interpreted according to rules similar to those used by\nStandard C. The recognized escape sequences are:\n\n+-------------------+-----------------------------------+---------+\n| Escape Sequence | Meaning | Notes |\n+===================+===================================+=========+\n| "\\newline" | Ignored | |\n+-------------------+-----------------------------------+---------+\n| "\\\\" | Backslash ("\\") | |\n+-------------------+-----------------------------------+---------+\n| "\\\'" | Single quote ("\'") | |\n+-------------------+-----------------------------------+---------+\n| "\\"" | Double quote (""") | |\n+-------------------+-----------------------------------+---------+\n| "\\a" | ASCII Bell (BEL) | |\n+-------------------+-----------------------------------+---------+\n| "\\b" | ASCII Backspace (BS) | |\n+-------------------+-----------------------------------+---------+\n| "\\f" | ASCII Formfeed (FF) | |\n+-------------------+-----------------------------------+---------+\n| "\\n" | ASCII Linefeed (LF) | |\n+-------------------+-----------------------------------+---------+\n| "\\N{name}" | Character named *name* in the | |\n| | Unicode database (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| "\\r" | ASCII Carriage Return (CR) | |\n+-------------------+-----------------------------------+---------+\n| "\\t" | ASCII Horizontal Tab (TAB) | |\n+-------------------+-----------------------------------+---------+\n| "\\uxxxx" | Character with 16-bit hex value | (1) |\n| | *xxxx* (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| "\\Uxxxxxxxx" | Character with 32-bit hex value | (2) |\n| | *xxxxxxxx* (Unicode only) | |\n+-------------------+-----------------------------------+---------+\n| "\\v" | ASCII Vertical Tab (VT) | |\n+-------------------+-----------------------------------+---------+\n| "\\ooo" | Character with octal value 
*ooo* | (3,5) |\n+-------------------+-----------------------------------+---------+\n| "\\xhh" | Character with hex value *hh* | (4,5) |\n+-------------------+-----------------------------------+---------+\n\nNotes:\n\n1. Individual code units which form parts of a surrogate pair can\n be encoded using this escape sequence.\n\n2. Any Unicode character can be encoded this way, but characters\n outside the Basic Multilingual Plane (BMP) will be encoded using a\n surrogate pair if Python is compiled to use 16-bit code units (the\n default).\n\n3. As in Standard C, up to three octal digits are accepted.\n\n4. Unlike in Standard C, exactly two hex digits are required.\n\n5. In a string literal, hexadecimal and octal escapes denote the\n byte with the given value; it is not necessary that the byte\n encodes a character in the source character set. In a Unicode\n literal, these escapes denote a Unicode character with the given\n value.\n\nUnlike Standard C, all unrecognized escape sequences are left in the\nstring unchanged, i.e., *the backslash is left in the string*. (This\nbehavior is useful when debugging: if an escape sequence is mistyped,\nthe resulting output is more easily recognized as broken.) It is also\nimportant to note that the escape sequences marked as "(Unicode only)"\nin the table above fall into the category of unrecognized escapes for\nnon-Unicode string literals.\n\nWhen an "\'r\'" or "\'R\'" prefix is present, a character following a\nbackslash is included in the string without change, and *all\nbackslashes are left in the string*. For example, the string literal\n"r"\\n"" consists of two characters: a backslash and a lowercase "\'n\'".\nString quotes can be escaped with a backslash, but the backslash\nremains in the string; for example, "r"\\""" is a valid string literal\nconsisting of two characters: a backslash and a double quote; "r"\\""\nis not a valid string literal (even a raw string cannot end in an odd\nnumber of backslashes). Specifically, *a raw string cannot end in a\nsingle backslash* (since the backslash would escape the following\nquote character). Note also that a single backslash followed by a\nnewline is interpreted as those two characters as part of the string,\n*not* as a line continuation.\n\nWhen an "\'r\'" or "\'R\'" prefix is used in conjunction with a "\'u\'" or\n"\'U\'" prefix, then the "\\uXXXX" and "\\UXXXXXXXX" escape sequences are\nprocessed while *all other backslashes are left in the string*. For\nexample, the string literal "ur"\\u0062\\n"" consists of three Unicode\ncharacters: \'LATIN SMALL LETTER B\', \'REVERSE SOLIDUS\', and \'LATIN\nSMALL LETTER N\'. Backslashes can be escaped with a preceding\nbackslash; however, both remain in the string. As a result, "\\uXXXX"\nescape sequences are only recognized when there are an odd number of\nbackslashes.\n', + 'subscriptions': u'\nSubscriptions\n*************\n\nA subscription selects an item of a sequence (string, tuple or list)\nor mapping (dictionary) object:\n\n subscription ::= primary "[" expression_list "]"\n\nThe primary must evaluate to an object of a sequence or mapping type.\n\nIf the primary is a mapping, the expression list must evaluate to an\nobject whose value is one of the keys of the mapping, and the\nsubscription selects the value in the mapping that corresponds to that\nkey. (The expression list is a tuple except if it has exactly one\nitem.)\n\nIf the primary is a sequence, the expression (list) must evaluate to a\nplain integer. 
If this value is negative, the length of the sequence\nis added to it (so that, e.g., "x[-1]" selects the last item of "x".)\nThe resulting value must be a nonnegative integer less than the number\nof items in the sequence, and the subscription selects the item whose\nindex is that value (counting from zero).\n\nA string\'s items are characters. A character is not a separate data\ntype but a string of exactly one character.\n', + 'truth': u'\nTruth Value Testing\n*******************\n\nAny object can be tested for truth value, for use in an "if" or\n"while" condition or as operand of the Boolean operations below. The\nfollowing values are considered false:\n\n* "None"\n\n* "False"\n\n* zero of any numeric type, for example, "0", "0L", "0.0", "0j".\n\n* any empty sequence, for example, "\'\'", "()", "[]".\n\n* any empty mapping, for example, "{}".\n\n* instances of user-defined classes, if the class defines a\n "__nonzero__()" or "__len__()" method, when that method returns the\n integer zero or "bool" value "False". [1]\n\nAll other values are considered true --- so objects of many types are\nalways true.\n\nOperations and built-in functions that have a Boolean result always\nreturn "0" or "False" for false and "1" or "True" for true, unless\notherwise stated. (Important exception: the Boolean operations "or"\nand "and" always return one of their operands.)\n', + 'try': u'\nThe "try" statement\n*******************\n\nThe "try" statement specifies exception handlers and/or cleanup code\nfor a group of statements:\n\n try_stmt ::= try1_stmt | try2_stmt\n try1_stmt ::= "try" ":" suite\n ("except" [expression [("as" | ",") identifier]] ":" suite)+\n ["else" ":" suite]\n ["finally" ":" suite]\n try2_stmt ::= "try" ":" suite\n "finally" ":" suite\n\nChanged in version 2.5: In previous versions of Python,\n"try"..."except"..."finally" did not work. "try"..."except" had to be\nnested in "try"..."finally".\n\nThe "except" clause(s) specify one or more exception handlers. When no\nexception occurs in the "try" clause, no exception handler is\nexecuted. When an exception occurs in the "try" suite, a search for an\nexception handler is started. This search inspects the except clauses\nin turn until one is found that matches the exception. An expression-\nless except clause, if present, must be last; it matches any\nexception. For an except clause with an expression, that expression\nis evaluated, and the clause matches the exception if the resulting\nobject is "compatible" with the exception. An object is compatible\nwith an exception if it is the class or a base class of the exception\nobject, or a tuple containing an item compatible with the exception.\n\nIf no except clause matches the exception, the search for an exception\nhandler continues in the surrounding code and on the invocation stack.\n[1]\n\nIf the evaluation of an expression in the header of an except clause\nraises an exception, the original search for a handler is canceled and\na search starts for the new exception in the surrounding code and on\nthe call stack (it is treated as if the entire "try" statement raised\nthe exception).\n\nWhen a matching except clause is found, the exception is assigned to\nthe target specified in that except clause, if present, and the except\nclause\'s suite is executed. All except clauses must have an\nexecutable block. When the end of this block is reached, execution\ncontinues normally after the entire try statement. 
(This means that\nif two nested handlers exist for the same exception, and the exception\noccurs in the try clause of the inner handler, the outer handler will\nnot handle the exception.)\n\nBefore an except clause\'s suite is executed, details about the\nexception are assigned to three variables in the "sys" module:\n"sys.exc_type" receives the object identifying the exception;\n"sys.exc_value" receives the exception\'s parameter;\n"sys.exc_traceback" receives a traceback object (see section *The\nstandard type hierarchy*) identifying the point in the program where\nthe exception occurred. These details are also available through the\n"sys.exc_info()" function, which returns a tuple "(exc_type,\nexc_value, exc_traceback)". Use of the corresponding variables is\ndeprecated in favor of this function, since their use is unsafe in a\nthreaded program. As of Python 1.5, the variables are restored to\ntheir previous values (before the call) when returning from a function\nthat handled an exception.\n\nThe optional "else" clause is executed if and when control flows off\nthe end of the "try" clause. [2] Exceptions in the "else" clause are\nnot handled by the preceding "except" clauses.\n\nIf "finally" is present, it specifies a \'cleanup\' handler. The "try"\nclause is executed, including any "except" and "else" clauses. If an\nexception occurs in any of the clauses and is not handled, the\nexception is temporarily saved. The "finally" clause is executed. If\nthere is a saved exception, it is re-raised at the end of the\n"finally" clause. If the "finally" clause raises another exception or\nexecutes a "return" or "break" statement, the saved exception is\ndiscarded:\n\n >>> def f():\n ... try:\n ... 1/0\n ... finally:\n ... return 42\n ...\n >>> f()\n 42\n\nThe exception information is not available to the program during\nexecution of the "finally" clause.\n\nWhen a "return", "break" or "continue" statement is executed in the\n"try" suite of a "try"..."finally" statement, the "finally" clause is\nalso executed \'on the way out.\' A "continue" statement is illegal in\nthe "finally" clause. (The reason is a problem with the current\nimplementation --- this restriction may be lifted in the future).\n\nThe return value of a function is determined by the last "return"\nstatement executed. Since the "finally" clause always executes, a\n"return" statement executed in the "finally" clause will always be the\nlast one executed:\n\n >>> def foo():\n ... try:\n ... return \'try\'\n ... finally:\n ... return \'finally\'\n ...\n >>> foo()\n \'finally\'\n\nAdditional information on exceptions can be found in section\n*Exceptions*, and information on using the "raise" statement to\ngenerate exceptions may be found in section *The raise statement*.\n', + 'types': u'\nThe standard type hierarchy\n***************************\n\nBelow is a list of the types that are built into Python. Extension\nmodules (written in C, Java, or other languages, depending on the\nimplementation) can define additional types. Future versions of\nPython may add types to the type hierarchy (e.g., rational numbers,\nefficiently stored arrays of integers, etc.).\n\nSome of the type descriptions below contain a paragraph listing\n\'special attributes.\' These are attributes that provide access to the\nimplementation and are not intended for general use. Their definition\nmay change in the future.\n\nNone\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name "None". 
It\n is used to signify the absence of a value in many situations, e.g.,\n it is returned from functions that don\'t explicitly return\n anything. Its truth value is false.\n\nNotImplemented\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name\n "NotImplemented". Numeric methods and rich comparison methods may\n return this value if they do not implement the operation for the\n operands provided. (The interpreter will then try the reflected\n operation, or some other fallback, depending on the operator.) Its\n truth value is true.\n\nEllipsis\n This type has a single value. There is a single object with this\n value. This object is accessed through the built-in name\n "Ellipsis". It is used to indicate the presence of the "..." syntax\n in a slice. Its truth value is true.\n\n"numbers.Number"\n These are created by numeric literals and returned as results by\n arithmetic operators and arithmetic built-in functions. Numeric\n objects are immutable; once created their value never changes.\n Python numbers are of course strongly related to mathematical\n numbers, but subject to the limitations of numerical representation\n in computers.\n\n Python distinguishes between integers, floating point numbers, and\n complex numbers:\n\n "numbers.Integral"\n These represent elements from the mathematical set of integers\n (positive and negative).\n\n There are three types of integers:\n\n Plain integers\n These represent numbers in the range -2147483648 through\n 2147483647. (The range may be larger on machines with a\n larger natural word size, but not smaller.) When the result\n of an operation would fall outside this range, the result is\n normally returned as a long integer (in some cases, the\n exception "OverflowError" is raised instead). For the\n purpose of shift and mask operations, integers are assumed to\n have a binary, 2\'s complement notation using 32 or more bits,\n and hiding no bits from the user (i.e., all 4294967296\n different bit patterns correspond to different values).\n\n Long integers\n These represent numbers in an unlimited range, subject to\n available (virtual) memory only. For the purpose of shift\n and mask operations, a binary representation is assumed, and\n negative numbers are represented in a variant of 2\'s\n complement which gives the illusion of an infinite string of\n sign bits extending to the left.\n\n Booleans\n These represent the truth values False and True. The two\n objects representing the values "False" and "True" are the\n only Boolean objects. The Boolean type is a subtype of plain\n integers, and Boolean values behave like the values 0 and 1,\n respectively, in almost all contexts, the exception being\n that when converted to a string, the strings ""False"" or\n ""True"" are returned, respectively.\n\n The rules for integer representation are intended to give the\n most meaningful interpretation of shift and mask operations\n involving negative integers and the least surprises when\n switching between the plain and long integer domains. Any\n operation, if it yields a result in the plain integer domain,\n will yield the same result in the long integer domain or when\n using mixed operands. The switch between domains is transparent\n to the programmer.\n\n "numbers.Real" ("float")\n These represent machine-level double precision floating point\n numbers. 
You are at the mercy of the underlying machine\n architecture (and C or Java implementation) for the accepted\n range and handling of overflow. Python does not support single-\n precision floating point numbers; the savings in processor and\n memory usage that are usually the reason for using these are\n dwarfed by the overhead of using objects in Python, so there is\n no reason to complicate the language with two kinds of floating\n point numbers.\n\n "numbers.Complex"\n These represent complex numbers as a pair of machine-level\n double precision floating point numbers. The same caveats apply\n as for floating point numbers. The real and imaginary parts of a\n complex number "z" can be retrieved through the read-only\n attributes "z.real" and "z.imag".\n\nSequences\n These represent finite ordered sets indexed by non-negative\n numbers. The built-in function "len()" returns the number of items\n of a sequence. When the length of a sequence is *n*, the index set\n contains the numbers 0, 1, ..., *n*-1. Item *i* of sequence *a* is\n selected by "a[i]".\n\n Sequences also support slicing: "a[i:j]" selects all items with\n index *k* such that *i* "<=" *k* "<" *j*. When used as an\n expression, a slice is a sequence of the same type. This implies\n that the index set is renumbered so that it starts at 0.\n\n Some sequences also support "extended slicing" with a third "step"\n parameter: "a[i:j:k]" selects all items of *a* with index *x* where\n "x = i + n*k", *n* ">=" "0" and *i* "<=" *x* "<" *j*.\n\n Sequences are distinguished according to their mutability:\n\n Immutable sequences\n An object of an immutable sequence type cannot change once it is\n created. (If the object contains references to other objects,\n these other objects may be mutable and may be changed; however,\n the collection of objects directly referenced by an immutable\n object cannot change.)\n\n The following types are immutable sequences:\n\n Strings\n The items of a string are characters. There is no separate\n character type; a character is represented by a string of one\n item. Characters represent (at least) 8-bit bytes. The\n built-in functions "chr()" and "ord()" convert between\n characters and nonnegative integers representing the byte\n values. Bytes with the values 0-127 usually represent the\n corresponding ASCII values, but the interpretation of values\n is up to the program. The string data type is also used to\n represent arrays of bytes, e.g., to hold data read from a\n file.\n\n (On systems whose native character set is not ASCII, strings\n may use EBCDIC in their internal representation, provided the\n functions "chr()" and "ord()" implement a mapping between\n ASCII and EBCDIC, and string comparison preserves the ASCII\n order. Or perhaps someone can propose a better rule?)\n\n Unicode\n The items of a Unicode object are Unicode code units. A\n Unicode code unit is represented by a Unicode object of one\n item and can hold either a 16-bit or 32-bit value\n representing a Unicode ordinal (the maximum value for the\n ordinal is given in "sys.maxunicode", and depends on how\n Python is configured at compile time). Surrogate pairs may\n be present in the Unicode object, and will be reported as two\n separate items. The built-in functions "unichr()" and\n "ord()" convert between code units and nonnegative integers\n representing the Unicode ordinals as defined in the Unicode\n Standard 3.0. 
Conversion from and to other encodings are\n possible through the Unicode method "encode()" and the built-\n in function "unicode()".\n\n Tuples\n The items of a tuple are arbitrary Python objects. Tuples of\n two or more items are formed by comma-separated lists of\n expressions. A tuple of one item (a \'singleton\') can be\n formed by affixing a comma to an expression (an expression by\n itself does not create a tuple, since parentheses must be\n usable for grouping of expressions). An empty tuple can be\n formed by an empty pair of parentheses.\n\n Mutable sequences\n Mutable sequences can be changed after they are created. The\n subscription and slicing notations can be used as the target of\n assignment and "del" (delete) statements.\n\n There are currently two intrinsic mutable sequence types:\n\n Lists\n The items of a list are arbitrary Python objects. Lists are\n formed by placing a comma-separated list of expressions in\n square brackets. (Note that there are no special cases needed\n to form lists of length 0 or 1.)\n\n Byte Arrays\n A bytearray object is a mutable array. They are created by\n the built-in "bytearray()" constructor. Aside from being\n mutable (and hence unhashable), byte arrays otherwise provide\n the same interface and functionality as immutable bytes\n objects.\n\n The extension module "array" provides an additional example of a\n mutable sequence type.\n\nSet types\n These represent unordered, finite sets of unique, immutable\n objects. As such, they cannot be indexed by any subscript. However,\n they can be iterated over, and the built-in function "len()"\n returns the number of items in a set. Common uses for sets are fast\n membership testing, removing duplicates from a sequence, and\n computing mathematical operations such as intersection, union,\n difference, and symmetric difference.\n\n For set elements, the same immutability rules apply as for\n dictionary keys. Note that numeric types obey the normal rules for\n numeric comparison: if two numbers compare equal (e.g., "1" and\n "1.0"), only one of them can be contained in a set.\n\n There are currently two intrinsic set types:\n\n Sets\n These represent a mutable set. They are created by the built-in\n "set()" constructor and can be modified afterwards by several\n methods, such as "add()".\n\n Frozen sets\n These represent an immutable set. They are created by the\n built-in "frozenset()" constructor. As a frozenset is immutable\n and *hashable*, it can be used again as an element of another\n set, or as a dictionary key.\n\nMappings\n These represent finite sets of objects indexed by arbitrary index\n sets. The subscript notation "a[k]" selects the item indexed by "k"\n from the mapping "a"; this can be used in expressions and as the\n target of assignments or "del" statements. The built-in function\n "len()" returns the number of items in a mapping.\n\n There is currently a single intrinsic mapping type:\n\n Dictionaries\n These represent finite sets of objects indexed by nearly\n arbitrary values. 
The only types of values not acceptable as\n keys are values containing lists or dictionaries or other\n mutable types that are compared by value rather than by object\n identity, the reason being that the efficient implementation of\n dictionaries requires a key\'s hash value to remain constant.\n Numeric types used for keys obey the normal rules for numeric\n comparison: if two numbers compare equal (e.g., "1" and "1.0")\n then they can be used interchangeably to index the same\n dictionary entry.\n\n Dictionaries are mutable; they can be created by the "{...}"\n notation (see section *Dictionary displays*).\n\n The extension modules "dbm", "gdbm", and "bsddb" provide\n additional examples of mapping types.\n\nCallable types\n These are the types to which the function call operation (see\n section *Calls*) can be applied:\n\n User-defined functions\n A user-defined function object is created by a function\n definition (see section *Function definitions*). It should be\n called with an argument list containing the same number of items\n as the function\'s formal parameter list.\n\n Special attributes:\n\n +-------------------------+---------------------------------+-------------+\n | Attribute | Meaning | |\n +=========================+=================================+=============+\n | "__doc__" "func_doc" | The function\'s documentation | Writable |\n | | string, or "None" if | |\n | | unavailable. | |\n +-------------------------+---------------------------------+-------------+\n | "__name__" "func_name" | The function\'s name. | Writable |\n +-------------------------+---------------------------------+-------------+\n | "__module__" | The name of the module the | Writable |\n | | function was defined in, or | |\n | | "None" if unavailable. | |\n +-------------------------+---------------------------------+-------------+\n | "__defaults__" | A tuple containing default | Writable |\n | "func_defaults" | argument values for those | |\n | | arguments that have defaults, | |\n | | or "None" if no arguments have | |\n | | a default value. | |\n +-------------------------+---------------------------------+-------------+\n | "__code__" "func_code" | The code object representing | Writable |\n | | the compiled function body. | |\n +-------------------------+---------------------------------+-------------+\n | "__globals__" | A reference to the dictionary | Read-only |\n | "func_globals" | that holds the function\'s | |\n | | global variables --- the global | |\n | | namespace of the module in | |\n | | which the function was defined. | |\n +-------------------------+---------------------------------+-------------+\n | "__dict__" "func_dict" | The namespace supporting | Writable |\n | | arbitrary function attributes. | |\n +-------------------------+---------------------------------+-------------+\n | "__closure__" | "None" or a tuple of cells that | Read-only |\n | "func_closure" | contain bindings for the | |\n | | function\'s free variables. 
| |\n +-------------------------+---------------------------------+-------------+\n\n Most of the attributes labelled "Writable" check the type of the\n assigned value.\n\n Changed in version 2.4: "func_name" is now writable.\n\n Changed in version 2.6: The double-underscore attributes\n "__closure__", "__code__", "__defaults__", and "__globals__"\n were introduced as aliases for the corresponding "func_*"\n attributes for forwards compatibility with Python 3.\n\n Function objects also support getting and setting arbitrary\n attributes, which can be used, for example, to attach metadata\n to functions. Regular attribute dot-notation is used to get and\n set such attributes. *Note that the current implementation only\n supports function attributes on user-defined functions. Function\n attributes on built-in functions may be supported in the\n future.*\n\n Additional information about a function\'s definition can be\n retrieved from its code object; see the description of internal\n types below.\n\n User-defined methods\n A user-defined method object combines a class, a class instance\n (or "None") and any callable object (normally a user-defined\n function).\n\n Special read-only attributes: "im_self" is the class instance\n object, "im_func" is the function object; "im_class" is the\n class of "im_self" for bound methods or the class that asked for\n the method for unbound methods; "__doc__" is the method\'s\n documentation (same as "im_func.__doc__"); "__name__" is the\n method name (same as "im_func.__name__"); "__module__" is the\n name of the module the method was defined in, or "None" if\n unavailable.\n\n Changed in version 2.2: "im_self" used to refer to the class\n that defined the method.\n\n Changed in version 2.6: For Python 3 forward-compatibility,\n "im_func" is also available as "__func__", and "im_self" as\n "__self__".\n\n Methods also support accessing (but not setting) the arbitrary\n function attributes on the underlying function object.\n\n User-defined method objects may be created when getting an\n attribute of a class (perhaps via an instance of that class), if\n that attribute is a user-defined function object, an unbound\n user-defined method object, or a class method object. When the\n attribute is a user-defined method object, a new method object\n is only created if the class from which it is being retrieved is\n the same as, or a derived class of, the class stored in the\n original method object; otherwise, the original method object is\n used as it is.\n\n When a user-defined method object is created by retrieving a\n user-defined function object from a class, its "im_self"\n attribute is "None" and the method object is said to be unbound.\n When one is created by retrieving a user-defined function object\n from a class via one of its instances, its "im_self" attribute\n is the instance, and the method object is said to be bound. 
In\n either case, the new method\'s "im_class" attribute is the class\n from which the retrieval takes place, and its "im_func"\n attribute is the original function object.\n\n When a user-defined method object is created by retrieving\n another method object from a class or instance, the behaviour is\n the same as for a function object, except that the "im_func"\n attribute of the new instance is not the original method object\n but its "im_func" attribute.\n\n When a user-defined method object is created by retrieving a\n class method object from a class or instance, its "im_self"\n attribute is the class itself, and its "im_func" attribute is\n the function object underlying the class method.\n\n When an unbound user-defined method object is called, the\n underlying function ("im_func") is called, with the restriction\n that the first argument must be an instance of the proper class\n ("im_class") or of a derived class thereof.\n\n When a bound user-defined method object is called, the\n underlying function ("im_func") is called, inserting the class\n instance ("im_self") in front of the argument list. For\n instance, when "C" is a class which contains a definition for a\n function "f()", and "x" is an instance of "C", calling "x.f(1)"\n is equivalent to calling "C.f(x, 1)".\n\n When a user-defined method object is derived from a class method\n object, the "class instance" stored in "im_self" will actually\n be the class itself, so that calling either "x.f(1)" or "C.f(1)"\n is equivalent to calling "f(C,1)" where "f" is the underlying\n function.\n\n Note that the transformation from function object to (unbound or\n bound) method object happens each time the attribute is\n retrieved from the class or instance. In some cases, a fruitful\n optimization is to assign the attribute to a local variable and\n call that local variable. Also notice that this transformation\n only happens for user-defined functions; other callable objects\n (and all non-callable objects) are retrieved without\n transformation. It is also important to note that user-defined\n functions which are attributes of a class instance are not\n converted to bound methods; this *only* happens when the\n function is an attribute of the class.\n\n Generator functions\n A function or method which uses the "yield" statement (see\n section *The yield statement*) is called a *generator function*.\n Such a function, when called, always returns an iterator object\n which can be used to execute the body of the function: calling\n the iterator\'s "next()" method will cause the function to\n execute until it provides a value using the "yield" statement.\n When the function executes a "return" statement or falls off the\n end, a "StopIteration" exception is raised and the iterator will\n have reached the end of the set of values to be returned.\n\n Built-in functions\n A built-in function object is a wrapper around a C function.\n Examples of built-in functions are "len()" and "math.sin()"\n ("math" is a standard built-in module). The number and type of\n the arguments are determined by the C function. 
Special read-\n only attributes: "__doc__" is the function\'s documentation\n string, or "None" if unavailable; "__name__" is the function\'s\n name; "__self__" is set to "None" (but see the next item);\n "__module__" is the name of the module the function was defined\n in or "None" if unavailable.\n\n Built-in methods\n This is really a different disguise of a built-in function, this\n time containing an object passed to the C function as an\n implicit extra argument. An example of a built-in method is\n "alist.append()", assuming *alist* is a list object. In this\n case, the special read-only attribute "__self__" is set to the\n object denoted by *alist*.\n\n Class Types\n Class types, or "new-style classes," are callable. These\n objects normally act as factories for new instances of\n themselves, but variations are possible for class types that\n override "__new__()". The arguments of the call are passed to\n "__new__()" and, in the typical case, to "__init__()" to\n initialize the new instance.\n\n Classic Classes\n Class objects are described below. When a class object is\n called, a new class instance (also described below) is created\n and returned. This implies a call to the class\'s "__init__()"\n method if it has one. Any arguments are passed on to the\n "__init__()" method. If there is no "__init__()" method, the\n class must be called without arguments.\n\n Class instances\n Class instances are described below. Class instances are\n callable only when the class has a "__call__()" method;\n "x(arguments)" is a shorthand for "x.__call__(arguments)".\n\nModules\n Modules are imported by the "import" statement (see section *The\n import statement*). A module object has a namespace implemented by\n a dictionary object (this is the dictionary referenced by the\n func_globals attribute of functions defined in the module).\n Attribute references are translated to lookups in this dictionary,\n e.g., "m.x" is equivalent to "m.__dict__["x"]". A module object\n does not contain the code object used to initialize the module\n (since it isn\'t needed once the initialization is done).\n\n Attribute assignment updates the module\'s namespace dictionary,\n e.g., "m.x = 1" is equivalent to "m.__dict__["x"] = 1".\n\n Special read-only attribute: "__dict__" is the module\'s namespace\n as a dictionary object.\n\n **CPython implementation detail:** Because of the way CPython\n clears module dictionaries, the module dictionary will be cleared\n when the module falls out of scope even if the dictionary still has\n live references. To avoid this, copy the dictionary or keep the\n module around while using its dictionary directly.\n\n Predefined (writable) attributes: "__name__" is the module\'s name;\n "__doc__" is the module\'s documentation string, or "None" if\n unavailable; "__file__" is the pathname of the file from which the\n module was loaded, if it was loaded from a file. The "__file__"\n attribute is not present for C modules that are statically linked\n into the interpreter; for extension modules loaded dynamically from\n a shared library, it is the pathname of the shared library file.\n\nClasses\n Both class types (new-style classes) and class objects (old-\n style/classic classes) are typically created by class definitions\n (see section *Class definitions*). A class has a namespace\n implemented by a dictionary object. 
Class attribute references are\n translated to lookups in this dictionary, e.g., "C.x" is translated\n to "C.__dict__["x"]" (although for new-style classes in particular\n there are a number of hooks which allow for other means of locating\n attributes). When the attribute name is not found there, the\n attribute search continues in the base classes. For old-style\n classes, the search is depth-first, left-to-right in the order of\n occurrence in the base class list. New-style classes use the more\n complex C3 method resolution order which behaves correctly even in\n the presence of \'diamond\' inheritance structures where there are\n multiple inheritance paths leading back to a common ancestor.\n Additional details on the C3 MRO used by new-style classes can be\n found in the documentation accompanying the 2.3 release at\n https://www.python.org/download/releases/2.3/mro/.\n\n When a class attribute reference (for class "C", say) would yield a\n user-defined function object or an unbound user-defined method\n object whose associated class is either "C" or one of its base\n classes, it is transformed into an unbound user-defined method\n object whose "im_class" attribute is "C". When it would yield a\n class method object, it is transformed into a bound user-defined\n method object whose "im_self" attribute is "C". When it would\n yield a static method object, it is transformed into the object\n wrapped by the static method object. See section *Implementing\n Descriptors* for another way in which attributes retrieved from a\n class may differ from those actually contained in its "__dict__"\n (note that only new-style classes support descriptors).\n\n Class attribute assignments update the class\'s dictionary, never\n the dictionary of a base class.\n\n A class object can be called (see above) to yield a class instance\n (see below).\n\n Special attributes: "__name__" is the class name; "__module__" is\n the module name in which the class was defined; "__dict__" is the\n dictionary containing the class\'s namespace; "__bases__" is a tuple\n (possibly empty or a singleton) containing the base classes, in the\n order of their occurrence in the base class list; "__doc__" is the\n class\'s documentation string, or None if undefined.\n\nClass instances\n A class instance is created by calling a class object (see above).\n A class instance has a namespace implemented as a dictionary which\n is the first place in which attribute references are searched.\n When an attribute is not found there, and the instance\'s class has\n an attribute by that name, the search continues with the class\n attributes. If a class attribute is found that is a user-defined\n function object or an unbound user-defined method object whose\n associated class is the class (call it "C") of the instance for\n which the attribute reference was initiated or one of its bases, it\n is transformed into a bound user-defined method object whose\n "im_class" attribute is "C" and whose "im_self" attribute is the\n instance. Static method and class method objects are also\n transformed, as if they had been retrieved from class "C"; see\n above under "Classes". See section *Implementing Descriptors* for\n another way in which attributes of a class retrieved via its\n instances may differ from the objects actually stored in the\n class\'s "__dict__". 
If no class attribute is found, and the\n object\'s class has a "__getattr__()" method, that is called to\n satisfy the lookup.\n\n Attribute assignments and deletions update the instance\'s\n dictionary, never a class\'s dictionary. If the class has a\n "__setattr__()" or "__delattr__()" method, this is called instead\n of updating the instance dictionary directly.\n\n Class instances can pretend to be numbers, sequences, or mappings\n if they have methods with certain special names. See section\n *Special method names*.\n\n Special attributes: "__dict__" is the attribute dictionary;\n "__class__" is the instance\'s class.\n\nFiles\n A file object represents an open file. File objects are created by\n the "open()" built-in function, and also by "os.popen()",\n "os.fdopen()", and the "makefile()" method of socket objects (and\n perhaps by other functions or methods provided by extension\n modules). The objects "sys.stdin", "sys.stdout" and "sys.stderr"\n are initialized to file objects corresponding to the interpreter\'s\n standard input, output and error streams. See *File Objects* for\n complete documentation of file objects.\n\nInternal types\n A few types used internally by the interpreter are exposed to the\n user. Their definitions may change with future versions of the\n interpreter, but they are mentioned here for completeness.\n\n Code objects\n Code objects represent *byte-compiled* executable Python code,\n or *bytecode*. The difference between a code object and a\n function object is that the function object contains an explicit\n reference to the function\'s globals (the module in which it was\n defined), while a code object contains no context; also the\n default argument values are stored in the function object, not\n in the code object (because they represent values calculated at\n run-time). 
Unlike function objects, code objects are immutable\n and contain no references (directly or indirectly) to mutable\n objects.\n\n Special read-only attributes: "co_name" gives the function name;\n "co_argcount" is the number of positional arguments (including\n arguments with default values); "co_nlocals" is the number of\n local variables used by the function (including arguments);\n "co_varnames" is a tuple containing the names of the local\n variables (starting with the argument names); "co_cellvars" is a\n tuple containing the names of local variables that are\n referenced by nested functions; "co_freevars" is a tuple\n containing the names of free variables; "co_code" is a string\n representing the sequence of bytecode instructions; "co_consts"\n is a tuple containing the literals used by the bytecode;\n "co_names" is a tuple containing the names used by the bytecode;\n "co_filename" is the filename from which the code was compiled;\n "co_firstlineno" is the first line number of the function;\n "co_lnotab" is a string encoding the mapping from bytecode\n offsets to line numbers (for details see the source code of the\n interpreter); "co_stacksize" is the required stack size\n (including local variables); "co_flags" is an integer encoding a\n number of flags for the interpreter.\n\n The following flag bits are defined for "co_flags": bit "0x04"\n is set if the function uses the "*arguments" syntax to accept an\n arbitrary number of positional arguments; bit "0x08" is set if\n the function uses the "**keywords" syntax to accept arbitrary\n keyword arguments; bit "0x20" is set if the function is a\n generator.\n\n Future feature declarations ("from __future__ import division")\n also use bits in "co_flags" to indicate whether a code object\n was compiled with a particular feature enabled: bit "0x2000" is\n set if the function was compiled with future division enabled;\n bits "0x10" and "0x1000" were used in earlier versions of\n Python.\n\n Other bits in "co_flags" are reserved for internal use.\n\n If a code object represents a function, the first item in\n "co_consts" is the documentation string of the function, or\n "None" if undefined.\n\n Frame objects\n Frame objects represent execution frames. They may occur in\n traceback objects (see below).\n\n Special read-only attributes: "f_back" is to the previous stack\n frame (towards the caller), or "None" if this is the bottom\n stack frame; "f_code" is the code object being executed in this\n frame; "f_locals" is the dictionary used to look up local\n variables; "f_globals" is used for global variables;\n "f_builtins" is used for built-in (intrinsic) names;\n "f_restricted" is a flag indicating whether the function is\n executing in restricted execution mode; "f_lasti" gives the\n precise instruction (this is an index into the bytecode string\n of the code object).\n\n Special writable attributes: "f_trace", if not "None", is a\n function called at the start of each source code line (this is\n used by the debugger); "f_exc_type", "f_exc_value",\n "f_exc_traceback" represent the last exception raised in the\n parent frame provided another exception was ever raised in the\n current frame (in all other cases they are None); "f_lineno" is\n the current line number of the frame --- writing to this from\n within a trace function jumps to the given line (only for the\n bottom-most frame). 
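A small sketch of these frame attributes (hypothetical function names; "sys._getframe()" is a CPython-specific helper used here only for illustration):

   >>> import sys
   >>> def inner():
   ...     f = sys._getframe()          # the frame currently executing inner()
   ...     return f.f_code.co_name, f.f_back.f_code.co_name
   ...
   >>> def outer():
   ...     return inner()
   ...
   >>> outer()                          # f_back leads to the caller's frame
   ('inner', 'outer')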
A debugger can implement a Jump command\n (aka Set Next Statement) by writing to f_lineno.\n\n Traceback objects\n Traceback objects represent a stack trace of an exception. A\n traceback object is created when an exception occurs. When the\n search for an exception handler unwinds the execution stack, at\n each unwound level a traceback object is inserted in front of\n the current traceback. When an exception handler is entered,\n the stack trace is made available to the program. (See section\n *The try statement*.) It is accessible as "sys.exc_traceback",\n and also as the third item of the tuple returned by\n "sys.exc_info()". The latter is the preferred interface, since\n it works correctly when the program is using multiple threads.\n When the program contains no suitable handler, the stack trace\n is written (nicely formatted) to the standard error stream; if\n the interpreter is interactive, it is also made available to the\n user as "sys.last_traceback".\n\n Special read-only attributes: "tb_next" is the next level in the\n stack trace (towards the frame where the exception occurred), or\n "None" if there is no next level; "tb_frame" points to the\n execution frame of the current level; "tb_lineno" gives the line\n number where the exception occurred; "tb_lasti" indicates the\n precise instruction. The line number and last instruction in\n the traceback may differ from the line number of its frame\n object if the exception occurred in a "try" statement with no\n matching except clause or with a finally clause.\n\n Slice objects\n Slice objects are used to represent slices when *extended slice\n syntax* is used. This is a slice using two colons, or multiple\n slices or ellipses separated by commas, e.g., "a[i:j:step]",\n "a[i:j, k:l]", or "a[..., i:j]". They are also created by the\n built-in "slice()" function.\n\n Special read-only attributes: "start" is the lower bound; "stop"\n is the upper bound; "step" is the step value; each is "None" if\n omitted. These attributes can have any type.\n\n Slice objects support one method:\n\n slice.indices(self, length)\n\n This method takes a single integer argument *length* and\n computes information about the extended slice that the slice\n object would describe if applied to a sequence of *length*\n items. It returns a tuple of three integers; respectively\n these are the *start* and *stop* indices and the *step* or\n stride length of the slice. Missing or out-of-bounds indices\n are handled in a manner consistent with regular slices.\n\n New in version 2.3.\n\n Static method objects\n Static method objects provide a way of defeating the\n transformation of function objects to method objects described\n above. A static method object is a wrapper around any other\n object, usually a user-defined method object. When a static\n method object is retrieved from a class or a class instance, the\n object actually returned is the wrapped object, which is not\n subject to any further transformation. Static method objects are\n not themselves callable, although the objects they wrap usually\n are. Static method objects are created by the built-in\n "staticmethod()" constructor.\n\n Class method objects\n A class method object, like a static method object, is a wrapper\n around another object that alters the way in which that object\n is retrieved from classes and class instances. The behaviour of\n class method objects upon such retrieval is described above,\n under "User-defined methods". 
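For instance, a brief sketch of both kinds of wrapper (hypothetical class; CPython 2.7 assumed):

   >>> class C(object):
   ...     @staticmethod
   ...     def s():
   ...         return 'plain function, no binding'
   ...     @classmethod
   ...     def c(cls):
   ...         return cls.__name__
   ...
   >>> C.s()        # retrieval hands back the wrapped function unchanged
   'plain function, no binding'
   >>> C().c()      # the class, not the instance, is bound as im_self
   'C'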
Class method objects are created\n by the built-in "classmethod()" constructor.\n', + 'typesfunctions': u'\nFunctions\n*********\n\nFunction objects are created by function definitions. The only\noperation on a function object is to call it: "func(argument-list)".\n\nThere are really two flavors of function objects: built-in functions\nand user-defined functions. Both support the same operation (to call\nthe function), but the implementation is different, hence the\ndifferent object types.\n\nSee *Function definitions* for more information.\n', + 'typesmapping': u'\nMapping Types --- "dict"\n************************\n\nA *mapping* object maps *hashable* values to arbitrary objects.\nMappings are mutable objects. There is currently only one standard\nmapping type, the *dictionary*. (For other containers see the built\nin "list", "set", and "tuple" classes, and the "collections" module.)\n\nA dictionary\'s keys are *almost* arbitrary values. Values that are\nnot *hashable*, that is, values containing lists, dictionaries or\nother mutable types (that are compared by value rather than by object\nidentity) may not be used as keys. Numeric types used for keys obey\nthe normal rules for numeric comparison: if two numbers compare equal\n(such as "1" and "1.0") then they can be used interchangeably to index\nthe same dictionary entry. (Note however, that since computers store\nfloating-point numbers as approximations it is usually unwise to use\nthem as dictionary keys.)\n\nDictionaries can be created by placing a comma-separated list of "key:\nvalue" pairs within braces, for example: "{\'jack\': 4098, \'sjoerd\':\n4127}" or "{4098: \'jack\', 4127: \'sjoerd\'}", or by the "dict"\nconstructor.\n\nclass class dict(**kwarg)\nclass class dict(mapping, **kwarg)\nclass class dict(iterable, **kwarg)\n\n Return a new dictionary initialized from an optional positional\n argument and a possibly empty set of keyword arguments.\n\n If no positional argument is given, an empty dictionary is created.\n If a positional argument is given and it is a mapping object, a\n dictionary is created with the same key-value pairs as the mapping\n object. Otherwise, the positional argument must be an *iterable*\n object. Each item in the iterable must itself be an iterable with\n exactly two objects. The first object of each item becomes a key\n in the new dictionary, and the second object the corresponding\n value. If a key occurs more than once, the last value for that key\n becomes the corresponding value in the new dictionary.\n\n If keyword arguments are given, the keyword arguments and their\n values are added to the dictionary created from the positional\n argument. If a key being added is already present, the value from\n the keyword argument replaces the value from the positional\n argument.\n\n To illustrate, the following examples all return a dictionary equal\n to "{"one": 1, "two": 2, "three": 3}":\n\n >>> a = dict(one=1, two=2, three=3)\n >>> b = {\'one\': 1, \'two\': 2, \'three\': 3}\n >>> c = dict(zip([\'one\', \'two\', \'three\'], [1, 2, 3]))\n >>> d = dict([(\'two\', 2), (\'one\', 1), (\'three\', 3)])\n >>> e = dict({\'three\': 3, \'one\': 1, \'two\': 2})\n >>> a == b == c == d == e\n True\n\n Providing keyword arguments as in the first example only works for\n keys that are valid Python identifiers. 
Otherwise, any valid keys\n can be used.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for building a dictionary from\n keyword arguments added.\n\n These are the operations that dictionaries support (and therefore,\n custom mapping types should support too):\n\n len(d)\n\n Return the number of items in the dictionary *d*.\n\n d[key]\n\n Return the item of *d* with key *key*. Raises a "KeyError" if\n *key* is not in the map.\n\n New in version 2.5: If a subclass of dict defines a method\n "__missing__()", if the key *key* is not present, the "d[key]"\n operation calls that method with the key *key* as argument. The\n "d[key]" operation then returns or raises whatever is returned\n or raised by the "__missing__(key)" call if the key is not\n present. No other operations or methods invoke "__missing__()".\n If "__missing__()" is not defined, "KeyError" is raised.\n "__missing__()" must be a method; it cannot be an instance\n variable. For an example, see "collections.defaultdict".\n\n d[key] = value\n\n Set "d[key]" to *value*.\n\n del d[key]\n\n Remove "d[key]" from *d*. Raises a "KeyError" if *key* is not\n in the map.\n\n key in d\n\n Return "True" if *d* has a key *key*, else "False".\n\n New in version 2.2.\n\n key not in d\n\n Equivalent to "not key in d".\n\n New in version 2.2.\n\n iter(d)\n\n Return an iterator over the keys of the dictionary. This is a\n shortcut for "iterkeys()".\n\n clear()\n\n Remove all items from the dictionary.\n\n copy()\n\n Return a shallow copy of the dictionary.\n\n fromkeys(seq[, value])\n\n Create a new dictionary with keys from *seq* and values set to\n *value*.\n\n "fromkeys()" is a class method that returns a new dictionary.\n *value* defaults to "None".\n\n New in version 2.3.\n\n get(key[, default])\n\n Return the value for *key* if *key* is in the dictionary, else\n *default*. If *default* is not given, it defaults to "None", so\n that this method never raises a "KeyError".\n\n has_key(key)\n\n Test for the presence of *key* in the dictionary. "has_key()"\n is deprecated in favor of "key in d".\n\n items()\n\n Return a copy of the dictionary\'s list of "(key, value)" pairs.\n\n **CPython implementation detail:** Keys and values are listed in\n an arbitrary order which is non-random, varies across Python\n implementations, and depends on the dictionary\'s history of\n insertions and deletions.\n\n If "items()", "keys()", "values()", "iteritems()", "iterkeys()",\n and "itervalues()" are called with no intervening modifications\n to the dictionary, the lists will directly correspond. This\n allows the creation of "(value, key)" pairs using "zip()":\n "pairs = zip(d.values(), d.keys())". The same relationship\n holds for the "iterkeys()" and "itervalues()" methods: "pairs =\n zip(d.itervalues(), d.iterkeys())" provides the same value for\n "pairs". Another way to create the same list is "pairs = [(v, k)\n for (k, v) in d.iteritems()]".\n\n iteritems()\n\n Return an iterator over the dictionary\'s "(key, value)" pairs.\n See the note for "dict.items()".\n\n Using "iteritems()" while adding or deleting entries in the\n dictionary may raise a "RuntimeError" or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n iterkeys()\n\n Return an iterator over the dictionary\'s keys. 
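As an aside, a minimal sketch of the "__missing__()" hook described above (hypothetical subclass; requires Python 2.5 or later):

   >>> class ZeroDict(dict):
   ...     def __missing__(self, key):      # consulted only by d[key] lookups
   ...         return 0
   ...
   >>> d = ZeroDict()
   >>> d['spam']                            # missing key, so __missing__ supplies 0
   0
   >>> d['spam'] += 1                       # reads 0 via __missing__, then stores 1
   >>> d
   {'spam': 1}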
See the note for\n "dict.items()".\n\n Using "iterkeys()" while adding or deleting entries in the\n dictionary may raise a "RuntimeError" or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n itervalues()\n\n Return an iterator over the dictionary\'s values. See the note\n for "dict.items()".\n\n Using "itervalues()" while adding or deleting entries in the\n dictionary may raise a "RuntimeError" or fail to iterate over\n all entries.\n\n New in version 2.2.\n\n keys()\n\n Return a copy of the dictionary\'s list of keys. See the note\n for "dict.items()".\n\n pop(key[, default])\n\n If *key* is in the dictionary, remove it and return its value,\n else return *default*. If *default* is not given and *key* is\n not in the dictionary, a "KeyError" is raised.\n\n New in version 2.3.\n\n popitem()\n\n Remove and return an arbitrary "(key, value)" pair from the\n dictionary.\n\n "popitem()" is useful to destructively iterate over a\n dictionary, as often used in set algorithms. If the dictionary\n is empty, calling "popitem()" raises a "KeyError".\n\n setdefault(key[, default])\n\n If *key* is in the dictionary, return its value. If not, insert\n *key* with a value of *default* and return *default*. *default*\n defaults to "None".\n\n update([other])\n\n Update the dictionary with the key/value pairs from *other*,\n overwriting existing keys. Return "None".\n\n "update()" accepts either another dictionary object or an\n iterable of key/value pairs (as tuples or other iterables of\n length two). If keyword arguments are specified, the dictionary\n is then updated with those key/value pairs: "d.update(red=1,\n blue=2)".\n\n Changed in version 2.4: Allowed the argument to be an iterable\n of key/value pairs and allowed keyword arguments.\n\n values()\n\n Return a copy of the dictionary\'s list of values. See the note\n for "dict.items()".\n\n viewitems()\n\n Return a new view of the dictionary\'s items ("(key, value)"\n pairs). See below for documentation of view objects.\n\n New in version 2.7.\n\n viewkeys()\n\n Return a new view of the dictionary\'s keys. See below for\n documentation of view objects.\n\n New in version 2.7.\n\n viewvalues()\n\n Return a new view of the dictionary\'s values. See below for\n documentation of view objects.\n\n New in version 2.7.\n\n\nDictionary view objects\n=======================\n\nThe objects returned by "dict.viewkeys()", "dict.viewvalues()" and\n"dict.viewitems()" are *view objects*. They provide a dynamic view on\nthe dictionary\'s entries, which means that when the dictionary\nchanges, the view reflects these changes.\n\nDictionary views can be iterated over to yield their respective data,\nand support membership tests:\n\nlen(dictview)\n\n Return the number of entries in the dictionary.\n\niter(dictview)\n\n Return an iterator over the keys, values or items (represented as\n tuples of "(key, value)") in the dictionary.\n\n Keys and values are iterated over in an arbitrary order which is\n non-random, varies across Python implementations, and depends on\n the dictionary\'s history of insertions and deletions. If keys,\n values and items views are iterated over with no intervening\n modifications to the dictionary, the order of items will directly\n correspond. This allows the creation of "(value, key)" pairs using\n "zip()": "pairs = zip(d.values(), d.keys())". 
Another way to\n create the same list is "pairs = [(v, k) for (k, v) in d.items()]".\n\n Iterating views while adding or deleting entries in the dictionary\n may raise a "RuntimeError" or fail to iterate over all entries.\n\nx in dictview\n\n Return "True" if *x* is in the underlying dictionary\'s keys, values\n or items (in the latter case, *x* should be a "(key, value)"\n tuple).\n\nKeys views are set-like since their entries are unique and hashable.\nIf all values are hashable, so that (key, value) pairs are unique and\nhashable, then the items view is also set-like. (Values views are not\ntreated as set-like since the entries are generally not unique.) Then\nthese set operations are available ("other" refers either to another\nview or a set):\n\ndictview & other\n\n Return the intersection of the dictview and the other object as a\n new set.\n\ndictview | other\n\n Return the union of the dictview and the other object as a new set.\n\ndictview - other\n\n Return the difference between the dictview and the other object\n (all elements in *dictview* that aren\'t in *other*) as a new set.\n\ndictview ^ other\n\n Return the symmetric difference (all elements either in *dictview*\n or *other*, but not in both) of the dictview and the other object\n as a new set.\n\nAn example of dictionary view usage:\n\n >>> dishes = {\'eggs\': 2, \'sausage\': 1, \'bacon\': 1, \'spam\': 500}\n >>> keys = dishes.viewkeys()\n >>> values = dishes.viewvalues()\n\n >>> # iteration\n >>> n = 0\n >>> for val in values:\n ... n += val\n >>> print(n)\n 504\n\n >>> # keys and values are iterated over in the same order\n >>> list(keys)\n [\'eggs\', \'bacon\', \'sausage\', \'spam\']\n >>> list(values)\n [2, 1, 1, 500]\n\n >>> # view objects are dynamic and reflect dict changes\n >>> del dishes[\'eggs\']\n >>> del dishes[\'sausage\']\n >>> list(keys)\n [\'spam\', \'bacon\']\n\n >>> # set operations\n >>> keys & {\'eggs\', \'bacon\', \'salad\'}\n {\'bacon\'}\n', + 'typesmethods': u'\nMethods\n*******\n\nMethods are functions that are called using the attribute notation.\nThere are two flavors: built-in methods (such as "append()" on lists)\nand class instance methods. Built-in methods are described with the\ntypes that support them.\n\nThe implementation adds two special read-only attributes to class\ninstance methods: "m.im_self" is the object on which the method\noperates, and "m.im_func" is the function implementing the method.\nCalling "m(arg-1, arg-2, ..., arg-n)" is completely equivalent to\ncalling "m.im_func(m.im_self, arg-1, arg-2, ..., arg-n)".\n\nClass instance methods are either *bound* or *unbound*, referring to\nwhether the method was accessed through an instance or a class,\nrespectively. When a method is unbound, its "im_self" attribute will\nbe "None" and if called, an explicit "self" object must be passed as\nthe first argument. In this case, "self" must be an instance of the\nunbound method\'s class (or a subclass of that class), otherwise a\n"TypeError" is raised.\n\nLike function objects, methods objects support getting arbitrary\nattributes. However, since method attributes are actually stored on\nthe underlying function object ("meth.im_func"), setting method\nattributes on either bound or unbound methods is disallowed.\nAttempting to set an attribute on a method results in an\n"AttributeError" being raised. In order to set a method attribute,\nyou need to explicitly set it on the underlying function object:\n\n >>> class C:\n ... def method(self):\n ... 
pass\n ...\n >>> c = C()\n >>> c.method.whoami = \'my name is method\' # can\'t set on the method\n Traceback (most recent call last):\n File "<stdin>", line 1, in <module>\n AttributeError: \'instancemethod\' object has no attribute \'whoami\'\n >>> c.method.im_func.whoami = \'my name is method\'\n >>> c.method.whoami\n \'my name is method\'\n\nSee *The standard type hierarchy* for more information.\n', + 'typesmodules': u'\nModules\n*******\n\nThe only special operation on a module is attribute access: "m.name",\nwhere *m* is a module and *name* accesses a name defined in *m*\'s\nsymbol table. Module attributes can be assigned to. (Note that the\n"import" statement is not, strictly speaking, an operation on a module\nobject; "import foo" does not require a module object named *foo* to\nexist, rather it requires an (external) *definition* for a module\nnamed *foo* somewhere.)\n\nA special attribute of every module is "__dict__". This is the\ndictionary containing the module\'s symbol table. Modifying this\ndictionary will actually change the module\'s symbol table, but direct\nassignment to the "__dict__" attribute is not possible (you can write\n"m.__dict__[\'a\'] = 1", which defines "m.a" to be "1", but you can\'t\nwrite "m.__dict__ = {}"). Modifying "__dict__" directly is not\nrecommended.\n\nModules built into the interpreter are written like this: "<module \'sys\' (built-in)>". If loaded from a file, they are written as\n"<module \'os\' from \'/usr/local/lib/pythonX.Y/os.pyc\'>".\n', + 'typesseq': u'\nSequence Types --- "str", "unicode", "list", "tuple", "bytearray", "buffer", "xrange"\n*************************************************************************************\n\nThere are seven sequence types: strings, Unicode strings, lists,\ntuples, bytearrays, buffers, and xrange objects.\n\nFor other containers see the built in "dict" and "set" classes, and\nthe "collections" module.\n\nString literals are written in single or double quotes: "\'xyzzy\'",\n""frobozz"". See *String literals* for more about string literals.\nUnicode strings are much like strings, but are specified in the syntax\nusing a preceding "\'u\'" character: "u\'abc\'", "u"def"". In addition to\nthe functionality described here, there are also string-specific\nmethods described in the *String Methods* section. Lists are\nconstructed with square brackets, separating items with commas: "[a,\nb, c]". Tuples are constructed by the comma operator (not within\nsquare brackets), with or without enclosing parentheses, but an empty\ntuple must have the enclosing parentheses, such as "a, b, c" or "()".\nA single item tuple must have a trailing comma, such as "(d,)".\n\nBytearray objects are created with the built-in function\n"bytearray()".\n\nBuffer objects are not directly supported by Python syntax, but can be\ncreated by calling the built-in function "buffer()". They don\'t\nsupport concatenation or repetition.\n\nObjects of type xrange are similar to buffers in that there is no\nspecific syntax to create them, but they are created using the\n"xrange()" function. They don\'t support slicing, concatenation or\nrepetition, and using "in", "not in", "min()" or "max()" on them is\ninefficient.\n\nMost sequence types support the following operations. The "in" and\n"not in" operations have the same priorities as the comparison\noperations. The "+" and "*" operations have the same priority as the\ncorresponding numeric operations. 
[3] Additional methods are provided\nfor *Mutable Sequence Types*.\n\nThis table lists the sequence operations sorted in ascending priority.\nIn the table, *s* and *t* are sequences of the same type; *n*, *i* and\n*j* are integers:\n\n+--------------------+----------------------------------+------------+\n| Operation | Result | Notes |\n+====================+==================================+============+\n| "x in s" | "True" if an item of *s* is | (1) |\n| | equal to *x*, else "False" | |\n+--------------------+----------------------------------+------------+\n| "x not in s" | "False" if an item of *s* is | (1) |\n| | equal to *x*, else "True" | |\n+--------------------+----------------------------------+------------+\n| "s + t" | the concatenation of *s* and *t* | (6) |\n+--------------------+----------------------------------+------------+\n| "s * n, n * s" | *n* shallow copies of *s* | (2) |\n| | concatenated | |\n+--------------------+----------------------------------+------------+\n| "s[i]" | *i*th item of *s*, origin 0 | (3) |\n+--------------------+----------------------------------+------------+\n| "s[i:j]" | slice of *s* from *i* to *j* | (3)(4) |\n+--------------------+----------------------------------+------------+\n| "s[i:j:k]" | slice of *s* from *i* to *j* | (3)(5) |\n| | with step *k* | |\n+--------------------+----------------------------------+------------+\n| "len(s)" | length of *s* | |\n+--------------------+----------------------------------+------------+\n| "min(s)" | smallest item of *s* | |\n+--------------------+----------------------------------+------------+\n| "max(s)" | largest item of *s* | |\n+--------------------+----------------------------------+------------+\n| "s.index(x)" | index of the first occurrence of | |\n| | *x* in *s* | |\n+--------------------+----------------------------------+------------+\n| "s.count(x)" | total number of occurrences of | |\n| | *x* in *s* | |\n+--------------------+----------------------------------+------------+\n\nSequence types also support comparisons. In particular, tuples and\nlists are compared lexicographically by comparing corresponding\nelements. This means that to compare equal, every element must compare\nequal and the two sequences must be of the same type and have the same\nlength. (For full details see *Comparisons* in the language\nreference.)\n\nNotes:\n\n1. When *s* is a string or Unicode string object the "in" and "not\n in" operations act like a substring test. In Python versions\n before 2.3, *x* had to be a string of length 1. In Python 2.3 and\n beyond, *x* may be a string of any length.\n\n2. Values of *n* less than "0" are treated as "0" (which yields an\n empty sequence of the same type as *s*). Note also that the copies\n are shallow; nested structures are not copied. This often haunts\n new Python programmers; consider:\n\n >>> lists = [[]] * 3\n >>> lists\n [[], [], []]\n >>> lists[0].append(3)\n >>> lists\n [[3], [3], [3]]\n\n What has happened is that "[[]]" is a one-element list containing\n an empty list, so all three elements of "[[]] * 3" are (pointers\n to) this single empty list. Modifying any of the elements of\n "lists" modifies this single list. You can create a list of\n different lists this way:\n\n >>> lists = [[] for i in range(3)]\n >>> lists[0].append(3)\n >>> lists[1].append(5)\n >>> lists[2].append(7)\n >>> lists\n [[3], [5], [7]]\n\n3. If *i* or *j* is negative, the index is relative to the end of\n the string: "len(s) + i" or "len(s) + j" is substituted. 
But note\n that "-0" is still "0".\n\n4. The slice of *s* from *i* to *j* is defined as the sequence of\n items with index *k* such that "i <= k < j". If *i* or *j* is\n greater than "len(s)", use "len(s)". If *i* is omitted or "None",\n use "0". If *j* is omitted or "None", use "len(s)". If *i* is\n greater than or equal to *j*, the slice is empty.\n\n5. The slice of *s* from *i* to *j* with step *k* is defined as the\n sequence of items with index "x = i + n*k" such that "0 <= n <\n (j-i)/k". In other words, the indices are "i", "i+k", "i+2*k",\n "i+3*k" and so on, stopping when *j* is reached (but never\n including *j*). If *i* or *j* is greater than "len(s)", use\n "len(s)". If *i* or *j* are omitted or "None", they become "end"\n values (which end depends on the sign of *k*). Note, *k* cannot be\n zero. If *k* is "None", it is treated like "1".\n\n6. **CPython implementation detail:** If *s* and *t* are both\n strings, some Python implementations such as CPython can usually\n perform an in-place optimization for assignments of the form "s = s\n + t" or "s += t". When applicable, this optimization makes\n quadratic run-time much less likely. This optimization is both\n version and implementation dependent. For performance sensitive\n code, it is preferable to use the "str.join()" method which assures\n consistent linear concatenation performance across versions and\n implementations.\n\n Changed in version 2.4: Formerly, string concatenation never\n occurred in-place.\n\n\nString Methods\n==============\n\nBelow are listed the string methods which both 8-bit strings and\nUnicode objects support. Some of them are also available on\n"bytearray" objects.\n\nIn addition, Python\'s strings support the sequence type methods\ndescribed in the *Sequence Types --- str, unicode, list, tuple,\nbytearray, buffer, xrange* section. To output formatted strings use\ntemplate strings or the "%" operator described in the *String\nFormatting Operations* section. Also, see the "re" module for string\nfunctions based on regular expressions.\n\nstr.capitalize()\n\n Return a copy of the string with its first character capitalized\n and the rest lowercased.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.center(width[, fillchar])\n\n Return centered in a string of length *width*. Padding is done\n using the specified *fillchar* (default is a space).\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.count(sub[, start[, end]])\n\n Return the number of non-overlapping occurrences of substring *sub*\n in the range [*start*, *end*]. Optional arguments *start* and\n *end* are interpreted as in slice notation.\n\nstr.decode([encoding[, errors]])\n\n Decodes the string using the codec registered for *encoding*.\n *encoding* defaults to the default string encoding. *errors* may\n be given to set a different error handling scheme. The default is\n "\'strict\'", meaning that encoding errors raise "UnicodeError".\n Other possible values are "\'ignore\'", "\'replace\'" and any other\n name registered via "codecs.register_error()", see section *Codec\n Base Classes*.\n\n New in version 2.2.\n\n Changed in version 2.3: Support for other error handling schemes\n added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.encode([encoding[, errors]])\n\n Return an encoded version of the string. Default encoding is the\n current default string encoding. *errors* may be given to set a\n different error handling scheme. 
The default for *errors* is\n "\'strict\'", meaning that encoding errors raise a "UnicodeError".\n Other possible values are "\'ignore\'", "\'replace\'",\n "\'xmlcharrefreplace\'", "\'backslashreplace\'" and any other name\n registered via "codecs.register_error()", see section *Codec Base\n Classes*. For a list of possible encodings, see section *Standard\n Encodings*.\n\n New in version 2.0.\n\n Changed in version 2.3: Support for "\'xmlcharrefreplace\'" and\n "\'backslashreplace\'" and other error handling schemes added.\n\n Changed in version 2.7: Support for keyword arguments added.\n\nstr.endswith(suffix[, start[, end]])\n\n Return "True" if the string ends with the specified *suffix*,\n otherwise return "False". *suffix* can also be a tuple of suffixes\n to look for. With optional *start*, test beginning at that\n position. With optional *end*, stop comparing at that position.\n\n Changed in version 2.5: Accept tuples as *suffix*.\n\nstr.expandtabs([tabsize])\n\n Return a copy of the string where all tab characters are replaced\n by one or more spaces, depending on the current column and the\n given tab size. Tab positions occur every *tabsize* characters\n (default is 8, giving tab positions at columns 0, 8, 16 and so on).\n To expand the string, the current column is set to zero and the\n string is examined character by character. If the character is a\n tab ("\\t"), one or more space characters are inserted in the result\n until the current column is equal to the next tab position. (The\n tab character itself is not copied.) If the character is a newline\n ("\\n") or return ("\\r"), it is copied and the current column is\n reset to zero. Any other character is copied unchanged and the\n current column is incremented by one regardless of how the\n character is represented when printed.\n\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs()\n \'01 012 0123 01234\'\n >>> \'01\\t012\\t0123\\t01234\'.expandtabs(4)\n \'01 012 0123 01234\'\n\nstr.find(sub[, start[, end]])\n\n Return the lowest index in the string where substring *sub* is\n found, such that *sub* is contained in the slice "s[start:end]".\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return "-1" if *sub* is not found.\n\n Note: The "find()" method should be used only if you need to know\n the position of *sub*. To check if *sub* is a substring or not,\n use the "in" operator:\n\n >>> \'Py\' in \'Python\'\n True\n\nstr.format(*args, **kwargs)\n\n Perform a string formatting operation. The string on which this\n method is called can contain literal text or replacement fields\n delimited by braces "{}". Each replacement field contains either\n the numeric index of a positional argument, or the name of a\n keyword argument. 
Returns a copy of the string where each\n replacement field is replaced with the string value of the\n corresponding argument.\n\n >>> "The sum of 1 + 2 is {0}".format(1+2)\n \'The sum of 1 + 2 is 3\'\n\n See *Format String Syntax* for a description of the various\n formatting options that can be specified in format strings.\n\n This method of string formatting is the new standard in Python 3,\n and should be preferred to the "%" formatting described in *String\n Formatting Operations* in new code.\n\n New in version 2.6.\n\nstr.index(sub[, start[, end]])\n\n Like "find()", but raise "ValueError" when the substring is not\n found.\n\nstr.isalnum()\n\n Return true if all characters in the string are alphanumeric and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isalpha()\n\n Return true if all characters in the string are alphabetic and\n there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isdigit()\n\n Return true if all characters in the string are digits and there is\n at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.islower()\n\n Return true if all cased characters [4] in the string are lowercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isspace()\n\n Return true if there are only whitespace characters in the string\n and there is at least one character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.istitle()\n\n Return true if the string is a titlecased string and there is at\n least one character, for example uppercase characters may only\n follow uncased characters and lowercase characters only cased ones.\n Return false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.isupper()\n\n Return true if all cased characters [4] in the string are uppercase\n and there is at least one cased character, false otherwise.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.join(iterable)\n\n Return a string which is the concatenation of the strings in the\n *iterable* *iterable*. The separator between elements is the\n string providing this method.\n\nstr.ljust(width[, fillchar])\n\n Return the string left justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to "len(s)".\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.lower()\n\n Return a copy of the string with all the cased characters [4]\n converted to lowercase.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.lstrip([chars])\n\n Return a copy of the string with leading characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or "None", the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a prefix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.lstrip()\n \'spacious \'\n >>> \'www.example.com\'.lstrip(\'cmowz.\')\n \'example.com\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.partition(sep)\n\n Split the string at the first occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. 
If the separator is not\n found, return a 3-tuple containing the string itself, followed by\n two empty strings.\n\n New in version 2.5.\n\nstr.replace(old, new[, count])\n\n Return a copy of the string with all occurrences of substring *old*\n replaced by *new*. If the optional argument *count* is given, only\n the first *count* occurrences are replaced.\n\nstr.rfind(sub[, start[, end]])\n\n Return the highest index in the string where substring *sub* is\n found, such that *sub* is contained within "s[start:end]".\n Optional arguments *start* and *end* are interpreted as in slice\n notation. Return "-1" on failure.\n\nstr.rindex(sub[, start[, end]])\n\n Like "rfind()" but raises "ValueError" when the substring *sub* is\n not found.\n\nstr.rjust(width[, fillchar])\n\n Return the string right justified in a string of length *width*.\n Padding is done using the specified *fillchar* (default is a\n space). The original string is returned if *width* is less than or\n equal to "len(s)".\n\n Changed in version 2.4: Support for the *fillchar* argument.\n\nstr.rpartition(sep)\n\n Split the string at the last occurrence of *sep*, and return a\n 3-tuple containing the part before the separator, the separator\n itself, and the part after the separator. If the separator is not\n found, return a 3-tuple containing two empty strings, followed by\n the string itself.\n\n New in version 2.5.\n\nstr.rsplit([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit* splits\n are done, the *rightmost* ones. If *sep* is not specified or\n "None", any whitespace string is a separator. Except for splitting\n from the right, "rsplit()" behaves like "split()" which is\n described in detail below.\n\n New in version 2.4.\n\nstr.rstrip([chars])\n\n Return a copy of the string with trailing characters removed. The\n *chars* argument is a string specifying the set of characters to be\n removed. If omitted or "None", the *chars* argument defaults to\n removing whitespace. The *chars* argument is not a suffix; rather,\n all combinations of its values are stripped:\n\n >>> \' spacious \'.rstrip()\n \' spacious\'\n >>> \'mississippi\'.rstrip(\'ipz\')\n \'mississ\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.split([sep[, maxsplit]])\n\n Return a list of the words in the string, using *sep* as the\n delimiter string. If *maxsplit* is given, at most *maxsplit*\n splits are done (thus, the list will have at most "maxsplit+1"\n elements). If *maxsplit* is not specified or "-1", then there is\n no limit on the number of splits (all possible splits are made).\n\n If *sep* is given, consecutive delimiters are not grouped together\n and are deemed to delimit empty strings (for example,\n "\'1,,2\'.split(\',\')" returns "[\'1\', \'\', \'2\']"). The *sep* argument\n may consist of multiple characters (for example,\n "\'1<>2<>3\'.split(\'<>\')" returns "[\'1\', \'2\', \'3\']"). Splitting an\n empty string with a specified separator returns "[\'\']".\n\n If *sep* is not specified or is "None", a different splitting\n algorithm is applied: runs of consecutive whitespace are regarded\n as a single separator, and the result will contain no empty strings\n at the start or end if the string has leading or trailing\n whitespace. 
Consequently, splitting an empty string or a string\n consisting of just whitespace with a "None" separator returns "[]".\n\n For example, "\' 1 2 3 \'.split()" returns "[\'1\', \'2\', \'3\']", and\n "\' 1 2 3 \'.split(None, 1)" returns "[\'1\', \'2 3 \']".\n\nstr.splitlines([keepends])\n\n Return a list of the lines in the string, breaking at line\n boundaries. This method uses the *universal newlines* approach to\n splitting lines. Line breaks are not included in the resulting list\n unless *keepends* is given and true.\n\n For example, "\'ab c\\n\\nde fg\\rkl\\r\\n\'.splitlines()" returns "[\'ab\n c\', \'\', \'de fg\', \'kl\']", while the same call with\n "splitlines(True)" returns "[\'ab c\\n\', \'\\n\', \'de fg\\r\', \'kl\\r\\n\']".\n\n Unlike "split()" when a delimiter string *sep* is given, this\n method returns an empty list for the empty string, and a terminal\n line break does not result in an extra line.\n\nstr.startswith(prefix[, start[, end]])\n\n Return "True" if string starts with the *prefix*, otherwise return\n "False". *prefix* can also be a tuple of prefixes to look for.\n With optional *start*, test string beginning at that position.\n With optional *end*, stop comparing string at that position.\n\n Changed in version 2.5: Accept tuples as *prefix*.\n\nstr.strip([chars])\n\n Return a copy of the string with the leading and trailing\n characters removed. The *chars* argument is a string specifying the\n set of characters to be removed. If omitted or "None", the *chars*\n argument defaults to removing whitespace. The *chars* argument is\n not a prefix or suffix; rather, all combinations of its values are\n stripped:\n\n >>> \' spacious \'.strip()\n \'spacious\'\n >>> \'www.example.com\'.strip(\'cmowz.\')\n \'example\'\n\n Changed in version 2.2.2: Support for the *chars* argument.\n\nstr.swapcase()\n\n Return a copy of the string with uppercase characters converted to\n lowercase and vice versa.\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.title()\n\n Return a titlecased version of the string where words start with an\n uppercase character and the remaining characters are lowercase.\n\n The algorithm uses a simple language-independent definition of a\n word as groups of consecutive letters. The definition works in\n many contexts but it means that apostrophes in contractions and\n possessives form word boundaries, which may not be the desired\n result:\n\n >>> "they\'re bill\'s friends from the UK".title()\n "They\'Re Bill\'S Friends From The Uk"\n\n A workaround for apostrophes can be constructed using regular\n expressions:\n\n >>> import re\n >>> def titlecase(s):\n ... return re.sub(r"[A-Za-z]+(\'[A-Za-z]+)?",\n ... lambda mo: mo.group(0)[0].upper() +\n ... mo.group(0)[1:].lower(),\n ... s)\n ...\n >>> titlecase("they\'re bill\'s friends.")\n "They\'re Bill\'s Friends."\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.translate(table[, deletechars])\n\n Return a copy of the string where all characters occurring in the\n optional argument *deletechars* are removed, and the remaining\n characters have been mapped through the given translation table,\n which must be a string of length 256.\n\n You can use the "maketrans()" helper function in the "string"\n module to create a translation table. 
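For example, a short sketch combining "string.maketrans()" with "translate()" (hypothetical data):

   >>> from string import maketrans
   >>> table = maketrans('abc', 'xyz')      # a 256-character translation table
   >>> 'abc-abc'.translate(table)
   'xyz-xyz'
   >>> 'abc-abc'.translate(table, 'b')      # 'b' is deleted before the mapping is applied
   'xz-xz'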
For string objects, set the\n *table* argument to "None" for translations that only delete\n characters:\n\n >>> \'read this short text\'.translate(None, \'aeiou\')\n \'rd ths shrt txt\'\n\n New in version 2.6: Support for a "None" *table* argument.\n\n For Unicode objects, the "translate()" method does not accept the\n optional *deletechars* argument. Instead, it returns a copy of the\n *s* where all characters have been mapped through the given\n translation table which must be a mapping of Unicode ordinals to\n Unicode ordinals, Unicode strings or "None". Unmapped characters\n are left untouched. Characters mapped to "None" are deleted. Note,\n a more flexible approach is to create a custom character mapping\n codec using the "codecs" module (see "encodings.cp1251" for an\n example).\n\nstr.upper()\n\n Return a copy of the string with all the cased characters [4]\n converted to uppercase. Note that "str.upper().isupper()" might be\n "False" if "s" contains uncased characters or if the Unicode\n category of the resulting character(s) is not "Lu" (Letter,\n uppercase), but e.g. "Lt" (Letter, titlecase).\n\n For 8-bit strings, this method is locale-dependent.\n\nstr.zfill(width)\n\n Return the numeric string left filled with zeros in a string of\n length *width*. A sign prefix is handled correctly. The original\n string is returned if *width* is less than or equal to "len(s)".\n\n New in version 2.2.2.\n\nThe following methods are present only on unicode objects:\n\nunicode.isnumeric()\n\n Return "True" if there are only numeric characters in S, "False"\n otherwise. Numeric characters include digit characters, and all\n characters that have the Unicode numeric value property, e.g.\n U+2155, VULGAR FRACTION ONE FIFTH.\n\nunicode.isdecimal()\n\n Return "True" if there are only decimal characters in S, "False"\n otherwise. Decimal characters include digit characters, and all\n characters that can be used to form decimal-radix numbers, e.g.\n U+0660, ARABIC-INDIC DIGIT ZERO.\n\n\nString Formatting Operations\n============================\n\nString and Unicode objects have one unique built-in operation: the "%"\noperator (modulo). This is also known as the string *formatting* or\n*interpolation* operator. Given "format % values" (where *format* is\na string or Unicode object), "%" conversion specifications in *format*\nare replaced with zero or more elements of *values*. The effect is\nsimilar to the using "sprintf()" in the C language. If *format* is a\nUnicode object, or if any of the objects being converted using the\n"%s" conversion are Unicode objects, the result will also be a Unicode\nobject.\n\nIf *format* requires a single argument, *values* may be a single non-\ntuple object. [5] Otherwise, *values* must be a tuple with exactly\nthe number of items specified by the format string, or a single\nmapping object (for example, a dictionary).\n\nA conversion specifier contains two or more characters and has the\nfollowing components, which must occur in this order:\n\n1. The "\'%\'" character, which marks the start of the specifier.\n\n2. Mapping key (optional), consisting of a parenthesised sequence\n of characters (for example, "(somename)").\n\n3. Conversion flags (optional), which affect the result of some\n conversion types.\n\n4. Minimum field width (optional). If specified as an "\'*\'"\n (asterisk), the actual width is read from the next element of the\n tuple in *values*, and the object to convert comes after the\n minimum field width and optional precision.\n\n5. 
Precision (optional), given as a "\'.\'" (dot) followed by the\n precision. If specified as "\'*\'" (an asterisk), the actual width\n is read from the next element of the tuple in *values*, and the\n value to convert comes after the precision.\n\n6. Length modifier (optional).\n\n7. Conversion type.\n\nWhen the right argument is a dictionary (or other mapping type), then\nthe formats in the string *must* include a parenthesised mapping key\ninto that dictionary inserted immediately after the "\'%\'" character.\nThe mapping key selects the value to be formatted from the mapping.\nFor example:\n\n>>> print \'%(language)s has %(number)03d quote types.\' % \\\n... {"language": "Python", "number": 2}\nPython has 002 quote types.\n\nIn this case no "*" specifiers may occur in a format (since they\nrequire a sequential parameter list).\n\nThe conversion flag characters are:\n\n+-----------+-----------------------------------------------------------------------+\n| Flag | Meaning |\n+===========+=======================================================================+\n| "\'#\'" | The value conversion will use the "alternate form" (where defined |\n| | below). |\n+-----------+-----------------------------------------------------------------------+\n| "\'0\'" | The conversion will be zero padded for numeric values. |\n+-----------+-----------------------------------------------------------------------+\n| "\'-\'" | The converted value is left adjusted (overrides the "\'0\'" conversion |\n| | if both are given). |\n+-----------+-----------------------------------------------------------------------+\n| "\' \'" | (a space) A blank should be left before a positive number (or empty |\n| | string) produced by a signed conversion. |\n+-----------+-----------------------------------------------------------------------+\n| "\'+\'" | A sign character ("\'+\'" or "\'-\'") will precede the conversion |\n| | (overrides a "space" flag). |\n+-----------+-----------------------------------------------------------------------+\n\nA length modifier ("h", "l", or "L") may be present, but is ignored as\nit is not necessary for Python -- so e.g. "%ld" is identical to "%d".\n\nThe conversion types are:\n\n+--------------+-------------------------------------------------------+---------+\n| Conversion | Meaning | Notes |\n+==============+=======================================================+=========+\n| "\'d\'" | Signed integer decimal. | |\n+--------------+-------------------------------------------------------+---------+\n| "\'i\'" | Signed integer decimal. | |\n+--------------+-------------------------------------------------------+---------+\n| "\'o\'" | Signed octal value. | (1) |\n+--------------+-------------------------------------------------------+---------+\n| "\'u\'" | Obsolete type -- it is identical to "\'d\'". | (7) |\n+--------------+-------------------------------------------------------+---------+\n| "\'x\'" | Signed hexadecimal (lowercase). | (2) |\n+--------------+-------------------------------------------------------+---------+\n| "\'X\'" | Signed hexadecimal (uppercase). | (2) |\n+--------------+-------------------------------------------------------+---------+\n| "\'e\'" | Floating point exponential format (lowercase). | (3) |\n+--------------+-------------------------------------------------------+---------+\n| "\'E\'" | Floating point exponential format (uppercase). 
| (3) |\n+--------------+-------------------------------------------------------+---------+\n| "\'f\'" | Floating point decimal format. | (3) |\n+--------------+-------------------------------------------------------+---------+\n| "\'F\'" | Floating point decimal format. | (3) |\n+--------------+-------------------------------------------------------+---------+\n| "\'g\'" | Floating point format. Uses lowercase exponential | (4) |\n| | format if exponent is less than -4 or not less than | |\n| | precision, decimal format otherwise. | |\n+--------------+-------------------------------------------------------+---------+\n| "\'G\'" | Floating point format. Uses uppercase exponential | (4) |\n| | format if exponent is less than -4 or not less than | |\n| | precision, decimal format otherwise. | |\n+--------------+-------------------------------------------------------+---------+\n| "\'c\'" | Single character (accepts integer or single character | |\n| | string). | |\n+--------------+-------------------------------------------------------+---------+\n| "\'r\'" | String (converts any Python object using *repr()*). | (5) |\n+--------------+-------------------------------------------------------+---------+\n| "\'s\'" | String (converts any Python object using "str()"). | (6) |\n+--------------+-------------------------------------------------------+---------+\n| "\'%\'" | No argument is converted, results in a "\'%\'" | |\n| | character in the result. | |\n+--------------+-------------------------------------------------------+---------+\n\nNotes:\n\n1. The alternate form causes a leading zero ("\'0\'") to be inserted\n between left-hand padding and the formatting of the number if the\n leading character of the result is not already a zero.\n\n2. The alternate form causes a leading "\'0x\'" or "\'0X\'" (depending\n on whether the "\'x\'" or "\'X\'" format was used) to be inserted\n between left-hand padding and the formatting of the number if the\n leading character of the result is not already a zero.\n\n3. The alternate form causes the result to always contain a decimal\n point, even if no digits follow it.\n\n The precision determines the number of digits after the decimal\n point and defaults to 6.\n\n4. The alternate form causes the result to always contain a decimal\n point, and trailing zeroes are not removed as they would otherwise\n be.\n\n The precision determines the number of significant digits before\n and after the decimal point and defaults to 6.\n\n5. The "%r" conversion was added in Python 2.0.\n\n The precision determines the maximal number of characters used.\n\n6. If the object or format provided is a "unicode" string, the\n resulting string will also be "unicode".\n\n The precision determines the maximal number of characters used.\n\n7. See **PEP 237**.\n\nSince Python strings have an explicit length, "%s" conversions do not\nassume that "\'\\0\'" is the end of the string.\n\nChanged in version 2.7: "%f" conversions for numbers whose absolute\nvalue is over 1e50 are no longer replaced by "%g" conversions.\n\nAdditional string operations are defined in standard modules "string"\nand "re".\n\n\nXRange Type\n===========\n\nThe "xrange" type is an immutable sequence which is commonly used for\nlooping. The advantage of the "xrange" type is that an "xrange"\nobject will always take the same amount of memory, no matter the size\nof the range it represents. 
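For example, a rough sketch of that memory behaviour (object sizes are an implementation detail and may vary by platform):

   >>> import sys
   >>> r = xrange(10 ** 8)          # no hundred-million element list is built
   >>> len(r), r[0]
   (100000000, 0)
   >>> sys.getsizeof(r) == sys.getsizeof(xrange(10))    # constant-size object
   True
   >>> 5 in r                       # supported, but scans the range linearly
   True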
There are no consistent performance\nadvantages.\n\nXRange objects have very little behavior: they only support indexing,\niteration, and the "len()" function.\n\n\nMutable Sequence Types\n======================\n\nList and "bytearray" objects support additional operations that allow\nin-place modification of the object. Other mutable sequence types\n(when added to the language) should also support these operations.\nStrings and tuples are immutable sequence types: such objects cannot\nbe modified once created. The following operations are defined on\nmutable sequence types (where *x* is an arbitrary object):\n\n+--------------------------------+----------------------------------+-----------------------+\n| Operation | Result | Notes |\n+================================+==================================+=======================+\n| "s[i] = x" | item *i* of *s* is replaced by | |\n| | *x* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s[i:j] = t" | slice of *s* from *i* to *j* is | |\n| | replaced by the contents of the | |\n| | iterable *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "del s[i:j]" | same as "s[i:j] = []" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s[i:j:k] = t" | the elements of "s[i:j:k]" are | (1) |\n| | replaced by those of *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "del s[i:j:k]" | removes the elements of | |\n| | "s[i:j:k]" from the list | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.append(x)" | same as "s[len(s):len(s)] = [x]" | (2) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.extend(x)" | same as "s[len(s):len(s)] = x" | (3) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.count(x)" | return number of *i*\'s for which | |\n| | "s[i] == x" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.index(x[, i[, j]])" | return smallest *k* such that | (4) |\n| | "s[k] == x" and "i <= k < j" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.insert(i, x)" | same as "s[i:i] = [x]" | (5) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.pop([i])" | same as "x = s[i]; del s[i]; | (6) |\n| | return x" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.remove(x)" | same as "del s[s.index(x)]" | (4) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.reverse()" | reverses the items of *s* in | (7) |\n| | place | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.sort([cmp[, key[, | sort the items of *s* in place | (7)(8)(9)(10) |\n| reverse]]])" | | |\n+--------------------------------+----------------------------------+-----------------------+\n\nNotes:\n\n1. *t* must have the same length as the slice it is replacing.\n\n2. The C implementation of Python has historically accepted\n multiple parameters and implicitly joined them into a tuple; this\n no longer works in Python 2.0. Use of this misfeature has been\n deprecated since Python 1.4.\n\n3. 
*x* can be any iterable object.\n\n4. Raises "ValueError" when *x* is not found in *s*. When a\n negative index is passed as the second or third parameter to the\n "index()" method, the list length is added, as for slice indices.\n If it is still negative, it is truncated to zero, as for slice\n indices.\n\n Changed in version 2.3: Previously, "index()" didn\'t have arguments\n for specifying start and stop positions.\n\n5. When a negative index is passed as the first parameter to the\n "insert()" method, the list length is added, as for slice indices.\n If it is still negative, it is truncated to zero, as for slice\n indices.\n\n Changed in version 2.3: Previously, all negative indices were\n truncated to zero.\n\n6. The "pop()" method\'s optional argument *i* defaults to "-1", so\n that by default the last item is removed and returned.\n\n7. The "sort()" and "reverse()" methods modify the list in place\n for economy of space when sorting or reversing a large list. To\n remind you that they operate by side effect, they don\'t return the\n sorted or reversed list.\n\n8. The "sort()" method takes optional arguments for controlling the\n comparisons.\n\n *cmp* specifies a custom comparison function of two arguments (list\n items) which should return a negative, zero or positive number\n depending on whether the first argument is considered smaller than,\n equal to, or larger than the second argument: "cmp=lambda x,y:\n cmp(x.lower(), y.lower())". The default value is "None".\n\n *key* specifies a function of one argument that is used to extract\n a comparison key from each list element: "key=str.lower". The\n default value is "None".\n\n *reverse* is a boolean value. If set to "True", then the list\n elements are sorted as if each comparison were reversed.\n\n In general, the *key* and *reverse* conversion processes are much\n faster than specifying an equivalent *cmp* function. This is\n because *cmp* is called multiple times for each list element while\n *key* and *reverse* touch each element only once. Use\n "functools.cmp_to_key()" to convert an old-style *cmp* function to\n a *key* function.\n\n Changed in version 2.3: Support for "None" as an equivalent to\n omitting *cmp* was added.\n\n Changed in version 2.4: Support for *key* and *reverse* was added.\n\n9. Starting with Python 2.3, the "sort()" method is guaranteed to\n be stable. A sort is stable if it guarantees not to change the\n relative order of elements that compare equal --- this is helpful\n for sorting in multiple passes (for example, sort by department,\n then by salary grade).\n\n10. **CPython implementation detail:** While a list is being\n sorted, the effect of attempting to mutate, or even inspect, the\n list is undefined. The C implementation of Python 2.3 and newer\n makes the list appear empty for the duration, and raises\n "ValueError" if it can detect that the list has been mutated\n during a sort.\n', + 'typesseq-mutable': u'\nMutable Sequence Types\n**********************\n\nList and "bytearray" objects support additional operations that allow\nin-place modification of the object. Other mutable sequence types\n(when added to the language) should also support these operations.\nStrings and tuples are immutable sequence types: such objects cannot\nbe modified once created. 
The following operations are defined on\nmutable sequence types (where *x* is an arbitrary object):\n\n+--------------------------------+----------------------------------+-----------------------+\n| Operation | Result | Notes |\n+================================+==================================+=======================+\n| "s[i] = x" | item *i* of *s* is replaced by | |\n| | *x* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s[i:j] = t" | slice of *s* from *i* to *j* is | |\n| | replaced by the contents of the | |\n| | iterable *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "del s[i:j]" | same as "s[i:j] = []" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s[i:j:k] = t" | the elements of "s[i:j:k]" are | (1) |\n| | replaced by those of *t* | |\n+--------------------------------+----------------------------------+-----------------------+\n| "del s[i:j:k]" | removes the elements of | |\n| | "s[i:j:k]" from the list | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.append(x)" | same as "s[len(s):len(s)] = [x]" | (2) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.extend(x)" | same as "s[len(s):len(s)] = x" | (3) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.count(x)" | return number of *i*\'s for which | |\n| | "s[i] == x" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.index(x[, i[, j]])" | return smallest *k* such that | (4) |\n| | "s[k] == x" and "i <= k < j" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.insert(i, x)" | same as "s[i:i] = [x]" | (5) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.pop([i])" | same as "x = s[i]; del s[i]; | (6) |\n| | return x" | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.remove(x)" | same as "del s[s.index(x)]" | (4) |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.reverse()" | reverses the items of *s* in | (7) |\n| | place | |\n+--------------------------------+----------------------------------+-----------------------+\n| "s.sort([cmp[, key[, | sort the items of *s* in place | (7)(8)(9)(10) |\n| reverse]]])" | | |\n+--------------------------------+----------------------------------+-----------------------+\n\nNotes:\n\n1. *t* must have the same length as the slice it is replacing.\n\n2. The C implementation of Python has historically accepted\n multiple parameters and implicitly joined them into a tuple; this\n no longer works in Python 2.0. Use of this misfeature has been\n deprecated since Python 1.4.\n\n3. *x* can be any iterable object.\n\n4. Raises "ValueError" when *x* is not found in *s*. When a\n negative index is passed as the second or third parameter to the\n "index()" method, the list length is added, as for slice indices.\n If it is still negative, it is truncated to zero, as for slice\n indices.\n\n Changed in version 2.3: Previously, "index()" didn\'t have arguments\n for specifying start and stop positions.\n\n5. 
When a negative index is passed as the first parameter to the\n "insert()" method, the list length is added, as for slice indices.\n If it is still negative, it is truncated to zero, as for slice\n indices.\n\n Changed in version 2.3: Previously, all negative indices were\n truncated to zero.\n\n6. The "pop()" method\'s optional argument *i* defaults to "-1", so\n that by default the last item is removed and returned.\n\n7. The "sort()" and "reverse()" methods modify the list in place\n for economy of space when sorting or reversing a large list. To\n remind you that they operate by side effect, they don\'t return the\n sorted or reversed list.\n\n8. The "sort()" method takes optional arguments for controlling the\n comparisons.\n\n *cmp* specifies a custom comparison function of two arguments (list\n items) which should return a negative, zero or positive number\n depending on whether the first argument is considered smaller than,\n equal to, or larger than the second argument: "cmp=lambda x,y:\n cmp(x.lower(), y.lower())". The default value is "None".\n\n *key* specifies a function of one argument that is used to extract\n a comparison key from each list element: "key=str.lower". The\n default value is "None".\n\n *reverse* is a boolean value. If set to "True", then the list\n elements are sorted as if each comparison were reversed.\n\n In general, the *key* and *reverse* conversion processes are much\n faster than specifying an equivalent *cmp* function. This is\n because *cmp* is called multiple times for each list element while\n *key* and *reverse* touch each element only once. Use\n "functools.cmp_to_key()" to convert an old-style *cmp* function to\n a *key* function.\n\n Changed in version 2.3: Support for "None" as an equivalent to\n omitting *cmp* was added.\n\n Changed in version 2.4: Support for *key* and *reverse* was added.\n\n9. Starting with Python 2.3, the "sort()" method is guaranteed to\n be stable. A sort is stable if it guarantees not to change the\n relative order of elements that compare equal --- this is helpful\n for sorting in multiple passes (for example, sort by department,\n then by salary grade).\n\n10. **CPython implementation detail:** While a list is being\n sorted, the effect of attempting to mutate, or even inspect, the\n list is undefined. The C implementation of Python 2.3 and newer\n makes the list appear empty for the duration, and raises\n "ValueError" if it can detect that the list has been mutated\n during a sort.\n', + 'unary': u'\nUnary arithmetic and bitwise operations\n***************************************\n\nAll unary arithmetic and bitwise operations have the same priority:\n\n u_expr ::= power | "-" u_expr | "+" u_expr | "~" u_expr\n\nThe unary "-" (minus) operator yields the negation of its numeric\nargument.\n\nThe unary "+" (plus) operator yields its numeric argument unchanged.\n\nThe unary "~" (invert) operator yields the bitwise inversion of its\nplain or long integer argument. The bitwise inversion of "x" is\ndefined as "-(x+1)". 
It only applies to integral numbers.\n\nIn all three cases, if the argument does not have the proper type, a\n"TypeError" exception is raised.\n', + 'while': u'\nThe "while" statement\n*********************\n\nThe "while" statement is used for repeated execution as long as an\nexpression is true:\n\n while_stmt ::= "while" expression ":" suite\n ["else" ":" suite]\n\nThis repeatedly tests the expression and, if it is true, executes the\nfirst suite; if the expression is false (which may be the first time\nit is tested) the suite of the "else" clause, if present, is executed\nand the loop terminates.\n\nA "break" statement executed in the first suite terminates the loop\nwithout executing the "else" clause\'s suite. A "continue" statement\nexecuted in the first suite skips the rest of the suite and goes back\nto testing the expression.\n', + 'with': u'\nThe "with" statement\n********************\n\nNew in version 2.5.\n\nThe "with" statement is used to wrap the execution of a block with\nmethods defined by a context manager (see section *With Statement\nContext Managers*). This allows common "try"..."except"..."finally"\nusage patterns to be encapsulated for convenient reuse.\n\n with_stmt ::= "with" with_item ("," with_item)* ":" suite\n with_item ::= expression ["as" target]\n\nThe execution of the "with" statement with one "item" proceeds as\nfollows:\n\n1. The context expression (the expression given in the "with_item")\n is evaluated to obtain a context manager.\n\n2. The context manager\'s "__exit__()" is loaded for later use.\n\n3. The context manager\'s "__enter__()" method is invoked.\n\n4. If a target was included in the "with" statement, the return\n value from "__enter__()" is assigned to it.\n\n Note: The "with" statement guarantees that if the "__enter__()"\n method returns without an error, then "__exit__()" will always be\n called. Thus, if an error occurs during the assignment to the\n target list, it will be treated the same as an error occurring\n within the suite would be. See step 6 below.\n\n5. The suite is executed.\n\n6. The context manager\'s "__exit__()" method is invoked. If an\n exception caused the suite to be exited, its type, value, and\n traceback are passed as arguments to "__exit__()". Otherwise, three\n "None" arguments are supplied.\n\n If the suite was exited due to an exception, and the return value\n from the "__exit__()" method was false, the exception is reraised.\n If the return value was true, the exception is suppressed, and\n execution continues with the statement following the "with"\n statement.\n\n If the suite was exited for any reason other than an exception, the\n return value from "__exit__()" is ignored, and execution proceeds\n at the normal location for the kind of exit that was taken.\n\nWith more than one item, the context managers are processed as if\nmultiple "with" statements were nested:\n\n with A() as a, B() as b:\n suite\n\nis equivalent to\n\n with A() as a:\n with B() as b:\n suite\n\nNote: In Python 2.5, the "with" statement is only allowed when the\n "with_statement" feature has been enabled. 
It is always enabled in\n Python 2.6.\n\nChanged in version 2.7: Support for multiple context expressions.\n\nSee also: **PEP 0343** - The "with" statement\n\n The specification, background, and examples for the Python "with"\n statement.\n', + 'yield': u'\nThe "yield" statement\n*********************\n\n yield_stmt ::= yield_expression\n\nThe "yield" statement is only used when defining a generator function,\nand is only used in the body of the generator function. Using a\n"yield" statement in a function definition is sufficient to cause that\ndefinition to create a generator function instead of a normal\nfunction.\n\nWhen a generator function is called, it returns an iterator known as a\ngenerator iterator, or more commonly, a generator. The body of the\ngenerator function is executed by calling the generator\'s "next()"\nmethod repeatedly until it raises an exception.\n\nWhen a "yield" statement is executed, the state of the generator is\nfrozen and the value of "expression_list" is returned to "next()"\'s\ncaller. By "frozen" we mean that all local state is retained,\nincluding the current bindings of local variables, the instruction\npointer, and the internal evaluation stack: enough information is\nsaved so that the next time "next()" is invoked, the function can\nproceed exactly as if the "yield" statement were just another external\ncall.\n\nAs of Python version 2.5, the "yield" statement is now allowed in the\n"try" clause of a "try" ... "finally" construct. If the generator is\nnot resumed before it is finalized (by reaching a zero reference count\nor by being garbage collected), the generator-iterator\'s "close()"\nmethod will be called, allowing any pending "finally" clauses to\nexecute.\n\nFor full details of "yield" semantics, refer to the *Yield\nexpressions* section.\n\nNote: In Python 2.2, the "yield" statement was only allowed when the\n "generators" feature has been enabled. This "__future__" import\n statement was used to enable the feature:\n\n from __future__ import generators\n\nSee also: **PEP 0255** - Simple Generators\n\n The proposal for adding generators and the "yield" statement to\n Python.\n\n **PEP 0342** - Coroutines via Enhanced Generators\n The proposal that, among other generator enhancements, proposed\n allowing "yield" to appear inside a "try" ... 
"finally" block.\n'} -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 01:33:19 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:33:19 +0000 Subject: [Python-checkins] =?utf-8?q?release=3A_import_readline_otherwise_?= =?utf-8?q?it_doesn=27t_get_initialized_for_input=28=29?= Message-ID: <20141126003310.69803.78502@psf.io> https://hg.python.org/release/rev/070f43581846 changeset: 88:070f43581846 user: Benjamin Peterson date: Tue Nov 25 18:33:01 2014 -0600 summary: import readline otherwise it doesn't get initialized for input() files: release.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/release.py b/release.py --- a/release.py +++ b/release.py @@ -11,6 +11,7 @@ import hashlib import optparse import re +import readline import subprocess import shutil -- Repository URL: https://hg.python.org/release From python-checkins at python.org Wed Nov 26 01:44:10 2014 From: python-checkins at python.org (guido.van.rossum) Date: Wed, 26 Nov 2014 00:44:10 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Move_PEP_458_figures_out_of_s?= =?utf-8?q?ubdirectory=2E?= Message-ID: <20141126004403.69781.78689@psf.io> https://hg.python.org/peps/rev/43b268607d6e changeset: 5617:43b268607d6e user: Guido van Rossum date: Tue Nov 25 16:43:59 2014 -0800 summary: Move PEP 458 figures out of subdirectory. files: pep-0458/figure1.png | 0 pep-0458/figure2.png | 0 pep-0458/figure3.png | 0 pep-0458.txt | 6 +++--- 4 files changed, 3 insertions(+), 3 deletions(-) diff --git a/pep-0458/figure1.png b/pep-0458-1.png rename from pep-0458/figure1.png rename to pep-0458-1.png diff --git a/pep-0458/figure2.png b/pep-0458-2.png rename from pep-0458/figure2.png rename to pep-0458-2.png diff --git a/pep-0458/figure3.png b/pep-0458-3.png rename from pep-0458/figure3.png rename to pep-0458-3.png diff --git a/pep-0458.txt b/pep-0458.txt --- a/pep-0458.txt +++ b/pep-0458.txt @@ -300,7 +300,7 @@ responsibilities without exception. Figure 1 provides a table of the roles used in TUF. -.. image:: pep-0458/figure1.png +.. image:: pep-0458-1.png Figure 1: An overview of the TUF roles. @@ -320,7 +320,7 @@ trusted to sign for files available on PyPI. The next two sections cover the details of signing repository files and the types of keys used for each role. -.. image:: pep-0458/figure2.png +.. image:: pep-0458-2.png Figure 2: An overview of the role metadata available on PyPI. @@ -957,7 +957,7 @@ packages in the minimum security model, but not in the maximum model without also compromising a developer's key. -.. image:: pep-0458/figure3.png +.. image:: pep-0458-3.png Figure 3: An overview of the metadata layout in the maximum security model. 
The maximum security model supports continuous delivery and survivable key -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 01:44:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 00:44:23 +0000 Subject: [Python-checkins] =?utf-8?q?release=3A_adapt_for_dl-files?= Message-ID: <20141126004420.84301.69538@psf.io> https://hg.python.org/release/rev/1caf757e09fe changeset: 89:1caf757e09fe user: Benjamin Peterson date: Tue Nov 25 18:44:11 2014 -0600 summary: adapt for dl-files files: add-to-pydotorg.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/add-to-pydotorg.py b/add-to-pydotorg.py --- a/add-to-pydotorg.py +++ b/add-to-pydotorg.py @@ -41,7 +41,7 @@ sys.exit() base_url = 'https://www.python.org/api/v1/' -ftp_root = '/data/ftp.python.org/pub/python/' +ftp_root = '/srv/www.python.org/ftp/python/' download_root = 'https://www.python.org/ftp/python/' headers = {'Authorization': 'ApiKey %s' % auth_info, 'Content-Type': 'application/json'} -- Repository URL: https://hg.python.org/release From python-checkins at python.org Wed Nov 26 02:15:56 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 01:15:56 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogYWRkIDIuNy4xMCBu?= =?utf-8?q?ews_section?= Message-ID: <20141126011551.116312.53450@psf.io> https://hg.python.org/cpython/rev/323f51ce8d86 changeset: 93596:323f51ce8d86 branch: 2.7 user: Benjamin Peterson date: Tue Nov 25 19:15:39 2014 -0600 summary: add 2.7.10 news section files: Misc/NEWS | 12 ++++++++++++ 1 files changed, 12 insertions(+), 0 deletions(-) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -2,6 +2,18 @@ Python News +++++++++++ +What's New in Python 2.7.10? +============================ + +*Release date: XXXX-XX-XX* + +Core and Builtins +----------------- + +Library +------- + + What's New in Python 2.7.9 release candidate 1? =============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 03:17:23 2014 From: python-checkins at python.org (guido.van.rossum) Date: Wed, 26 Nov 2014 02:17:23 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_No_empty_promises_in_the_abst?= =?utf-8?q?ract=2E_Extend_rationale=2E?= Message-ID: <20141126021716.116312.66001@psf.io> https://hg.python.org/peps/rev/d53cc8342ddd changeset: 5618:d53cc8342ddd user: Guido van Rossum date: Tue Nov 25 18:17:13 2014 -0800 summary: No empty promises in the abstract. Extend rationale. files: pep-0479.txt | 36 +++++++++++++++++++++++++++++------- 1 files changed, 29 insertions(+), 7 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -14,13 +14,10 @@ Abstract ======== -This PEP proposes a semantic change to ``StopIteration`` when raised -inside a generator. This would unify the behaviour of list -comprehensions and generator expressions, reducing surprises such as -the one that started this discussion [1]_. This is also the main -backwards incompatibility of the proposal -- any generator that -depends on raising ``StopIteration`` to terminate it will -have to be rewritten to either catch that exception or use a for-loop. +This PEP proposes a backwards incompatible change to generators: when +``StopIteration`` is raised inside a generator, it is replaced it with +``RuntimeError``. (More precisely, this happens when the exception is +about to bubble out of the generator's stack frame.) 
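To make the proposed semantics concrete, here is a small sketch (the helper and the data are made up for illustration, not taken from the PEP): a generator that lets an unguarded ``next()`` call escape currently ends the caller's iteration silently, whereas under the proposal the escaping ``StopIteration`` would surface as ``RuntimeError``::

    def skip_first(iterable):
        it = iter(iterable)
        next(it)              # unguarded: raises StopIteration on empty input
        while True:
            yield next(it)    # ...and again once the input is exhausted

    print(list(skip_first([1, 2, 3])))   # [2, 3] under current semantics
    print(list(skip_first([])))          # [] -- the failure is swallowed silently
    # With the proposed behaviour (e.g. after "from __future__ import
    # generator_stop" on Python 3.5), both escaping StopIteration instances
    # are turned into RuntimeError, so the generator must catch them and
    # return instead.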
Rationale @@ -32,6 +29,31 @@ cause a noisy and easily-debugged traceback. Currently, ``StopIteration`` can be absorbed by the generator construct. +The main goal of the proposal is to ease debugging in the situation +where an unguarded ``next()`` call (perhaps several stack frames deep) +raises ``StopIteration`` and causes the iteration controlled by the +generator to terminate silently. (When another exception is raised, a +traceback is printed pinpointing the cause of the problem.) + +The proposal also clears up the confusion about how to terminate a +generator: the proper way is ``return``, not ``raise StopIteration``. + +Finally, the proposal reduces the difference between list +comprehensions and generator expressions, preventing surprises such as +the one that started this discussion [1]_. Henceforth, the following +statements will produce the same result if either produces a result at +all:: + + a = list(F(x) for x in xs if P(x)) + a = [F(x) for x in xs if P(x)] + +With the current state of affairs, it is possible to write a function +``F(x)`` or a predicate ``P(x)`` that causes the first form to produce +a (truncated) result, while the second form raises an exception +(namely, ``StopIteration``). With the proposed change, both forms +will raise an exception at this point (albeit ``RuntimeError`` in the +first case and ``StopIteration`` in the second). + Background information ====================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 06:32:23 2014 From: python-checkins at python.org (guido.van.rossum) Date: Wed, 26 Nov 2014 05:32:23 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_transition_plan=2E?= Message-ID: <20141126053218.116310.85853@psf.io> https://hg.python.org/peps/rev/427e505d1237 changeset: 5619:427e505d1237 user: Guido van Rossum date: Tue Nov 25 21:32:14 2014 -0800 summary: Add transition plan. files: pep-0479.txt | 12 ++++++++++++ 1 files changed, 12 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -264,6 +264,18 @@ beyond that, all exceptions will propagate normally. +Transition plan +=============== + +- Python 3.5: Enable new semantics under ``__future__`` import; silent + deprecation warning if ``StopIteration`` bubbles out of a generator + not under ``__future__`` import. + +- Python 3.6: non-silent deprecation warning. + +- Python 3.7: enable new semantics everywhere. 
+ + Alternate proposals =================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 06:43:03 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 05:43:03 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_update_2=2E7=2E9_release_date?= =?utf-8?q?s?= Message-ID: <20141126054258.55107.86043@psf.io> https://hg.python.org/peps/rev/5e80f39d6a8f changeset: 5620:5e80f39d6a8f user: Benjamin Peterson date: Tue Nov 25 23:42:40 2014 -0600 summary: update 2.7.9 release dates files: pep-0373.txt | 4 ++-- 1 files changed, 2 insertions(+), 2 deletions(-) diff --git a/pep-0373.txt b/pep-0373.txt --- a/pep-0373.txt +++ b/pep-0373.txt @@ -71,8 +71,8 @@ Planned future release dates: -- 2.7.9rc1 2014-11-22 -- 2.7.9 2014-12-05 +- 2.7.9rc1 2014-11-26 +- 2.7.9 2014-12-10 - 2.7.10 June 2015 - beyond this date, releases as needed -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 07:06:17 2014 From: python-checkins at python.org (guido.van.rossum) Date: Wed, 26 Nov 2014 06:06:17 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Another_major_editing_pass=2E?= =?utf-8?q?_Move_=5F=5Ffuture=5F=5F_into_spec=2E_Add_section_about?= Message-ID: <20141126060616.116314.51977@psf.io> https://hg.python.org/peps/rev/574b60a51ebd changeset: 5621:574b60a51ebd user: Guido van Rossum date: Tue Nov 25 22:05:29 2014 -0800 summary: Another major editing pass. Move __future__ into spec. Add section about compatible code. files: pep-0479.txt | 75 +++++++++++++++++++++++++-------------- 1 files changed, 47 insertions(+), 28 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -14,10 +14,12 @@ Abstract ======== -This PEP proposes a backwards incompatible change to generators: when -``StopIteration`` is raised inside a generator, it is replaced it with -``RuntimeError``. (More precisely, this happens when the exception is -about to bubble out of the generator's stack frame.) +This PEP proposes a change to generators: when ``StopIteration`` is +raised inside a generator, it is replaced it with ``RuntimeError``. +(More precisely, this happens when the exception is about to bubble +out of the generator's stack frame.) Because the change is backwards +incompatible, the feature is initially introduced using a +``__future__`` statement. Rationale @@ -100,6 +102,17 @@ using a ``try/except`` around the ``yield``), it will be transformed into ``RuntimeError``. +During the transition phase, the new feature must be enabled +per-module using:: + + from __future__ import generator_stop + +Any generator function constructed under the influence of this +directive will have the ``REPLACE_STOPITERATION`` flag set on its code +object, and generators with the flag set will behave according to this +proposal. Once the feature becomes standard, the flag may be dropped; +code should not inspect generators for it. + Consequences for existing code ============================== @@ -116,28 +129,34 @@ yield from helper()" rather than just "helper()".""") There are also examples of generator expressions floating around that -rely on a StopIteration raised by the expression, the target or the -predicate (rather than by the __next__() call implied in the ``for`` +rely on a ``StopIteration`` raised by the expression, the target or the +predicate (rather than by the ``__next__()`` call implied in the ``for`` loop proper). 
-As this can break code, it is proposed to utilize the ``__future__`` -mechanism to introduce this in Python 3.5, finally making it standard -in Python 3.6 or 3.7. The proposed syntax is:: +Writing backwards and forwards compatible code +---------------------------------------------- - from __future__ import generator_stop +With the exception of hacks that raise ``StopIteration`` to exit a +generator expression, it is easy to write code that works equally well +under older Python versions as under the new semantics. -Any generator function constructed under the influence of this -directive will have the REPLACE_STOPITERATION flag set on its code -object, and generators with the flag set will behave according to this -proposal. Once the feature becomes standard, the flag may be dropped; -code should not inspect generators for it. +This is done by enclosing those places in the generator body where a +``StopIteration`` is expected (e.g. bare ``next()`` calls or in some +cases helper functions that are expected to raise ``StopIteration``) +in a ``try/except`` construct that returns when ``StopIteration`` +returns. The ``try/except`` construct should appear directly in the +generator function; doing this in a helper function that is not itself +a generator does not work. If ``raise StopIteration`` occurs directly +in a generator, simply replace it with ``return``. -Examples --------- -Generators which explicitly raise StopIteration can generally be +Examples of breakage +-------------------- + +Generators which explicitly raise ``StopIteration`` can generally be changed to simply return instead. This will be compatible with all -existing Python versions, and will not be affected by __future__. +existing Python versions, and will not be affected by ``__future__``. +Here are some illustrations from the standard library. Lib/ipaddress.py:: @@ -164,7 +183,7 @@ (The ``return`` is necessary for a strictly-equivalent translation, though in this particular file, there is no further code, and the -``return`` can be elided.) For compatibility with pre-3.3 versions +``return`` can be omitted.) For compatibility with pre-3.3 versions of Python, this could be written with an explicit ``for`` loop:: if context is None: @@ -172,10 +191,10 @@ yield line return -More complicated iteration patterns will need explicit try/catch -constructs. For example, a parser construct like this:: +More complicated iteration patterns will need explicit ``try/except`` +constructs. For example, a hypothetical parser like this:: - def unwrap(f): + def parser(f): while True: data = next(f) while True: @@ -227,7 +246,7 @@ visible. An iterator is an object with a ``__next__`` method. Like many other -dunder methods, it may either return a value, or raise a specific +special methods, it may either return a value, or raise a specific exception - in this case, ``StopIteration`` - to signal that it has no value to return. In this, it is similar to ``__getattr__`` (can raise ``AttributeError``), ``__getitem__`` (can raise ``KeyError``), @@ -271,9 +290,9 @@ deprecation warning if ``StopIteration`` bubbles out of a generator not under ``__future__`` import. -- Python 3.6: non-silent deprecation warning. +- Python 3.6: Non-silent deprecation warning. -- Python 3.7: enable new semantics everywhere. +- Python 3.7: Enable new semantics everywhere. Alternate proposals @@ -363,12 +382,12 @@ issues inherent to every other case where an exception has special meaning. 
For instance, an unexpected ``KeyError`` inside a ``__getitem__`` method will be interpreted as failure, rather than -permitted to bubble up. However, there is a difference. Dunder +permitted to bubble up. However, there is a difference. Special methods use ``return`` to indicate normality, and ``raise`` to signal abnormality; generators ``yield`` to indicate data, and ``return`` to signal the abnormal state. This makes explicitly raising ``StopIteration`` entirely redundant, and potentially surprising. If -other dunder methods had dedicated keywords to distinguish between +other special methods had dedicated keywords to distinguish between their return paths, they too could turn unexpected exceptions into ``RuntimeError``; the fact that they cannot should not preclude generators from doing so. -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Wed Nov 26 10:32:01 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Wed, 26 Nov 2014 10:32:01 +0100 Subject: [Python-checkins] Daily reference leaks (81b5268efff6): sum=6 Message-ID: results for 81b5268efff6 on branch "default" -------------------------------------------- test_collections leaked [0, 4, -2] references, sum=2 test_collections leaked [0, 2, -1] memory blocks, sum=1 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/refloge6yzZs', '-x'] From python-checkins at python.org Wed Nov 26 11:14:10 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Wed, 26 Nov 2014 10:14:10 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2319676=3A_Fixed_in?= =?utf-8?q?teger_overflow_issue_in_=22namereplace=22_error_handler=2E?= Message-ID: <20141126101353.84299.18537@psf.io> https://hg.python.org/cpython/rev/21d1571c0533 changeset: 93597:21d1571c0533 parent: 93592:81b5268efff6 user: Serhiy Storchaka date: Wed Nov 26 12:11:40 2014 +0200 summary: Issue #19676: Fixed integer overflow issue in "namereplace" error handler. 
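For context on the handler this patch hardens: ``namereplace`` (added by issue #19676, see the NEWS entry further below) replaces characters the target codec cannot encode with ``\N{...}`` escapes, and the fix below bounds the ``Py_ssize_t`` size computation for those replacement strings. A minimal usage sketch, with the output shown as expected rather than taken from this changeset::

    text = "naïve"
    print(text.encode("ascii", errors="namereplace"))
    # b'na\\N{LATIN SMALL LETTER I WITH DIAERESIS}ve'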
files: Python/codecs.c | 16 +++++++++++----- 1 files changed, 11 insertions(+), 5 deletions(-) diff --git a/Python/codecs.c b/Python/codecs.c --- a/Python/codecs.c +++ b/Python/codecs.c @@ -947,7 +947,8 @@ Py_ssize_t end; PyObject *res; unsigned char *outp; - int ressize; + Py_ssize_t ressize; + int replsize; Py_UCS4 c; char buffer[256]; /* NAME_MAXLEN */ if (PyUnicodeEncodeError_GetStart(exc, &start)) @@ -967,17 +968,21 @@ c = PyUnicode_READ_CHAR(object, i); if (ucnhash_CAPI && ucnhash_CAPI->getname(NULL, c, buffer, sizeof(buffer), 1)) { - ressize += 1+1+1+strlen(buffer)+1; + replsize = 1+1+1+strlen(buffer)+1; } else if (c >= 0x10000) { - ressize += 1+1+8; + replsize = 1+1+8; } else if (c >= 0x100) { - ressize += 1+1+4; + replsize = 1+1+4; } else - ressize += 1+1+2; + replsize = 1+1+2; + if (ressize > PY_SSIZE_T_MAX - replsize) + break; + ressize += replsize; } + end = i; res = PyUnicode_New(ressize, 127); if (res==NULL) return NULL; @@ -1014,6 +1019,7 @@ *outp++ = Py_hexdigits[c&0xf]; } + assert(out == start + ressize); assert(_PyUnicode_CheckConsistency(res, 1)); restuple = Py_BuildValue("(Nn)", res, end); Py_DECREF(object); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 16:52:45 2014 From: python-checkins at python.org (steve.dower) Date: Wed, 26 Nov 2014 15:52:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogVXBkYXRlIG1zaS5w?= =?utf-8?q?y_and_uuids=2Epy_for_2=2E7=2E9_releases?= Message-ID: <20141126155245.84293.68246@psf.io> https://hg.python.org/cpython/rev/4cf3ea8d565b changeset: 93598:4cf3ea8d565b branch: 2.7 parent: 93596:323f51ce8d86 user: Steve Dower date: Tue Nov 25 22:43:06 2014 -0800 summary: Update msi.py and uuids.py for 2.7.9 releases files: Tools/msi/msi.py | 8 ++++---- Tools/msi/uuids.py | 2 ++ 2 files changed, 6 insertions(+), 4 deletions(-) diff --git a/Tools/msi/msi.py b/Tools/msi/msi.py --- a/Tools/msi/msi.py +++ b/Tools/msi/msi.py @@ -912,9 +912,9 @@ ("Tk", "tk-8*", "license.terms"), ("Tix", "tix-*", "license.terms")): out.write("\nThis copy of Python includes a copy of %s, which is licensed under the following terms:\n\n" % name) - dirs = glob.glob(srcdir+"/../"+pat) + dirs = glob.glob(srcdir+"/externals/"+pat) if not dirs: - raise ValueError, "Could not find "+srcdir+"/../"+pat + raise ValueError, "Could not find "+srcdir+"/externals/"+pat if len(dirs) > 2: raise ValueError, "Multiple copies of "+pat dir = dirs[0] @@ -1117,7 +1117,7 @@ lib.start_component("TkDLLs", tcltk) lib.add_file("_tkinter.pyd") dlls.append("_tkinter.pyd") - tcldir = os.path.normpath(srcdir+("/../tcltk%s/bin" % tclsuffix)) + tcldir = os.path.normpath(srcdir+("/externals/tcltk%s/bin" % tclsuffix)) for f in glob.glob1(tcldir, "*.dll"): lib.add_file(f, src=os.path.join(tcldir, f)) # check whether there are any unknown extensions @@ -1141,7 +1141,7 @@ lib.add_file('libpython%s%s.a' % (major, minor)) if have_tcl: # Add Tcl/Tk - tcldirs = [(root, '../tcltk%s/lib' % tclsuffix, 'tcl')] + tcldirs = [(root, 'externals/tcltk%s/lib' % tclsuffix, 'tcl')] tcltk.set_current() while tcldirs: parent, phys, dir = tcldirs.pop() diff --git a/Tools/msi/uuids.py b/Tools/msi/uuids.py --- a/Tools/msi/uuids.py +++ b/Tools/msi/uuids.py @@ -66,4 +66,6 @@ '2.7.7121':'{5E0D187D-238B-4e96-9C75-C4CF141F5385}', # 2.7.7rc1 '2.7.7150':'{049CA433-77A0-4e48-AC76-180A282C4E10}', # 2.7.7 '2.7.8150':'{61121B12-88BD-4261-A6EE-AB32610A56DD}', # 2.7.8 + '2.7.9121':'{AAB1E8FF-6D00-4409-8F13-BE365AB92FFE}', # 2.7.9rc1 + '2.7.9150':'{79F081BF-7454-43DB-BD8F-9EE596813232}', 
# 2.7.9 } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 18:20:35 2014 From: python-checkins at python.org (steve.dower) Date: Wed, 26 Nov 2014 17:20:35 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Adds_missing_f?= =?utf-8?q?iles_to_msi=2Epy?= Message-ID: <20141126172035.55103.62039@psf.io> https://hg.python.org/cpython/rev/1dee86f69af7 changeset: 93599:1dee86f69af7 branch: 2.7 user: Steve Dower date: Wed Nov 26 09:20:00 2014 -0800 summary: Adds missing files to msi.py files: Tools/msi/msi.py | 2 ++ 1 files changed, 2 insertions(+), 0 deletions(-) diff --git a/Tools/msi/msi.py b/Tools/msi/msi.py --- a/Tools/msi/msi.py +++ b/Tools/msi/msi.py @@ -1019,6 +1019,8 @@ # Add additional files dirs[dir]=lib lib.glob("*.txt") + lib.glob("*.whl") + lib.glob("*.0") if dir=='site-packages': lib.add_file("README.txt", src="README") continue -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 18:33:19 2014 From: python-checkins at python.org (steve.dower) Date: Wed, 26 Nov 2014 17:33:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_Adds_missing_r?= =?utf-8?q?evocation=2Ecrl_test_file_to_msi=2Epy?= Message-ID: <20141126173257.69775.73461@psf.io> https://hg.python.org/cpython/rev/ac2175c5b743 changeset: 93600:ac2175c5b743 branch: 2.7 user: Steve Dower date: Wed Nov 26 09:32:41 2014 -0800 summary: Adds missing revocation.crl test file to msi.py files: Tools/msi/msi.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Tools/msi/msi.py b/Tools/msi/msi.py --- a/Tools/msi/msi.py +++ b/Tools/msi/msi.py @@ -1045,6 +1045,7 @@ lib.add_file("check_soundcard.vbs") lib.add_file("empty.vbs") lib.add_file("Sine-1000Hz-300ms.aif") + lib.add_file("revocation.crl") lib.glob("*.uue") lib.glob("*.pem") lib.glob("*.pck") -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 18:34:36 2014 From: python-checkins at python.org (guido.van.rossum) Date: Wed, 26 Nov 2014 17:34:36 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Chris_A=3A_Mention_Mark_Shann?= =?utf-8?q?on=27s_counterproposal_of_changing_next=28=29=2E_One_small?= Message-ID: <20141126173431.126790.4287@psf.io> https://hg.python.org/peps/rev/9695a84dc696 changeset: 5622:9695a84dc696 user: Guido van Rossum date: Wed Nov 26 09:34:12 2014 -0800 summary: Chris A: Mention Mark Shannon's counterproposal of changing next(). One small copy-edit. files: pep-0479.txt | 22 ++++++++++++++++++++-- 1 files changed, 20 insertions(+), 2 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -143,8 +143,8 @@ This is done by enclosing those places in the generator body where a ``StopIteration`` is expected (e.g. bare ``next()`` calls or in some cases helper functions that are expected to raise ``StopIteration``) -in a ``try/except`` construct that returns when ``StopIteration`` -returns. The ``try/except`` construct should appear directly in the +in a ``try/except`` construct that returns when ``StopIteration`` is +raised. The ``try/except`` construct should appear directly in the generator function; doing this in a helper function that is not itself a generator does not work. If ``raise StopIteration`` occurs directly in a generator, simply replace it with ``return``. @@ -364,6 +364,21 @@ bubble out would still be potentially wrong, depending on the use made of the distinction between the two exception types. 
+Converting the exception inside next() +-------------------------------------- + +Mark Shannon suggested [11]_ that the problem could be solved in +``next()`` rather than at the boundary of generator functions. By +having ``next()`` catch ``StopIteration`` and raise instead +``ValueError``, all unexpected ``StopIteration`` bubbling would be +prevented; however, the backward-incompatibility concerns are far +more serious than for the current proposal, as every ``next()`` call +now needs to be rewritten to guard against ``ValueError`` instead of +``StopIteration`` - not to mention that there is no way to write one +block of code which reliably works on multiple versions of Python. +(Using a dedicated exception type, perhaps subclassing ``ValueError``, +would help this; however, all code would still need to be rewritten.) + Criticism ========= @@ -426,6 +441,9 @@ .. [10] Tracker issue with Proof-of-Concept patch (http://bugs.python.org/issue22906) +.. [11] Post from Mark Shannon with alternate proposal + (https://mail.python.org/pipermail/python-dev/2014-November/137129.html) + Copyright ========= -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Wed Nov 26 19:07:14 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 18:07:14 +0000 Subject: [Python-checkins] =?utf-8?q?release=3A_only_send_gpg_sig_if_it_ex?= =?utf-8?q?ists?= Message-ID: <20141126180702.116320.7641@psf.io> https://hg.python.org/release/rev/4f6f8bb7881d changeset: 90:4f6f8bb7881d user: Benjamin Peterson date: Wed Nov 26 12:06:23 2014 -0600 summary: only send gpg sig if it exists files: add-to-pydotorg.py | 6 ++++-- 1 files changed, 4 insertions(+), 2 deletions(-) diff --git a/add-to-pydotorg.py b/add-to-pydotorg.py --- a/add-to-pydotorg.py +++ b/add-to-pydotorg.py @@ -100,7 +100,7 @@ def build_file_dict(release, rfile, rel_pk, file_desc, os_pk, add_desc): """Return a dictionary with all needed fields for a ReleaseFile object.""" - return dict( + d = dict( name = file_desc, slug = slug_for(release) + '-' + make_slug(file_desc)[:40], os = '/api/v1/downloads/os/%s/' % os_pk, @@ -108,7 +108,6 @@ description = add_desc, is_source = os_pk == 3, url = download_root + '%s/%s' % (release[:5], rfile), - gpg_signature_file = sigfile_for(release[:5], rfile), md5_sum = md5sum_for(release, rfile), filesize = filesize_for(release, rfile), download_button = 'tar.xz' in rfile or @@ -116,6 +115,9 @@ 'macosx10.6.pkg' in rfile or ('.msi' in rfile and not 'amd64' in rfile), ) + if os.path.exists(ftp_root + "%s/%s.asc" % (release[:5], rfile)): + d["gpg_signature_file"] = sigfile_for(release[:5], rfile) + return d def list_files(release): """List all of the release's download files.""" -- Repository URL: https://hg.python.org/release From python-checkins at python.org Wed Nov 26 20:58:41 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 19:58:41 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_add_readline=2Eappend=5Fhi?= =?utf-8?q?story=5Ffile_=28closes_=2322940=29?= Message-ID: <20141126195834.84295.69186@psf.io> https://hg.python.org/cpython/rev/ff00588791be changeset: 93601:ff00588791be parent: 93597:21d1571c0533 user: Benjamin Peterson date: Wed Nov 26 13:58:16 2014 -0600 summary: add readline.append_history_file (closes #22940) patch by "bru" files: Doc/library/readline.rst | 29 ++++++++++++++++++- Lib/test/test_readline.py | 40 ++++++++++++++++++++++++++- Misc/NEWS | 2 + Modules/readline.c | 37 ++++++++++++++++++++++++ 4 files changed, 106 
insertions(+), 2 deletions(-) diff --git a/Doc/library/readline.rst b/Doc/library/readline.rst --- a/Doc/library/readline.rst +++ b/Doc/library/readline.rst @@ -59,6 +59,14 @@ Save a readline history file. The default filename is :file:`~/.history`. +.. function:: append_history_file(nelements[, filename]) + + Append the last *nelements* of history to a file. The default filename is + :file:`~/.history`. The file must already exist. + + .. versionadded:: 3.5 + + .. function:: clear_history() Clear the current history. (Note: this function is not available if the @@ -209,6 +217,26 @@ This code is actually automatically run when Python is run in :ref:`interactive mode ` (see :ref:`rlcompleter-config`). +The following example achieves the same goal but supports concurrent interactive +sessions, by only appending the new history. :: + + import atexit + import os + import readline + histfile = os.path.join(os.path.expanduser("~"), ".python_history") + + try: + readline.read_history_file(histfile) + h_len = readline.get_current_history_length() + except FileNotFoundError: + open(histfile, 'wb').close() + h_len = 0 + + def save(prev_h_len, histfile): + new_h_len = readline.get_current_history_length() + readline.append_history_file(new_h_len - prev_h_len, histfile) + atexit.register(save, h_len, histfile) + The following example extends the :class:`code.InteractiveConsole` class to support history save/restore. :: @@ -234,4 +262,3 @@ def save_history(self, histfile): readline.write_history_file(histfile) - diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -2,8 +2,9 @@ Very minimal unittests for parts of the readline module. """ import os +import tempfile import unittest -from test.support import run_unittest, import_module +from test.support import run_unittest, import_module, unlink from test.script_helper import assert_python_ok # Skip tests if there is no readline module @@ -42,6 +43,43 @@ self.assertEqual(readline.get_current_history_length(), 1) + def test_write_read_append(self): + hfile = tempfile.NamedTemporaryFile(delete=False) + hfile.close() + hfilename = hfile.name + self.addCleanup(unlink, hfilename) + + # test write-clear-read == nop + readline.clear_history() + readline.add_history("first line") + readline.add_history("second line") + readline.write_history_file(hfilename) + + readline.clear_history() + self.assertEqual(readline.get_current_history_length(), 0) + + readline.read_history_file(hfilename) + self.assertEqual(readline.get_current_history_length(), 2) + self.assertEqual(readline.get_history_item(1), "first line") + self.assertEqual(readline.get_history_item(2), "second line") + + # test append + readline.append_history_file(1, hfilename) + readline.clear_history() + readline.read_history_file(hfilename) + self.assertEqual(readline.get_current_history_length(), 3) + self.assertEqual(readline.get_history_item(1), "first line") + self.assertEqual(readline.get_history_item(2), "second line") + self.assertEqual(readline.get_history_item(3), "second line") + + # test 'no such file' behaviour + os.unlink(hfilename) + with self.assertRaises(FileNotFoundError): + readline.append_history_file(1, hfilename) + + # write_history_file can create the target + readline.write_history_file(hfilename) + class TestReadline(unittest.TestCase): diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,8 @@ Library ------- +- Issue #22940: Add readline.append_history_file. 
+ - Issue #19676: Added the "namereplace" error handler. - Issue #22788: Add *context* parameter to logging.handlers.HTTPHandler. diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -237,6 +237,41 @@ The default filename is ~/.history."); +/* Exported function to save part of a readline history file */ + +static PyObject * +append_history_file(PyObject *self, PyObject *args) +{ + int nelements; + PyObject *filename_obj = Py_None, *filename_bytes; + char *filename; + int err; + if (!PyArg_ParseTuple(args, "i|O:append_history_file", &nelements, &filename_obj)) + return NULL; + if (filename_obj != Py_None) { + if (!PyUnicode_FSConverter(filename_obj, &filename_bytes)) + return NULL; + filename = PyBytes_AsString(filename_bytes); + } else { + filename_bytes = NULL; + filename = NULL; + } + errno = err = append_history(nelements, filename); + if (!err && _history_length >= 0) + history_truncate_file(filename, _history_length); + Py_XDECREF(filename_bytes); + errno = err; + if (errno) + return PyErr_SetFromErrno(PyExc_IOError); + Py_RETURN_NONE; +} + +PyDoc_STRVAR(doc_append_history_file, +"append_history_file(nelements[, filename]) -> None\n\ +Append the last nelements of the history list to file.\n\ +The default filename is ~/.history."); + + /* Set history length */ static PyObject* @@ -747,6 +782,8 @@ METH_VARARGS, doc_read_history_file}, {"write_history_file", write_history_file, METH_VARARGS, doc_write_history_file}, + {"append_history_file", append_history_file, + METH_VARARGS, doc_append_history_file}, {"get_history_item", get_history_item, METH_VARARGS, doc_get_history_item}, {"get_current_history_length", (PyCFunction)get_current_history_length, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:21:04 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:21:04 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_fix_variable_name?= Message-ID: <20141126202100.84297.36470@psf.io> https://hg.python.org/cpython/rev/ce8a8531d29a changeset: 93602:ce8a8531d29a user: Benjamin Peterson date: Wed Nov 26 14:20:51 2014 -0600 summary: fix variable name files: Python/codecs.c | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Python/codecs.c b/Python/codecs.c --- a/Python/codecs.c +++ b/Python/codecs.c @@ -1019,7 +1019,7 @@ *outp++ = Py_hexdigits[c&0xf]; } - assert(out == start + ressize); + assert(outp == start + ressize); assert(_PyUnicode_CheckConsistency(res, 1)); restuple = Py_BuildValue("(Nn)", res, end); Py_DECREF(object); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:35:24 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:35:24 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_only_support_append=5Fhist?= =?utf-8?q?ory_if_readline_has_it?= Message-ID: <20141126203521.84295.28194@psf.io> https://hg.python.org/cpython/rev/031ab6d4a0f3 changeset: 93603:031ab6d4a0f3 user: Benjamin Peterson date: Wed Nov 26 14:35:12 2014 -0600 summary: only support append_history if readline has it files: Lib/test/test_readline.py | 2 + Modules/readline.c | 4 ++ configure | 43 +++++++++++++++++++++++++++ configure.ac | 4 ++ pyconfig.h.in | 3 + 5 files changed, 56 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -43,6 +43,8 @@ 
self.assertEqual(readline.get_current_history_length(), 1) + @unittest.skipUnless(hasattr(readline, "append_history"), + "append_history not available") def test_write_read_append(self): hfile = tempfile.NamedTemporaryFile(delete=False) hfile.close() diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -237,6 +237,7 @@ The default filename is ~/.history."); +#ifdef HAVE_RL_APPEND_HISTORY /* Exported function to save part of a readline history file */ static PyObject * @@ -270,6 +271,7 @@ "append_history_file(nelements[, filename]) -> None\n\ Append the last nelements of the history list to file.\n\ The default filename is ~/.history."); +#endif /* Set history length */ @@ -782,7 +784,9 @@ METH_VARARGS, doc_read_history_file}, {"write_history_file", write_history_file, METH_VARARGS, doc_write_history_file}, +#ifdef HAVE_RL_APPEND_HISTORY {"append_history_file", append_history_file, +#endif METH_VARARGS, doc_append_history_file}, {"get_history_item", get_history_item, METH_VARARGS, doc_get_history_item}, diff --git a/configure b/configure --- a/configure +++ b/configure @@ -14529,6 +14529,49 @@ fi +{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for append_history in -lreadline" >&5 +$as_echo_n "checking for append_history in -lreadline... " >&6; } +if ${ac_cv_lib_readline_append_history+:} false; then : + $as_echo_n "(cached) " >&6 +else + ac_check_lib_save_LIBS=$LIBS +LIBS="-lreadline $READLINE_LIBS $LIBS" +cat confdefs.h - <<_ACEOF >conftest.$ac_ext +/* end confdefs.h. */ + +/* Override any GCC internal prototype to avoid an error. + Use char because int might match the return type of a GCC + builtin and then its argument prototype would still apply. */ +#ifdef __cplusplus +extern "C" +#endif +char append_history (); +int +main () +{ +return append_history (); + ; + return 0; +} +_ACEOF +if ac_fn_c_try_link "$LINENO"; then : + ac_cv_lib_readline_append_history=yes +else + ac_cv_lib_readline_append_history=no +fi +rm -f core conftest.err conftest.$ac_objext \ + conftest$ac_exeext conftest.$ac_ext +LIBS=$ac_check_lib_save_LIBS +fi +{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $ac_cv_lib_readline_append_history" >&5 +$as_echo "$ac_cv_lib_readline_append_history" >&6; } +if test "x$ac_cv_lib_readline_append_history" = xyes; then : + +$as_echo "#define HAVE_RL_APPEND_HISTORY 1" >>confdefs.h + +fi + + # End of readline checks: restore LIBS LIBS=$LIBS_no_readline diff --git a/configure.ac b/configure.ac --- a/configure.ac +++ b/configure.ac @@ -4308,6 +4308,10 @@ [Define if you can turn off readline's signal handling.]), ) fi +AC_CHECK_LIB(readline, append_history, + AC_DEFINE(HAVE_RL_APPEND_HISTORY, 1, + [Define if readline supports append_history]), ,$READLINE_LIBS) + # End of readline checks: restore LIBS LIBS=$LIBS_no_readline diff --git a/pyconfig.h.in b/pyconfig.h.in --- a/pyconfig.h.in +++ b/pyconfig.h.in @@ -690,6 +690,9 @@ /* Define to 1 if you have the `renameat' function. 
*/ #undef HAVE_RENAMEAT +/* Define if readline supports append_history */ +#undef HAVE_RL_APPEND_HISTORY + /* Define if you have readline 2.1 */ #undef HAVE_RL_CALLBACK -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:36:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:36:23 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_use_skipUnless?= Message-ID: <20141126203620.55109.7528@psf.io> https://hg.python.org/cpython/rev/812f31cbe6be changeset: 93604:812f31cbe6be branch: 3.4 parent: 93591:e635c3ba75c8 user: Benjamin Peterson date: Wed Nov 26 14:35:56 2014 -0600 summary: use skipUnless files: Lib/test/test_readline.py | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -16,9 +16,9 @@ why the tests cover only a small subset of the interface. """ - @unittest.skipIf(not hasattr(readline, 'clear_history'), - "The history update test cannot be run because the " - "clear_history method is not available.") + @unittest.skipUnless(hasattr(readline, "clear_history"), + "The history update test cannot be run because the " + "clear_history method is not available.") def testHistoryUpdates(self): readline.clear_history() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:36:23 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:36:23 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141126203620.126780.41547@psf.io> https://hg.python.org/cpython/rev/6528f943c1bd changeset: 93605:6528f943c1bd parent: 93603:031ab6d4a0f3 parent: 93604:812f31cbe6be user: Benjamin Peterson date: Wed Nov 26 14:36:08 2014 -0600 summary: merge 3.4 files: Lib/test/test_readline.py | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -17,9 +17,9 @@ why the tests cover only a small subset of the interface. """ - @unittest.skipIf(not hasattr(readline, 'clear_history'), - "The history update test cannot be run because the " - "clear_history method is not available.") + @unittest.skipUnless(hasattr(readline, "clear_history"), + "The history update test cannot be run because the " + "clear_history method is not available.") def testHistoryUpdates(self): readline.clear_history() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:37:36 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:37:36 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_use_skipUnless?= Message-ID: <20141126203732.116316.54839@psf.io> https://hg.python.org/cpython/rev/3f5ac9f43027 changeset: 93606:3f5ac9f43027 branch: 2.7 parent: 93600:ac2175c5b743 user: Benjamin Peterson date: Wed Nov 26 14:35:56 2014 -0600 summary: use skipUnless files: Lib/test/test_readline.py | 6 +++--- 1 files changed, 3 insertions(+), 3 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -15,9 +15,9 @@ That's why the tests cover only a small subset of the interface. 
""" - @unittest.skipIf(not hasattr(readline, 'clear_history'), - "The history update test cannot be run because the " - "clear_history method is not available.") + @unittest.skipUnless(hasattr(readline, "clear_history"), + "The history update test cannot be run because the " + "clear_history method is not available.") def testHistoryUpdates(self): readline.clear_history() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 21:42:12 2014 From: python-checkins at python.org (benjamin.peterson) Date: Wed, 26 Nov 2014 20:42:12 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_correct_assertion?= Message-ID: <20141126204209.126764.78991@psf.io> https://hg.python.org/cpython/rev/edc8a0bb95aa changeset: 93607:edc8a0bb95aa parent: 93605:6528f943c1bd user: Benjamin Peterson date: Wed Nov 26 14:39:54 2014 -0600 summary: correct assertion files: Python/codecs.c | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Python/codecs.c b/Python/codecs.c --- a/Python/codecs.c +++ b/Python/codecs.c @@ -1019,7 +1019,7 @@ *outp++ = Py_hexdigits[c&0xf]; } - assert(outp == start + ressize); + assert(outp == PyUnicode_1BYTE_DATA(res) + ressize); assert(_PyUnicode_CheckConsistency(res, 1)); restuple = Py_BuildValue("(Nn)", res, end); Py_DECREF(object); -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Wed Nov 26 22:03:13 2014 From: python-checkins at python.org (ned.deily) Date: Wed, 26 Nov 2014 21:03:13 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_22940=3A_fixes_to_ed?= =?utf-8?q?itline_support?= Message-ID: <20141126210305.55115.10674@psf.io> https://hg.python.org/cpython/rev/c8bcede1b37a changeset: 93608:c8bcede1b37a user: Ned Deily date: Wed Nov 26 13:02:33 2014 -0800 summary: Issue 22940: fixes to editline support files: Lib/test/test_readline.py | 2 +- Modules/readline.c | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_readline.py b/Lib/test/test_readline.py --- a/Lib/test/test_readline.py +++ b/Lib/test/test_readline.py @@ -43,7 +43,7 @@ self.assertEqual(readline.get_current_history_length(), 1) - @unittest.skipUnless(hasattr(readline, "append_history"), + @unittest.skipUnless(hasattr(readline, "append_history_file"), "append_history not available") def test_write_read_append(self): hfile = tempfile.NamedTemporaryFile(delete=False) diff --git a/Modules/readline.c b/Modules/readline.c --- a/Modules/readline.c +++ b/Modules/readline.c @@ -786,8 +786,8 @@ METH_VARARGS, doc_write_history_file}, #ifdef HAVE_RL_APPEND_HISTORY {"append_history_file", append_history_file, + METH_VARARGS, doc_append_history_file}, #endif - METH_VARARGS, doc_append_history_file}, {"get_history_item", get_history_item, METH_VARARGS, doc_get_history_item}, {"get_current_history_length", (PyCFunction)get_current_history_length, -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 05:58:49 2014 From: python-checkins at python.org (zach.ware) Date: Thu, 27 Nov 2014 04:58:49 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_with_3=2E4?= Message-ID: <20141127045848.84299.7520@psf.io> https://hg.python.org/cpython/rev/7fe7ef360941 changeset: 93610:7fe7ef360941 parent: 93608:c8bcede1b37a parent: 93609:6fce36de7916 user: Zachary Ware date: Wed Nov 26 22:58:25 2014 -0600 summary: Merge with 3.4 files: Doc/library/pydoc.rst | 10 ++++------ 1 files changed, 4 insertions(+), 6 deletions(-) diff --git 
a/Doc/library/pydoc.rst b/Doc/library/pydoc.rst --- a/Doc/library/pydoc.rst +++ b/Doc/library/pydoc.rst @@ -66,11 +66,6 @@ documentation at ``http://localhost:1234/`` in your preferred Web browser. Specifying ``0`` as the port number will select an arbitrary unused port. -:program:`pydoc -g` will start the server and additionally bring up a -small :mod:`tkinter`\ -based graphical interface to help you search for -documentation pages. The ``-g`` option is deprecated, since the server can -now be controlled directly from HTTP clients. - :program:`pydoc -b` will start the server and additionally open a web browser to a module index page. Each served page has a navigation bar at the top where you can *Get* help on an individual item, *Search* all modules with a @@ -90,7 +85,10 @@ Reference Manual pages. .. versionchanged:: 3.2 - Added the ``-b`` option, deprecated the ``-g`` option. + Added the ``-b`` option. + +.. versionchanged:: 3.3 + The ``-g`` command line option was removed. .. versionchanged:: 3.4 :mod:`pydoc` now uses :func:`inspect.signature` rather than -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 05:58:48 2014 From: python-checkins at python.org (zach.ware) Date: Thu, 27 Nov 2014 04:58:48 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogcHlkb2M6IFJlbW92?= =?utf-8?q?e_mention_of_=27-g=27_command_line_option=2C_document_its_remov?= =?utf-8?b?YWwu?= Message-ID: <20141127045848.84299.77260@psf.io> https://hg.python.org/cpython/rev/6fce36de7916 changeset: 93609:6fce36de7916 branch: 3.4 parent: 93604:812f31cbe6be user: Zachary Ware date: Wed Nov 26 22:57:35 2014 -0600 summary: pydoc: Remove mention of '-g' command line option, document its removal. files: Doc/library/pydoc.rst | 10 ++++------ 1 files changed, 4 insertions(+), 6 deletions(-) diff --git a/Doc/library/pydoc.rst b/Doc/library/pydoc.rst --- a/Doc/library/pydoc.rst +++ b/Doc/library/pydoc.rst @@ -66,11 +66,6 @@ documentation at ``http://localhost:1234/`` in your preferred Web browser. Specifying ``0`` as the port number will select an arbitrary unused port. -:program:`pydoc -g` will start the server and additionally bring up a -small :mod:`tkinter`\ -based graphical interface to help you search for -documentation pages. The ``-g`` option is deprecated, since the server can -now be controlled directly from HTTP clients. - :program:`pydoc -b` will start the server and additionally open a web browser to a module index page. Each served page has a navigation bar at the top where you can *Get* help on an individual item, *Search* all modules with a @@ -90,7 +85,10 @@ Reference Manual pages. .. versionchanged:: 3.2 - Added the ``-b`` option, deprecated the ``-g`` option. + Added the ``-b`` option. + +.. versionchanged:: 3.3 + The ``-g`` command line option was removed. .. 
versionchanged:: 3.4 :mod:`pydoc` now uses :func:`inspect.signature` rather than -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:06:06 2014 From: python-checkins at python.org (benjamin.peterson) Date: Thu, 27 Nov 2014 05:06:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_remove_tautolo?= =?utf-8?q?gical_condition_=28closes_=2322954=29?= Message-ID: <20141127050606.55099.26922@psf.io> https://hg.python.org/cpython/rev/a498e599ce6a changeset: 93611:a498e599ce6a branch: 3.4 parent: 93609:6fce36de7916 user: Benjamin Peterson date: Wed Nov 26 23:03:11 2014 -0600 summary: remove tautological condition (closes #22954) files: Objects/typeobject.c | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Objects/typeobject.c b/Objects/typeobject.c --- a/Objects/typeobject.c +++ b/Objects/typeobject.c @@ -5342,7 +5342,7 @@ "%s.__new__(%s) is not safe, use %s.__new__()", type->tp_name, subtype->tp_name, - staticbase == NULL ? "?" : staticbase->tp_name); + staticbase->tp_name); return NULL; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:06:07 2014 From: python-checkins at python.org (benjamin.peterson) Date: Thu, 27 Nov 2014 05:06:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI5NTQp?= Message-ID: <20141127050606.116326.99526@psf.io> https://hg.python.org/cpython/rev/d502b5d60e00 changeset: 93612:d502b5d60e00 parent: 93610:7fe7ef360941 parent: 93611:a498e599ce6a user: Benjamin Peterson date: Wed Nov 26 23:03:34 2014 -0600 summary: merge 3.4 (#22954) files: Objects/typeobject.c | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Objects/typeobject.c b/Objects/typeobject.c --- a/Objects/typeobject.c +++ b/Objects/typeobject.c @@ -5381,7 +5381,7 @@ "%s.__new__(%s) is not safe, use %s.__new__()", type->tp_name, subtype->tp_name, - staticbase == NULL ? "?" : staticbase->tp_name); + staticbase->tp_name); return NULL; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:06:07 2014 From: python-checkins at python.org (benjamin.peterson) Date: Thu, 27 Nov 2014 05:06:07 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_remove_tautolo?= =?utf-8?q?gical_condition_=28closes_=2322954=29?= Message-ID: <20141127050607.116318.5445@psf.io> https://hg.python.org/cpython/rev/ec21b41e588b changeset: 93613:ec21b41e588b branch: 2.7 parent: 93606:3f5ac9f43027 user: Benjamin Peterson date: Wed Nov 26 23:03:11 2014 -0600 summary: remove tautological condition (closes #22954) files: Objects/typeobject.c | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Objects/typeobject.c b/Objects/typeobject.c --- a/Objects/typeobject.c +++ b/Objects/typeobject.c @@ -4798,7 +4798,7 @@ "%s.__new__(%s) is not safe, use %s.__new__()", type->tp_name, subtype->tp_name, - staticbase == NULL ? "?" 
: staticbase->tp_name); + staticbase->tp_name); return NULL; } -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:18:14 2014 From: python-checkins at python.org (ethan.furman) Date: Thu, 27 Nov 2014 05:18:14 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogKDMuNCkgSXNzdWUy?= =?utf-8?q?2780=3A_reword_NotImplemented_docs_to_emphasise_should?= Message-ID: <20141127051811.84291.12017@psf.io> https://hg.python.org/cpython/rev/ebb8865dcf54 changeset: 93614:ebb8865dcf54 branch: 3.4 parent: 93611:a498e599ce6a user: Ethan Furman date: Wed Nov 26 21:15:35 2014 -0800 summary: (3.4) Issue22780: reword NotImplemented docs to emphasise should files: Doc/library/constants.rst | 21 ++++++++++++++++++--- Doc/library/numbers.rst | 2 ++ Doc/reference/datamodel.rst | 7 ++++++- 3 files changed, 26 insertions(+), 4 deletions(-) diff --git a/Doc/library/constants.rst b/Doc/library/constants.rst --- a/Doc/library/constants.rst +++ b/Doc/library/constants.rst @@ -26,9 +26,24 @@ .. data:: NotImplemented - Special value which can be returned by the "rich comparison" special methods - (:meth:`__eq__`, :meth:`__lt__`, and friends), to indicate that the comparison - is not implemented with respect to the other type. + Special value which should be returned by the binary special methods + (e.g. :meth:`__eq__`, :meth:`__lt__`, :meth:`__add__`, :meth:`__rsub__`, + etc.) to indicate that the operation is not implemented with respect to + the other type; may be returned by the in-place binary special methods + (e.g. :meth:`__imul__`, :meth:`__iand__`, etc.) for the same purpose. + Its truth value is true. + +.. note:: + + When ``NotImplemented`` is returned, the interpreter will then try the + reflected operation on the other type, or some other fallback, depending + on the operator. If all attempted operations return ``NotImplemented``, the + interpreter will raise an appropriate exception. + + See + :ref:`implementing-the-arithmetic-operations` + for more details. + .. data:: Ellipsis diff --git a/Doc/library/numbers.rst b/Doc/library/numbers.rst --- a/Doc/library/numbers.rst +++ b/Doc/library/numbers.rst @@ -110,6 +110,8 @@ MyFoo.register(Real) +.. _implementing-the-arithmetic-operations: + Implementing the arithmetic operations ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ diff --git a/Doc/reference/datamodel.rst b/Doc/reference/datamodel.rst --- a/Doc/reference/datamodel.rst +++ b/Doc/reference/datamodel.rst @@ -154,11 +154,16 @@ This type has a single value. There is a single object with this value. This object is accessed through the built-in name ``NotImplemented``. Numeric methods - and rich comparison methods may return this value if they do not implement the + and rich comparison methods should return this value if they do not implement the operation for the operands provided. (The interpreter will then try the reflected operation, or some other fallback, depending on the operator.) Its truth value is true. + See + :ref:`implementing-the-arithmetic-operations` + for more details. + + Ellipsis .. 
index:: object: Ellipsis -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:18:15 2014 From: python-checkins at python.org (ethan.furman) Date: Thu, 27 Nov 2014 05:18:15 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue22780=3A_reword_NotImplemented_docs_to_emphasise_sh?= =?utf-8?q?ould?= Message-ID: <20141127051811.116320.10028@psf.io> https://hg.python.org/cpython/rev/b6ee02acaae9 changeset: 93615:b6ee02acaae9 parent: 93612:d502b5d60e00 parent: 93614:ebb8865dcf54 user: Ethan Furman date: Wed Nov 26 21:17:53 2014 -0800 summary: Issue22780: reword NotImplemented docs to emphasise should files: Doc/library/constants.rst | 20 +++++++++++++++++--- Doc/library/numbers.rst | 2 ++ Doc/reference/datamodel.rst | 7 ++++++- 3 files changed, 25 insertions(+), 4 deletions(-) diff --git a/Doc/library/constants.rst b/Doc/library/constants.rst --- a/Doc/library/constants.rst +++ b/Doc/library/constants.rst @@ -26,9 +26,23 @@ .. data:: NotImplemented - Special value which should be returned by the special methods - (:meth:`__eq__`, :meth:`__lt__`, :meth:`__add__`, etc.) to indicate - that the operation is not implemented with respect to the other type. + Special value which should be returned by the binary special methods + (e.g. :meth:`__eq__`, :meth:`__lt__`, :meth:`__add__`, :meth:`__rsub__`, + etc.) to indicate that the operation is not implemented with respect to + the other type; may be returned by the in-place binary special methods + (e.g. :meth:`__imul__`, :meth:`__iand__`, etc.) for the same purpose. + Its truth value is true. + +.. note:: + + When ``NotImplemented`` is returned, the interpreter will then try the + reflected operation on the other type, or some other fallback, depending + on the operator. If all attempted operations return ``NotImplemented``, the + interpreter will raise an appropriate exception. + + See + :ref:`implementing-the-arithmetic-operations` + for more details. .. data:: Ellipsis diff --git a/Doc/library/numbers.rst b/Doc/library/numbers.rst --- a/Doc/library/numbers.rst +++ b/Doc/library/numbers.rst @@ -110,6 +110,8 @@ MyFoo.register(Real) +.. _implementing-the-arithmetic-operations: + Implementing the arithmetic operations ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ diff --git a/Doc/reference/datamodel.rst b/Doc/reference/datamodel.rst --- a/Doc/reference/datamodel.rst +++ b/Doc/reference/datamodel.rst @@ -154,11 +154,16 @@ This type has a single value. There is a single object with this value. This object is accessed through the built-in name ``NotImplemented``. Numeric methods - and rich comparison methods may return this value if they do not implement the + and rich comparison methods should return this value if they do not implement the operation for the operands provided. (The interpreter will then try the reflected operation, or some other fallback, depending on the operator.) Its truth value is true. + See + :ref:`implementing-the-arithmetic-operations` + for more details. + + Ellipsis .. 
index:: object: Ellipsis -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:57:09 2014 From: python-checkins at python.org (zach.ware) Date: Thu, 27 Nov 2014 05:57:09 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_with_3=2E4?= Message-ID: <20141127055708.84283.93631@psf.io> https://hg.python.org/cpython/rev/1c97f373fe49 changeset: 93617:1c97f373fe49 parent: 93615:b6ee02acaae9 parent: 93616:589c65dc528c user: Zachary Ware date: Wed Nov 26 23:56:10 2014 -0600 summary: Merge with 3.4 files: Doc/library/pydoc.rst | 4 ++++ 1 files changed, 4 insertions(+), 0 deletions(-) diff --git a/Doc/library/pydoc.rst b/Doc/library/pydoc.rst --- a/Doc/library/pydoc.rst +++ b/Doc/library/pydoc.rst @@ -51,6 +51,10 @@ executed on that occasion. Use an ``if __name__ == '__main__':`` guard to only execute code when a file is invoked as a script and not just imported. +When printing output to the console, :program:`pydoc` attempts to paginate the +output for easier reading. If the :envvar:`PAGER` environment variable is set, +:program:`pydoc` will use its value as a pagination program. + Specifying a ``-w`` flag before the argument will cause HTML documentation to be written out to a file in the current directory, instead of displaying text on the console. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:57:09 2014 From: python-checkins at python.org (zach.ware) Date: Thu, 27 Nov 2014 05:57:09 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogcHlkb2M6IEFkZCBh?= =?utf-8?q?_note_about_setting_PAGER_to_affect_console_output_pagination?= =?utf-8?q?=2E?= Message-ID: <20141127055707.55107.68912@psf.io> https://hg.python.org/cpython/rev/589c65dc528c changeset: 93616:589c65dc528c branch: 3.4 parent: 93614:ebb8865dcf54 user: Zachary Ware date: Wed Nov 26 23:44:25 2014 -0600 summary: pydoc: Add a note about setting PAGER to affect console output pagination. Suggested by James Lowden on docs at . files: Doc/library/pydoc.rst | 4 ++++ 1 files changed, 4 insertions(+), 0 deletions(-) diff --git a/Doc/library/pydoc.rst b/Doc/library/pydoc.rst --- a/Doc/library/pydoc.rst +++ b/Doc/library/pydoc.rst @@ -51,6 +51,10 @@ executed on that occasion. Use an ``if __name__ == '__main__':`` guard to only execute code when a file is invoked as a script and not just imported. +When printing output to the console, :program:`pydoc` attempts to paginate the +output for easier reading. If the :envvar:`PAGER` environment variable is set, +:program:`pydoc` will use its value as a pagination program. + Specifying a ``-w`` flag before the argument will cause HTML documentation to be written out to a file in the current directory, instead of displaying text on the console. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 06:59:20 2014 From: python-checkins at python.org (zach.ware) Date: Thu, 27 Nov 2014 05:59:20 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogcHlkb2M6IEFkZCBh?= =?utf-8?q?_note_about_setting_PAGER_to_affect_console_output_pagination?= =?utf-8?q?=2E?= Message-ID: <20141127055919.116308.76474@psf.io> https://hg.python.org/cpython/rev/ac65f90c1214 changeset: 93618:ac65f90c1214 branch: 2.7 parent: 93613:ec21b41e588b user: Zachary Ware date: Wed Nov 26 23:44:25 2014 -0600 summary: pydoc: Add a note about setting PAGER to affect console output pagination. Suggested by James Lowden on docs at . 
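The documented behaviour can also be exercised programmatically. A minimal sketch (not part of the checkin; the pager name is an assumption, and pydoc only hands output to a pager when writing to an interactive terminal)::

    import os
    import pydoc

    # Choose the pagination program before pydoc pages anything for the
    # first time; pydoc consults the PAGER environment variable when the
    # output stream is a terminal, and prints plainly otherwise.
    os.environ["PAGER"] = "less"          # hypothetical pager choice
    pydoc.pager("\n".join("line %d" % i for i in range(200)))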
files: Doc/library/pydoc.rst | 4 ++++ 1 files changed, 4 insertions(+), 0 deletions(-) diff --git a/Doc/library/pydoc.rst b/Doc/library/pydoc.rst --- a/Doc/library/pydoc.rst +++ b/Doc/library/pydoc.rst @@ -53,6 +53,10 @@ executed on that occasion. Use an ``if __name__ == '__main__':`` guard to only execute code when a file is invoked as a script and not just imported. +When printing output to the console, :program:`pydoc` attempts to paginate the +output for easier reading. If the :envvar:`PAGER` environment variable is set, +:program:`pydoc` will use its value as a pagination program. + Specifying a ``-w`` flag before the argument will cause HTML documentation to be written out to a file in the current directory, instead of displaying text on the console. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 07:07:37 2014 From: python-checkins at python.org (guido.van.rossum) Date: Thu, 27 Nov 2014 06:07:37 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_New_section_with_contextlib_e?= =?utf-8?q?xample_=28Isaac_Schwabacher=29=2E?= Message-ID: <20141127060734.69805.43675@psf.io> https://hg.python.org/peps/rev/bb0f11810471 changeset: 5623:bb0f11810471 user: Guido van Rossum date: Wed Nov 26 22:07:29 2014 -0800 summary: New section with contextlib example (Isaac Schwabacher). Other additions by Chris, including renumbered references. files: pep-0479.txt | 105 ++++++++++++++++++++++++++++++-------- 1 files changed, 82 insertions(+), 23 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -37,12 +37,39 @@ generator to terminate silently. (When another exception is raised, a traceback is printed pinpointing the cause of the problem.) -The proposal also clears up the confusion about how to terminate a -generator: the proper way is ``return``, not ``raise StopIteration``. +This is particularly pernicious in combination with the ``yield from`` +construct of PEP 380 [1]_, as it breaks the abstraction that a +subgenerator may be factored out of a generator. That PEP notes this +limitation, but notes that "use cases for these [are] rare to non- +existent". Unfortunately while intentional use is rare, it is easy to +stumble on these cases by accident:: -Finally, the proposal reduces the difference between list + @contextlib.contextmanager + def transaction(): + begin() + try: + yield from do_it() + except: + rollback() + raise + else: + commit() + + def do_it(): + initial_preparations() + yield + finishing_touches() + +Here factoring out ``do_it`` into a subgenerator has introduced a +subtle bug: if the wrapped block raises ``StopIteration``, under the +current behavior ``do_it`` will fail but report success by returning +normally, causing the failed transaction to be committed! Similarly +problematic behavior occurs when an ``asyncio`` coroutine raises +``StopIteration``, causing it to terminate silently. + +Additionally, the proposal reduces the difference between list comprehensions and generator expressions, preventing surprises such as -the one that started this discussion [1]_. Henceforth, the following +the one that started this discussion [2]_. Henceforth, the following statements will produce the same result if either produces a result at all:: @@ -56,6 +83,10 @@ will raise an exception at this point (albeit ``RuntimeError`` in the first case and ``StopIteration`` in the second). 
+Finally, the proposal also clears up the confusion about how to +terminate a generator: the proper way is ``return``, not +``raise StopIteration``. + Background information ====================== @@ -77,7 +108,7 @@ If a ``StopIteration`` is about to bubble out of a generator frame, it is replaced with ``RuntimeError``, which causes the ``next()`` call (which invoked the generator) to fail, passing that exception out. -From then on it's just like any old exception. [3]_ +From then on it's just like any old exception. [4]_ This affects the third outcome listed above, without altering any other effects. Furthermore, it only affects this outcome when the @@ -119,10 +150,10 @@ This change will affect existing code that depends on ``StopIteration`` bubbling up. The pure Python reference -implementation of ``groupby`` [2]_ currently has comments "Exit on +implementation of ``groupby`` [3]_ currently has comments "Exit on ``StopIteration``" where it is expected that the exception will propagate and then be handled. This will be unusual, but not unknown, -and such constructs will fail. Other examples abound, e.g. [5]_, [6]_. +and such constructs will fail. Other examples abound, e.g. [6]_, [7]_. (Nick Coghlan comments: """If you wanted to factor out a helper function that terminated the generator you'd have to do "return @@ -235,6 +266,31 @@ to find the end marker in the inner loop, which will now raise ``RuntimeError``). +This effect of ``StopIteration`` has been used to cut a generator +expression short, creating a form of ``takewhile``:: + + def stop(): + raise StopIteration + print(list(x for x in range(10) if x < 5 or stop())) + # prints [0, 1, 2, 3, 4] + +Under the current proposal, this form of non-local flow control is +not supported, and would have to be rewritten in statement form:: + + def gen(): + for x in range(10): + if x >= 5: return + yield x + print(list(gen())) + # prints [0, 1, 2, 3, 4] + +While this is a small loss of functionality, it is functionality that +often comes at the cost of readability, and just as ``lambda`` has +restrictions compared to ``def``, so does a generator expression have +restrictions compared to a generator function. In many cases, the +transformation to full generator function will be trivially easy, and +may improve structural clarity. + Explanation of generators, iterators, and StopIteration ======================================================= @@ -330,7 +386,7 @@ return statement. The inspiration for this alternative proposal was Nick's observation -[7]_ that if an ``asyncio`` coroutine [8]_ accidentally raises +[8]_ that if an ``asyncio`` coroutine [9]_ accidentally raises ``StopIteration``, it currently terminates silently, which may present a hard-to-debug mystery to the developer. The main proposal turns such accidents into clearly distinguishable ``RuntimeError`` exceptions, @@ -367,7 +423,7 @@ Converting the exception inside next() -------------------------------------- -Mark Shannon suggested [11]_ that the problem could be solved in +Mark Shannon suggested [12]_ that the problem could be solved in ``next()`` rather than at the boundary of generator functions. By having ``next()`` catch ``StopIteration`` and raise instead ``ValueError``, all unexpected ``StopIteration`` bubbling would be @@ -384,11 +440,11 @@ ========= Unofficial and apocryphal statistics suggest that this is seldom, if -ever, a problem. [4]_ Code does exist which relies on the current -behaviour (e.g. [2]_, [5]_, [6]_), and there is the concern that this +ever, a problem. 
[5]_ Code does exist which relies on the current +behaviour (e.g. [3]_, [6]_, [7]_), and there is the concern that this would be unnecessary code churn to achieve little or no gain. -Steven D'Aprano started an informal survey on comp.lang.python [9]_; +Steven D'Aprano started an informal survey on comp.lang.python [10]_; at the time of writing only two responses have been received: one was in favor of changing list comprehensions to match generator expressions (!), the other was in favor of this PEP's main proposal. @@ -411,37 +467,40 @@ References ========== -.. [1] Initial mailing list comment +.. [1] PEP 380 - Syntax for Delegating to a Subgenerator + (https://www.python.org/dev/peps/pep-0380) + +.. [2] Initial mailing list comment (https://mail.python.org/pipermail/python-ideas/2014-November/029906.html) -.. [2] Pure Python implementation of groupby +.. [3] Pure Python implementation of groupby (https://docs.python.org/3/library/itertools.html#itertools.groupby) -.. [3] Proposal by GvR +.. [4] Proposal by GvR (https://mail.python.org/pipermail/python-ideas/2014-November/029953.html) -.. [4] Response by Steven D'Aprano +.. [5] Response by Steven D'Aprano (https://mail.python.org/pipermail/python-ideas/2014-November/029994.html) -.. [5] Split a sequence or generator using a predicate +.. [6] Split a sequence or generator using a predicate (http://code.activestate.com/recipes/578416-split-a-sequence-or-generator-using-a-predicate/) -.. [6] wrap unbounded generator to restrict its output +.. [7] wrap unbounded generator to restrict its output (http://code.activestate.com/recipes/66427-wrap-unbounded-generator-to-restrict-its-output/) -.. [7] Post from Nick Coghlan mentioning asyncio +.. [8] Post from Nick Coghlan mentioning asyncio (https://mail.python.org/pipermail/python-ideas/2014-November/029961.html) -.. [8] Coroutines in asyncio +.. [9] Coroutines in asyncio (https://docs.python.org/3/library/asyncio-task.html#coroutines) -.. [9] Thread on comp.lang.python started by Steven D'Aprano +.. [10] Thread on comp.lang.python started by Steven D'Aprano (https://mail.python.org/pipermail/python-list/2014-November/680757.html) -.. [10] Tracker issue with Proof-of-Concept patch +.. [11] Tracker issue with Proof-of-Concept patch (http://bugs.python.org/issue22906) -.. [11] Post from Mark Shannon with alternate proposal +.. 
[12] Post from Mark Shannon with alternate proposal (https://mail.python.org/pipermail/python-dev/2014-November/137129.html) Copyright -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Thu Nov 27 10:35:11 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Thu, 27 Nov 2014 10:35:11 +0100 Subject: [Python-checkins] Daily reference leaks (c8bcede1b37a): sum=3 Message-ID: results for c8bcede1b37a on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogNSqzH_', '-x'] From python-checkins at python.org Thu Nov 27 15:54:55 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 14:54:55 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322609=3A_Constructors_and_update_methods_of_map?= =?utf-8?q?ping_classes_in_the?= Message-ID: <20141127145452.69793.1999@psf.io> https://hg.python.org/cpython/rev/88ab046fdd8a changeset: 93620:88ab046fdd8a parent: 93617:1c97f373fe49 parent: 93619:816c15fe5812 user: Serhiy Storchaka date: Thu Nov 27 16:35:26 2014 +0200 summary: Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. files: Lib/_collections_abc.py | 35 ++++++------ Lib/collections/__init__.py | 47 ++++++++++++++--- Lib/test/test_collections.py | 64 ++++++++++++++++++++++- Misc/NEWS | 3 + 4 files changed, 121 insertions(+), 28 deletions(-) diff --git a/Lib/_collections_abc.py b/Lib/_collections_abc.py --- a/Lib/_collections_abc.py +++ b/Lib/_collections_abc.py @@ -592,23 +592,24 @@ If E present and lacks .keys() method, does: for (k, v) in E: D[k] = v In either case, this is followed by: for k, v in F.items(): D[k] = v ''' - if len(args) > 2: - raise TypeError("update() takes at most 2 positional " - "arguments ({} given)".format(len(args))) - elif not args: - raise TypeError("update() takes at least 1 argument (0 given)") - self = args[0] - other = args[1] if len(args) >= 2 else () - - if isinstance(other, Mapping): - for key in other: - self[key] = other[key] - elif hasattr(other, "keys"): - for key in other.keys(): - self[key] = other[key] - else: - for key, value in other: - self[key] = value + if not args: + raise TypeError("descriptor 'update' of 'MutableMapping' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('update expected at most 1 arguments, got %d' % + len(args)) + if args: + other = args[0] + if isinstance(other, Mapping): + for key in other: + self[key] = other[key] + elif hasattr(other, "keys"): + for key in other.keys(): + self[key] = other[key] + else: + for key, value in other: + self[key] = value for key, value in kwds.items(): self[key] = value diff --git a/Lib/collections/__init__.py b/Lib/collections/__init__.py --- a/Lib/collections/__init__.py +++ b/Lib/collections/__init__.py @@ -55,12 +55,16 @@ # Individual links are kept alive by the hard reference in self.__map. # Those hard references disappear when a key is deleted from an OrderedDict. - def __init__(self, *args, **kwds): + def __init__(*args, **kwds): '''Initialize an ordered dictionary. The signature is the same as regular dictionaries, but keyword arguments are not recommended because their insertion order is arbitrary. 
''' + if not args: + raise TypeError("descriptor '__init__' of 'OrderedDict' object " + "needs an argument") + self, *args = args if len(args) > 1: raise TypeError('expected at most 1 arguments, got %d' % len(args)) try: @@ -479,7 +483,7 @@ # http://code.activestate.com/recipes/259174/ # Knuth, TAOCP Vol. II section 4.6.3 - def __init__(self, iterable=None, **kwds): + def __init__(*args, **kwds): '''Create a new, empty Counter object. And if given, count elements from an input iterable. Or, initialize the count from another mapping of elements to their counts. @@ -490,8 +494,14 @@ >>> c = Counter(a=4, b=2) # a new counter from keyword args ''' - super().__init__() - self.update(iterable, **kwds) + if not args: + raise TypeError("descriptor '__init__' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + super(Counter, self).__init__() + self.update(*args, **kwds) def __missing__(self, key): 'The count of elements not in the Counter is zero.' @@ -542,7 +552,7 @@ raise NotImplementedError( 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.') - def update(self, iterable=None, **kwds): + def update(*args, **kwds): '''Like dict.update() but add counts instead of replacing them. Source can be an iterable, a dictionary, or another Counter instance. @@ -562,6 +572,13 @@ # contexts. Instead, we implement straight-addition. Both the inputs # and outputs are allowed to contain zero and negative counts. + if not args: + raise TypeError("descriptor 'update' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: if isinstance(iterable, Mapping): if self: @@ -569,13 +586,13 @@ for elem, count in iterable.items(): self[elem] = count + self_get(elem, 0) else: - super().update(iterable) # fast path when counter is empty + super(Counter, self).update(iterable) # fast path when counter is empty else: _count_elements(self, iterable) if kwds: self.update(kwds) - def subtract(self, iterable=None, **kwds): + def subtract(*args, **kwds): '''Like dict.update() but subtracts counts instead of replacing them. Counts can be reduced below zero. Both the inputs and outputs are allowed to contain zero and negative counts. 
@@ -591,6 +608,13 @@ -1 ''' + if not args: + raise TypeError("descriptor 'subtract' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: self_get = self.get if isinstance(iterable, Mapping): @@ -898,7 +922,14 @@ class UserDict(MutableMapping): # Start by filling-out the abstract methods - def __init__(self, dict=None, **kwargs): + def __init__(*args, **kwargs): + if not args: + raise TypeError("descriptor '__init__' of 'UserDict' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + dict = args[0] if args else None self.data = {} if dict is not None: self.update(dict) diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -1137,6 +1137,28 @@ self.assertEqual(c.setdefault('e', 5), 5) self.assertEqual(c['e'], 5) + def test_init(self): + self.assertEqual(list(Counter(self=42).items()), [('self', 42)]) + self.assertEqual(list(Counter(iterable=42).items()), [('iterable', 42)]) + self.assertEqual(list(Counter(iterable=None).items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter, 42) + self.assertRaises(TypeError, Counter, (), ()) + self.assertRaises(TypeError, Counter.__init__) + + def test_update(self): + c = Counter() + c.update(self=42) + self.assertEqual(list(c.items()), [('self', 42)]) + c = Counter() + c.update(iterable=42) + self.assertEqual(list(c.items()), [('iterable', 42)]) + c = Counter() + c.update(iterable=None) + self.assertEqual(list(c.items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter().update, 42) + self.assertRaises(TypeError, Counter().update, {}, {}) + self.assertRaises(TypeError, Counter.update) + def test_copying(self): # Check that counters are copyable, deepcopyable, picklable, and #have a repr/eval round-trip @@ -1258,6 +1280,16 @@ c.subtract('aaaabbcce') self.assertEqual(c, Counter(a=-1, b=0, c=-1, d=1, e=-1)) + c = Counter() + c.subtract(self=42) + self.assertEqual(list(c.items()), [('self', -42)]) + c = Counter() + c.subtract(iterable=42) + self.assertEqual(list(c.items()), [('iterable', -42)]) + self.assertRaises(TypeError, Counter().subtract, 42) + self.assertRaises(TypeError, Counter().subtract, {}, {}) + self.assertRaises(TypeError, Counter.subtract) + def test_unary(self): c = Counter(a=-5, b=0, c=5, d=10, e=15,g=40) self.assertEqual(dict(+c), dict(c=5, d=10, e=15, g=40)) @@ -1308,8 +1340,11 @@ c=3, e=5).items()), pairs) # mixed input # make sure no positional args conflict with possible kwdargs - self.assertEqual(inspect.getargspec(OrderedDict.__dict__['__init__']).args, - ['self']) + self.assertEqual(list(OrderedDict(self=42).items()), [('self', 42)]) + self.assertEqual(list(OrderedDict(other=42).items()), [('other', 42)]) + self.assertRaises(TypeError, OrderedDict, 42) + self.assertRaises(TypeError, OrderedDict, (), ()) + self.assertRaises(TypeError, OrderedDict.__init__) # Make sure that direct calls to __init__ do not clear previous contents d = OrderedDict([('a', 1), ('b', 2), ('c', 3), ('d', 44), ('e', 55)]) @@ -1354,6 +1389,10 @@ self.assertEqual(list(d.items()), [('a', 1), ('b', 2), ('c', 3), ('d', 4), ('e', 5), ('f', 6), ('g', 7)]) + self.assertRaises(TypeError, OrderedDict().update, 42) + self.assertRaises(TypeError, OrderedDict().update, (), ()) + 
self.assertRaises(TypeError, OrderedDict.update) + def test_abc(self): self.assertIsInstance(OrderedDict(), MutableMapping) self.assertTrue(issubclass(OrderedDict, MutableMapping)) @@ -1600,6 +1639,24 @@ d = self._empty_mapping() self.assertRaises(KeyError, d.popitem) +class TestUserDict(unittest.TestCase): + + def test_init(self): + self.assertEqual(list(UserDict(self=42).items()), [('self', 42)]) + self.assertEqual(list(UserDict(dict=42).items()), [('dict', 42)]) + self.assertEqual(list(UserDict(dict=None).items()), [('dict', None)]) + self.assertRaises(TypeError, UserDict, 42) + self.assertRaises(TypeError, UserDict, (), ()) + self.assertRaises(TypeError, UserDict.__init__) + + def test_update(self): + d = UserDict() + d.update(self=42) + self.assertEqual(list(d.items()), [('self', 42)]) + self.assertRaises(TypeError, UserDict().update, 42) + self.assertRaises(TypeError, UserDict().update, {}, {}) + self.assertRaises(TypeError, UserDict.update) + ################################################################################ ### Run tests @@ -1611,7 +1668,8 @@ NamedTupleDocs = doctest.DocTestSuite(module=collections) test_classes = [TestNamedTuple, NamedTupleDocs, TestOneTrickPonyABCs, TestCollectionABCs, TestCounter, TestChainMap, - TestOrderedDict, GeneralMappingTests, SubclassMappingTests] + TestOrderedDict, GeneralMappingTests, SubclassMappingTests, + TestUserDict,] support.run_unittest(*test_classes) support.run_doctest(collections, verbose) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,9 @@ Library ------- +- Issue #22609: Constructors and update methods of mapping classes in the + collections module now accept the self keyword argument. + - Issue #22940: Add readline.append_history_file. - Issue #19676: Added the "namereplace" error handler. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 15:54:54 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 14:54:54 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjA5?= =?utf-8?q?=3A_Constructors_and_update_methods_of_mapping_classes_in_the?= Message-ID: <20141127145452.69789.53068@psf.io> https://hg.python.org/cpython/rev/816c15fe5812 changeset: 93619:816c15fe5812 branch: 3.4 parent: 93616:589c65dc528c user: Serhiy Storchaka date: Thu Nov 27 16:25:51 2014 +0200 summary: Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. 
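The effect of the change can be seen in the new tests in the diff below; a short sketch, assuming the patched collections module, of keyword names that previously collided with the positional parameters::

    from collections import Counter, OrderedDict

    # 'self' and 'iterable' are now ordinary keys instead of clashing with
    # the method's own parameters.
    print(OrderedDict(self=42))      # OrderedDict([('self', 42)])
    print(Counter(iterable=3))       # Counter({'iterable': 3})

    c = Counter()
    c.update(self=1, other=2)        # formerly a TypeError for 'self'
    print(sorted(c.items()))         # [('other', 2), ('self', 1)]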
files: Lib/_collections_abc.py | 35 ++++++------ Lib/collections/__init__.py | 47 ++++++++++++++--- Lib/test/test_collections.py | 64 ++++++++++++++++++++++- Misc/NEWS | 3 + 4 files changed, 121 insertions(+), 28 deletions(-) diff --git a/Lib/_collections_abc.py b/Lib/_collections_abc.py --- a/Lib/_collections_abc.py +++ b/Lib/_collections_abc.py @@ -584,23 +584,24 @@ If E present and lacks .keys() method, does: for (k, v) in E: D[k] = v In either case, this is followed by: for k, v in F.items(): D[k] = v ''' - if len(args) > 2: - raise TypeError("update() takes at most 2 positional " - "arguments ({} given)".format(len(args))) - elif not args: - raise TypeError("update() takes at least 1 argument (0 given)") - self = args[0] - other = args[1] if len(args) >= 2 else () - - if isinstance(other, Mapping): - for key in other: - self[key] = other[key] - elif hasattr(other, "keys"): - for key in other.keys(): - self[key] = other[key] - else: - for key, value in other: - self[key] = value + if not args: + raise TypeError("descriptor 'update' of 'MutableMapping' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('update expected at most 1 arguments, got %d' % + len(args)) + if args: + other = args[0] + if isinstance(other, Mapping): + for key in other: + self[key] = other[key] + elif hasattr(other, "keys"): + for key in other.keys(): + self[key] = other[key] + else: + for key, value in other: + self[key] = value for key, value in kwds.items(): self[key] = value diff --git a/Lib/collections/__init__.py b/Lib/collections/__init__.py --- a/Lib/collections/__init__.py +++ b/Lib/collections/__init__.py @@ -38,12 +38,16 @@ # Individual links are kept alive by the hard reference in self.__map. # Those hard references disappear when a key is deleted from an OrderedDict. - def __init__(self, *args, **kwds): + def __init__(*args, **kwds): '''Initialize an ordered dictionary. The signature is the same as regular dictionaries, but keyword arguments are not recommended because their insertion order is arbitrary. ''' + if not args: + raise TypeError("descriptor '__init__' of 'OrderedDict' object " + "needs an argument") + self, *args = args if len(args) > 1: raise TypeError('expected at most 1 arguments, got %d' % len(args)) try: @@ -450,7 +454,7 @@ # http://code.activestate.com/recipes/259174/ # Knuth, TAOCP Vol. II section 4.6.3 - def __init__(self, iterable=None, **kwds): + def __init__(*args, **kwds): '''Create a new, empty Counter object. And if given, count elements from an input iterable. Or, initialize the count from another mapping of elements to their counts. @@ -461,8 +465,14 @@ >>> c = Counter(a=4, b=2) # a new counter from keyword args ''' - super().__init__() - self.update(iterable, **kwds) + if not args: + raise TypeError("descriptor '__init__' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + super(Counter, self).__init__() + self.update(*args, **kwds) def __missing__(self, key): 'The count of elements not in the Counter is zero.' @@ -513,7 +523,7 @@ raise NotImplementedError( 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.') - def update(self, iterable=None, **kwds): + def update(*args, **kwds): '''Like dict.update() but add counts instead of replacing them. Source can be an iterable, a dictionary, or another Counter instance. @@ -533,6 +543,13 @@ # contexts. Instead, we implement straight-addition. 
Both the inputs # and outputs are allowed to contain zero and negative counts. + if not args: + raise TypeError("descriptor 'update' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: if isinstance(iterable, Mapping): if self: @@ -540,13 +557,13 @@ for elem, count in iterable.items(): self[elem] = count + self_get(elem, 0) else: - super().update(iterable) # fast path when counter is empty + super(Counter, self).update(iterable) # fast path when counter is empty else: _count_elements(self, iterable) if kwds: self.update(kwds) - def subtract(self, iterable=None, **kwds): + def subtract(*args, **kwds): '''Like dict.update() but subtracts counts instead of replacing them. Counts can be reduced below zero. Both the inputs and outputs are allowed to contain zero and negative counts. @@ -562,6 +579,13 @@ -1 ''' + if not args: + raise TypeError("descriptor 'subtract' of 'Counter' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: self_get = self.get if isinstance(iterable, Mapping): @@ -869,7 +893,14 @@ class UserDict(MutableMapping): # Start by filling-out the abstract methods - def __init__(self, dict=None, **kwargs): + def __init__(*args, **kwargs): + if not args: + raise TypeError("descriptor '__init__' of 'UserDict' object " + "needs an argument") + self, *args = args + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + dict = args[0] if args else None self.data = {} if dict is not None: self.update(dict) diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -1084,6 +1084,28 @@ self.assertEqual(c.setdefault('e', 5), 5) self.assertEqual(c['e'], 5) + def test_init(self): + self.assertEqual(list(Counter(self=42).items()), [('self', 42)]) + self.assertEqual(list(Counter(iterable=42).items()), [('iterable', 42)]) + self.assertEqual(list(Counter(iterable=None).items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter, 42) + self.assertRaises(TypeError, Counter, (), ()) + self.assertRaises(TypeError, Counter.__init__) + + def test_update(self): + c = Counter() + c.update(self=42) + self.assertEqual(list(c.items()), [('self', 42)]) + c = Counter() + c.update(iterable=42) + self.assertEqual(list(c.items()), [('iterable', 42)]) + c = Counter() + c.update(iterable=None) + self.assertEqual(list(c.items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter().update, 42) + self.assertRaises(TypeError, Counter().update, {}, {}) + self.assertRaises(TypeError, Counter.update) + def test_copying(self): # Check that counters are copyable, deepcopyable, picklable, and #have a repr/eval round-trip @@ -1205,6 +1227,16 @@ c.subtract('aaaabbcce') self.assertEqual(c, Counter(a=-1, b=0, c=-1, d=1, e=-1)) + c = Counter() + c.subtract(self=42) + self.assertEqual(list(c.items()), [('self', -42)]) + c = Counter() + c.subtract(iterable=42) + self.assertEqual(list(c.items()), [('iterable', -42)]) + self.assertRaises(TypeError, Counter().subtract, 42) + self.assertRaises(TypeError, Counter().subtract, {}, {}) + self.assertRaises(TypeError, Counter.subtract) + def test_unary(self): c = Counter(a=-5, b=0, c=5, d=10, e=15,g=40) self.assertEqual(dict(+c), 
dict(c=5, d=10, e=15, g=40)) @@ -1255,8 +1287,11 @@ c=3, e=5).items()), pairs) # mixed input # make sure no positional args conflict with possible kwdargs - self.assertEqual(inspect.getargspec(OrderedDict.__dict__['__init__']).args, - ['self']) + self.assertEqual(list(OrderedDict(self=42).items()), [('self', 42)]) + self.assertEqual(list(OrderedDict(other=42).items()), [('other', 42)]) + self.assertRaises(TypeError, OrderedDict, 42) + self.assertRaises(TypeError, OrderedDict, (), ()) + self.assertRaises(TypeError, OrderedDict.__init__) # Make sure that direct calls to __init__ do not clear previous contents d = OrderedDict([('a', 1), ('b', 2), ('c', 3), ('d', 44), ('e', 55)]) @@ -1301,6 +1336,10 @@ self.assertEqual(list(d.items()), [('a', 1), ('b', 2), ('c', 3), ('d', 4), ('e', 5), ('f', 6), ('g', 7)]) + self.assertRaises(TypeError, OrderedDict().update, 42) + self.assertRaises(TypeError, OrderedDict().update, (), ()) + self.assertRaises(TypeError, OrderedDict.update) + def test_abc(self): self.assertIsInstance(OrderedDict(), MutableMapping) self.assertTrue(issubclass(OrderedDict, MutableMapping)) @@ -1532,6 +1571,24 @@ d = self._empty_mapping() self.assertRaises(KeyError, d.popitem) +class TestUserDict(unittest.TestCase): + + def test_init(self): + self.assertEqual(list(UserDict(self=42).items()), [('self', 42)]) + self.assertEqual(list(UserDict(dict=42).items()), [('dict', 42)]) + self.assertEqual(list(UserDict(dict=None).items()), [('dict', None)]) + self.assertRaises(TypeError, UserDict, 42) + self.assertRaises(TypeError, UserDict, (), ()) + self.assertRaises(TypeError, UserDict.__init__) + + def test_update(self): + d = UserDict() + d.update(self=42) + self.assertEqual(list(d.items()), [('self', 42)]) + self.assertRaises(TypeError, UserDict().update, 42) + self.assertRaises(TypeError, UserDict().update, {}, {}) + self.assertRaises(TypeError, UserDict.update) + ################################################################################ ### Run tests @@ -1543,7 +1600,8 @@ NamedTupleDocs = doctest.DocTestSuite(module=collections) test_classes = [TestNamedTuple, NamedTupleDocs, TestOneTrickPonyABCs, TestCollectionABCs, TestCounter, TestChainMap, - TestOrderedDict, GeneralMappingTests, SubclassMappingTests] + TestOrderedDict, GeneralMappingTests, SubclassMappingTests, + TestUserDict,] support.run_unittest(*test_classes) support.run_doctest(collections, verbose) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22609: Constructors and update methods of mapping classes in the + collections module now accept the self keyword argument. + - Issue #22788: Add *context* parameter to logging.handlers.HTTPHandler. - Issue #22921: Allow SSLContext to take the *hostname* parameter even if -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 16:50:52 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 15:50:52 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322609=3A_Revert_changes_in_UserDict=2E_They_con?= =?utf-8?q?flicted_with_existing_tests=2E?= Message-ID: <20141127155048.84277.87297@psf.io> https://hg.python.org/cpython/rev/167d51a54de2 changeset: 93622:167d51a54de2 parent: 93620:88ab046fdd8a parent: 93621:cd1ead4feddf user: Serhiy Storchaka date: Thu Nov 27 17:46:15 2014 +0200 summary: Issue #22609: Revert changes in UserDict. They conflicted with existing tests. 
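The revert restores the historical signature ``__init__(self, dict=None, **kwargs)``, so the ``dict`` keyword keeps naming the initial mapping instead of becoming a stored key. A sketch of the preserved behaviour (illustrative only; it relies on the unchanged remainder of ``UserDict.__init__`` that is not shown in the diff)::

    from collections import UserDict

    d = UserDict(dict={'a': 1})
    print(d.data)                 # {'a': 1}, used as the initializer

    e = UserDict(a=1, b=2)
    print(sorted(e.data))         # ['a', 'b'], other keywords become keys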
files: Lib/collections/__init__.py | 9 +-------- Lib/test/test_collections.py | 21 +-------------------- 2 files changed, 2 insertions(+), 28 deletions(-) diff --git a/Lib/collections/__init__.py b/Lib/collections/__init__.py --- a/Lib/collections/__init__.py +++ b/Lib/collections/__init__.py @@ -922,14 +922,7 @@ class UserDict(MutableMapping): # Start by filling-out the abstract methods - def __init__(*args, **kwargs): - if not args: - raise TypeError("descriptor '__init__' of 'UserDict' object " - "needs an argument") - self, *args = args - if len(args) > 1: - raise TypeError('expected at most 1 arguments, got %d' % len(args)) - dict = args[0] if args else None + def __init__(self, dict=None, **kwargs): self.data = {} if dict is not None: self.update(dict) diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -1639,24 +1639,6 @@ d = self._empty_mapping() self.assertRaises(KeyError, d.popitem) -class TestUserDict(unittest.TestCase): - - def test_init(self): - self.assertEqual(list(UserDict(self=42).items()), [('self', 42)]) - self.assertEqual(list(UserDict(dict=42).items()), [('dict', 42)]) - self.assertEqual(list(UserDict(dict=None).items()), [('dict', None)]) - self.assertRaises(TypeError, UserDict, 42) - self.assertRaises(TypeError, UserDict, (), ()) - self.assertRaises(TypeError, UserDict.__init__) - - def test_update(self): - d = UserDict() - d.update(self=42) - self.assertEqual(list(d.items()), [('self', 42)]) - self.assertRaises(TypeError, UserDict().update, 42) - self.assertRaises(TypeError, UserDict().update, {}, {}) - self.assertRaises(TypeError, UserDict.update) - ################################################################################ ### Run tests @@ -1668,8 +1650,7 @@ NamedTupleDocs = doctest.DocTestSuite(module=collections) test_classes = [TestNamedTuple, NamedTupleDocs, TestOneTrickPonyABCs, TestCollectionABCs, TestCounter, TestChainMap, - TestOrderedDict, GeneralMappingTests, SubclassMappingTests, - TestUserDict,] + TestOrderedDict, GeneralMappingTests, SubclassMappingTests] support.run_unittest(*test_classes) support.run_doctest(collections, verbose) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 16:50:52 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 15:50:52 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjA5?= =?utf-8?q?=3A_Revert_changes_in_UserDict=2E_They_conflicted_with_existing?= =?utf-8?q?_tests=2E?= Message-ID: <20141127155048.69799.16536@psf.io> https://hg.python.org/cpython/rev/cd1ead4feddf changeset: 93621:cd1ead4feddf branch: 3.4 parent: 93619:816c15fe5812 user: Serhiy Storchaka date: Thu Nov 27 17:45:44 2014 +0200 summary: Issue #22609: Revert changes in UserDict. They conflicted with existing tests. 
files: Lib/collections/__init__.py | 9 +-------- Lib/test/test_collections.py | 21 +-------------------- 2 files changed, 2 insertions(+), 28 deletions(-) diff --git a/Lib/collections/__init__.py b/Lib/collections/__init__.py --- a/Lib/collections/__init__.py +++ b/Lib/collections/__init__.py @@ -893,14 +893,7 @@ class UserDict(MutableMapping): # Start by filling-out the abstract methods - def __init__(*args, **kwargs): - if not args: - raise TypeError("descriptor '__init__' of 'UserDict' object " - "needs an argument") - self, *args = args - if len(args) > 1: - raise TypeError('expected at most 1 arguments, got %d' % len(args)) - dict = args[0] if args else None + def __init__(self, dict=None, **kwargs): self.data = {} if dict is not None: self.update(dict) diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -1571,24 +1571,6 @@ d = self._empty_mapping() self.assertRaises(KeyError, d.popitem) -class TestUserDict(unittest.TestCase): - - def test_init(self): - self.assertEqual(list(UserDict(self=42).items()), [('self', 42)]) - self.assertEqual(list(UserDict(dict=42).items()), [('dict', 42)]) - self.assertEqual(list(UserDict(dict=None).items()), [('dict', None)]) - self.assertRaises(TypeError, UserDict, 42) - self.assertRaises(TypeError, UserDict, (), ()) - self.assertRaises(TypeError, UserDict.__init__) - - def test_update(self): - d = UserDict() - d.update(self=42) - self.assertEqual(list(d.items()), [('self', 42)]) - self.assertRaises(TypeError, UserDict().update, 42) - self.assertRaises(TypeError, UserDict().update, {}, {}) - self.assertRaises(TypeError, UserDict.update) - ################################################################################ ### Run tests @@ -1600,8 +1582,7 @@ NamedTupleDocs = doctest.DocTestSuite(module=collections) test_classes = [TestNamedTuple, NamedTupleDocs, TestOneTrickPonyABCs, TestCollectionABCs, TestCounter, TestChainMap, - TestOrderedDict, GeneralMappingTests, SubclassMappingTests, - TestUserDict,] + TestOrderedDict, GeneralMappingTests, SubclassMappingTests] support.run_unittest(*test_classes) support.run_doctest(collections, verbose) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 18:05:28 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 17:05:28 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyNjA5?= =?utf-8?q?=3A_Constructors_and_update_methods_of_mapping_classes_in_the?= Message-ID: <20141127170510.84283.88391@psf.io> https://hg.python.org/cpython/rev/3dfe4f0c626b changeset: 93623:3dfe4f0c626b branch: 2.7 parent: 93618:ac65f90c1214 user: Serhiy Storchaka date: Thu Nov 27 19:02:56 2014 +0200 summary: Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. 
files: Lib/_abcoll.py | 34 ++++++++++-------- Lib/collections.py | 38 ++++++++++++++++++-- Lib/test/test_collections.py | 43 ++++++++++++++++++++++- Misc/NEWS | 3 + 4 files changed, 95 insertions(+), 23 deletions(-) diff --git a/Lib/_abcoll.py b/Lib/_abcoll.py --- a/Lib/_abcoll.py +++ b/Lib/_abcoll.py @@ -548,23 +548,25 @@ If E present and lacks .keys() method, does: for (k, v) in E: D[k] = v In either case, this is followed by: for k, v in F.items(): D[k] = v ''' - if len(args) > 2: - raise TypeError("update() takes at most 2 positional " - "arguments ({} given)".format(len(args))) - elif not args: - raise TypeError("update() takes at least 1 argument (0 given)") + if not args: + raise TypeError("descriptor 'update' of 'MutableMapping' object " + "needs an argument") self = args[0] - other = args[1] if len(args) >= 2 else () - - if isinstance(other, Mapping): - for key in other: - self[key] = other[key] - elif hasattr(other, "keys"): - for key in other.keys(): - self[key] = other[key] - else: - for key, value in other: - self[key] = value + args = args[1:] + if len(args) > 1: + raise TypeError('update expected at most 1 arguments, got %d' % + len(args)) + if args: + other = args[0] + if isinstance(other, Mapping): + for key in other: + self[key] = other[key] + elif hasattr(other, "keys"): + for key in other.keys(): + self[key] = other[key] + else: + for key, value in other: + self[key] = value for key, value in kwds.items(): self[key] = value diff --git a/Lib/collections.py b/Lib/collections.py --- a/Lib/collections.py +++ b/Lib/collections.py @@ -35,12 +35,17 @@ # The sentinel element never gets deleted (this simplifies the algorithm). # Each link is stored as a list of length three: [PREV, NEXT, KEY]. - def __init__(self, *args, **kwds): + def __init__(*args, **kwds): '''Initialize an ordered dictionary. The signature is the same as regular dictionaries, but keyword arguments are not recommended because their insertion order is arbitrary. ''' + if not args: + raise TypeError("descriptor '__init__' of 'OrderedDict' object " + "needs an argument") + self = args[0] + args = args[1:] if len(args) > 1: raise TypeError('expected at most 1 arguments, got %d' % len(args)) try: @@ -438,7 +443,7 @@ # http://code.activestate.com/recipes/259174/ # Knuth, TAOCP Vol. II section 4.6.3 - def __init__(self, iterable=None, **kwds): + def __init__(*args, **kwds): '''Create a new, empty Counter object. And if given, count elements from an input iterable. Or, initialize the count from another mapping of elements to their counts. @@ -449,8 +454,15 @@ >>> c = Counter(a=4, b=2) # a new counter from keyword args ''' + if not args: + raise TypeError("descriptor '__init__' of 'Counter' object " + "needs an argument") + self = args[0] + args = args[1:] + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) super(Counter, self).__init__() - self.update(iterable, **kwds) + self.update(*args, **kwds) def __missing__(self, key): 'The count of elements not in the Counter is zero.' @@ -501,7 +513,7 @@ raise NotImplementedError( 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.') - def update(self, iterable=None, **kwds): + def update(*args, **kwds): '''Like dict.update() but add counts instead of replacing them. Source can be an iterable, a dictionary, or another Counter instance. @@ -521,6 +533,14 @@ # contexts. Instead, we implement straight-addition. Both the inputs # and outputs are allowed to contain zero and negative counts. 
+ if not args: + raise TypeError("descriptor 'update' of 'Counter' object " + "needs an argument") + self = args[0] + args = args[1:] + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: if isinstance(iterable, Mapping): if self: @@ -536,7 +556,7 @@ if kwds: self.update(kwds) - def subtract(self, iterable=None, **kwds): + def subtract(*args, **kwds): '''Like dict.update() but subtracts counts instead of replacing them. Counts can be reduced below zero. Both the inputs and outputs are allowed to contain zero and negative counts. @@ -552,6 +572,14 @@ -1 ''' + if not args: + raise TypeError("descriptor 'subtract' of 'Counter' object " + "needs an argument") + self = args[0] + args = args[1:] + if len(args) > 1: + raise TypeError('expected at most 1 arguments, got %d' % len(args)) + iterable = args[0] if args else None if iterable is not None: self_get = self.get if isinstance(iterable, Mapping): diff --git a/Lib/test/test_collections.py b/Lib/test/test_collections.py --- a/Lib/test/test_collections.py +++ b/Lib/test/test_collections.py @@ -905,6 +905,28 @@ self.assertEqual(c.setdefault('e', 5), 5) self.assertEqual(c['e'], 5) + def test_init(self): + self.assertEqual(list(Counter(self=42).items()), [('self', 42)]) + self.assertEqual(list(Counter(iterable=42).items()), [('iterable', 42)]) + self.assertEqual(list(Counter(iterable=None).items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter, 42) + self.assertRaises(TypeError, Counter, (), ()) + self.assertRaises(TypeError, Counter.__init__) + + def test_update(self): + c = Counter() + c.update(self=42) + self.assertEqual(list(c.items()), [('self', 42)]) + c = Counter() + c.update(iterable=42) + self.assertEqual(list(c.items()), [('iterable', 42)]) + c = Counter() + c.update(iterable=None) + self.assertEqual(list(c.items()), [('iterable', None)]) + self.assertRaises(TypeError, Counter().update, 42) + self.assertRaises(TypeError, Counter().update, {}, {}) + self.assertRaises(TypeError, Counter.update) + def test_copying(self): # Check that counters are copyable, deepcopyable, picklable, and #have a repr/eval round-trip @@ -1006,6 +1028,16 @@ c.subtract('aaaabbcce') self.assertEqual(c, Counter(a=-1, b=0, c=-1, d=1, e=-1)) + c = Counter() + c.subtract(self=42) + self.assertEqual(list(c.items()), [('self', -42)]) + c = Counter() + c.subtract(iterable=42) + self.assertEqual(list(c.items()), [('iterable', -42)]) + self.assertRaises(TypeError, Counter().subtract, 42) + self.assertRaises(TypeError, Counter().subtract, {}, {}) + self.assertRaises(TypeError, Counter.subtract) + class TestOrderedDict(unittest.TestCase): def test_init(self): @@ -1019,8 +1051,11 @@ c=3, e=5).items()), pairs) # mixed input # make sure no positional args conflict with possible kwdargs - self.assertEqual(inspect.getargspec(OrderedDict.__dict__['__init__']).args, - ['self']) + self.assertEqual(list(OrderedDict(self=42).items()), [('self', 42)]) + self.assertEqual(list(OrderedDict(other=42).items()), [('other', 42)]) + self.assertRaises(TypeError, OrderedDict, 42) + self.assertRaises(TypeError, OrderedDict, (), ()) + self.assertRaises(TypeError, OrderedDict.__init__) # Make sure that direct calls to __init__ do not clear previous contents d = OrderedDict([('a', 1), ('b', 2), ('c', 3), ('d', 44), ('e', 55)]) @@ -1065,6 +1100,10 @@ self.assertEqual(list(d.items()), [('a', 1), ('b', 2), ('c', 3), ('d', 4), ('e', 5), ('f', 6), ('g', 7)]) + self.assertRaises(TypeError, 
OrderedDict().update, 42) + self.assertRaises(TypeError, OrderedDict().update, (), ()) + self.assertRaises(TypeError, OrderedDict.update) + def test_abc(self): self.assertIsInstance(OrderedDict(), MutableMapping) self.assertTrue(issubclass(OrderedDict, MutableMapping)) diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -13,6 +13,9 @@ Library ------- +- Issue #22609: Constructors and update methods of mapping classes in the + collections module now accept the self keyword argument. + What's New in Python 2.7.9 release candidate 1? =============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 18:51:14 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 17:51:14 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2321514=3A_The_documentation_of_the_json_module_n?= =?utf-8?q?ow_refers_to_new_JSON_RFC?= Message-ID: <20141127175113.69789.83438@psf.io> https://hg.python.org/cpython/rev/aced2548345a changeset: 93626:aced2548345a parent: 93622:167d51a54de2 parent: 93625:89bb4384f1e1 user: Serhiy Storchaka date: Thu Nov 27 19:45:31 2014 +0200 summary: Issue #21514: The documentation of the json module now refers to new JSON RFC 7159 instead of obsoleted RFC 4627. files: Doc/library/json.rst | 111 ++++++++++++++++++++---------- Misc/NEWS | 3 + 2 files changed, 75 insertions(+), 39 deletions(-) diff --git a/Doc/library/json.rst b/Doc/library/json.rst --- a/Doc/library/json.rst +++ b/Doc/library/json.rst @@ -7,9 +7,11 @@ .. sectionauthor:: Bob Ippolito `JSON (JavaScript Object Notation) `_, specified by -:rfc:`4627`, is a lightweight data interchange format based on a subset of -`JavaScript `_ syntax (`ECMA-262 3rd -edition `_). +:rfc:`7159` (which obsoletes :rfc:`4627`) and by +`ECMA-404 `_, +is a lightweight data interchange format inspired by +`JavaScript `_ object literal syntax +(although it is not a strict subset of JavaScript [#rfc-errata]_ ). :mod:`json` exposes an API familiar to users of the standard library :mod:`marshal` and :mod:`pickle` modules. @@ -467,18 +469,18 @@ mysocket.write(chunk) -Standard Compliance -------------------- +Standard Compliance and Interoperability +---------------------------------------- -The JSON format is specified by :rfc:`4627`. This section details this -module's level of compliance with the RFC. For simplicity, -:class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and parameters other -than those explicitly mentioned, are not considered. +The JSON format is specified by :rfc:`7159` and by +`ECMA-404 `_. +This section details this module's level of compliance with the RFC. +For simplicity, :class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and +parameters other than those explicitly mentioned, are not considered. This module does not comply with the RFC in a strict fashion, implementing some extensions that are valid JavaScript but not valid JSON. In particular: -- Top-level non-object, non-array values are accepted and output; - Infinite and NaN number values are accepted and output; - Repeated names within an object are accepted, and only the value of the last name-value pair is used. @@ -490,8 +492,8 @@ Character Encodings ^^^^^^^^^^^^^^^^^^^ -The RFC recommends that JSON be represented using either UTF-8, UTF-16, or -UTF-32, with UTF-8 being the default. 
+The RFC requires that JSON be represented using either UTF-8, UTF-16, or +UTF-32, with UTF-8 being the recommended default for maximum interoperability. As permitted, though not required, by the RFC, this module's serializer sets *ensure_ascii=True* by default, thus escaping the output so that the resulting @@ -499,34 +501,20 @@ Other than the *ensure_ascii* parameter, this module is defined strictly in terms of conversion between Python objects and -:class:`Unicode strings `, and thus does not otherwise address the issue -of character encodings. +:class:`Unicode strings `, and thus does not otherwise directly address +the issue of character encodings. +The RFC prohibits adding a byte order mark (BOM) to the start of a JSON text, +and this module's serializer does not add a BOM to its output. +The RFC permits, but does not require, JSON deserializers to ignore an initial +BOM in their input. This module's deserializer raises a :exc:`ValueError` +when an initial BOM is present. -Top-level Non-Object, Non-Array Values -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -The RFC specifies that the top-level value of a JSON text must be either a -JSON object or array (Python :class:`dict` or :class:`list`). This module's -deserializer also accepts input texts consisting solely of a -JSON null, boolean, number, or string value:: - - >>> just_a_json_string = '"spam and eggs"' # Not by itself a valid JSON text - >>> json.loads(just_a_json_string) - 'spam and eggs' - -This module itself does not include a way to request that such input texts be -regarded as illegal. Likewise, this module's serializer also accepts single -Python :data:`None`, :class:`bool`, numeric, and :class:`str` -values as input and will generate output texts consisting solely of a top-level -JSON null, boolean, number, or string value without raising an exception:: - - >>> neither_a_list_nor_a_dict = "spam and eggs" - >>> json.dumps(neither_a_list_nor_a_dict) # The result is not a valid JSON text - '"spam and eggs"' - -This module's serializer does not itself include a way to enforce the -aforementioned constraint. +The RFC does not explicitly forbid JSON strings which contain byte sequences +that don't correspond to valid Unicode characters (e.g. unpaired UTF-16 +surrogates), but it does note that they may cause interoperability problems. +By default, this module accepts and outputs (when present in the original +:class:`str`) codepoints for such sequences. Infinite and NaN Number Values @@ -556,7 +544,7 @@ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ The RFC specifies that the names within a JSON object should be unique, but -does not specify how repeated names in JSON objects should be handled. By +does not mandate how repeated names in JSON objects should be handled. By default, this module does not raise an exception; instead, it ignores all but the last name-value pair for a given name:: @@ -566,6 +554,42 @@ The *object_pairs_hook* parameter can be used to alter this behavior. + +Top-level Non-Object, Non-Array Values +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The old version of JSON specified by the obsolete :rfc:`4627` required that +the top-level value of a JSON text must be either a JSON object or array +(Python :class:`dict` or :class:`list`), and could not be a JSON null, +boolean, number, or string value. :rfc:`7159` removed that restriction, and +this module does not and has never implemented that restriction in either its +serializer or its deserializer. 
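As a small, hedged illustration of the paragraph above (plain use of the json module; nothing beyond what the rewritten documentation states):

    import json

    # Under RFC 7159 a bare string, number, boolean or null is itself a valid
    # JSON text; the module serializes and parses such values directly.
    assert json.dumps("spam and eggs") == '"spam and eggs"'
    assert json.loads('"spam and eggs"') == 'spam and eggs'
    assert json.loads('3.14') == 3.14
    assert json.loads('null') is None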
+ +Regardless, for maximum interoperability, you may wish to voluntarily adhere +to the restriction yourself. + + +Implementation Limitations +^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Some JSON deserializer implementations may set limits on: + +* the size of accepted JSON texts +* the maximum level of nesting of JSON objects and arrays +* the range and precision of JSON numbers +* the content and maximum length of JSON strings + +This module does not impose any such limits beyond those of the relevant +Python datatypes themselves or the Python interpreter itself. + +When serializing to JSON, beware any such limitations in applications that may +consume your JSON. In particular, it is common for JSON numbers to be +deserialized into IEEE 754 double precision numbers and thus subject to that +representation's range and precision limitations. This is especially relevant +when serializing Python :class:`int` values of extremely large magnitude, or +when serializing instances of "exotic" numerical types such as +:class:`decimal.Decimal`. + .. highlight:: bash .. module:: json.tool @@ -627,3 +651,12 @@ .. cmdoption:: -h, --help Show the help message. + + +.. rubric:: Footnotes + +.. [#rfc-errata] As noted in `the errata for RFC 7159 + `_, + JSON permits literal U+2028 (LINE SEPARATOR) and + U+2029 (PARAGRAPH SEPARATOR) characters in strings, whereas JavaScript + (as of ECMAScript Edition 5.1) does not. diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -1300,6 +1300,9 @@ Documentation ------------- +- Issue #21514: The documentation of the json module now refers to new JSON RFC + 7159 instead of obsoleted RFC 4627. + - Issue #21777: The binary sequence methods on bytes and bytearray are now documented explicitly, rather than assuming users will be able to derive the expected behaviour from the behaviour of the corresponding str methods. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 18:51:14 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 17:51:14 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIxNTE0?= =?utf-8?q?=3A_The_documentation_of_the_json_module_now_refers_to_new_JSON?= =?utf-8?q?_RFC?= Message-ID: <20141127175113.116320.51790@psf.io> https://hg.python.org/cpython/rev/89bb4384f1e1 changeset: 93625:89bb4384f1e1 branch: 3.4 parent: 93621:cd1ead4feddf user: Serhiy Storchaka date: Thu Nov 27 19:41:47 2014 +0200 summary: Issue #21514: The documentation of the json module now refers to new JSON RFC 7159 instead of obsoleted RFC 4627. files: Doc/library/json.rst | 111 ++++++++++++++++++++---------- Misc/NEWS | 6 + 2 files changed, 78 insertions(+), 39 deletions(-) diff --git a/Doc/library/json.rst b/Doc/library/json.rst --- a/Doc/library/json.rst +++ b/Doc/library/json.rst @@ -7,9 +7,11 @@ .. sectionauthor:: Bob Ippolito `JSON (JavaScript Object Notation) `_, specified by -:rfc:`4627`, is a lightweight data interchange format based on a subset of -`JavaScript `_ syntax (`ECMA-262 3rd -edition `_). +:rfc:`7159` (which obsoletes :rfc:`4627`) and by +`ECMA-404 `_, +is a lightweight data interchange format inspired by +`JavaScript `_ object literal syntax +(although it is not a strict subset of JavaScript [#rfc-errata]_ ). :mod:`json` exposes an API familiar to users of the standard library :mod:`marshal` and :mod:`pickle` modules. 
@@ -465,18 +467,18 @@ mysocket.write(chunk) -Standard Compliance -------------------- +Standard Compliance and Interoperability +---------------------------------------- -The JSON format is specified by :rfc:`4627`. This section details this -module's level of compliance with the RFC. For simplicity, -:class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and parameters other -than those explicitly mentioned, are not considered. +The JSON format is specified by :rfc:`7159` and by +`ECMA-404 `_. +This section details this module's level of compliance with the RFC. +For simplicity, :class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and +parameters other than those explicitly mentioned, are not considered. This module does not comply with the RFC in a strict fashion, implementing some extensions that are valid JavaScript but not valid JSON. In particular: -- Top-level non-object, non-array values are accepted and output; - Infinite and NaN number values are accepted and output; - Repeated names within an object are accepted, and only the value of the last name-value pair is used. @@ -488,8 +490,8 @@ Character Encodings ^^^^^^^^^^^^^^^^^^^ -The RFC recommends that JSON be represented using either UTF-8, UTF-16, or -UTF-32, with UTF-8 being the default. +The RFC requires that JSON be represented using either UTF-8, UTF-16, or +UTF-32, with UTF-8 being the recommended default for maximum interoperability. As permitted, though not required, by the RFC, this module's serializer sets *ensure_ascii=True* by default, thus escaping the output so that the resulting @@ -497,34 +499,20 @@ Other than the *ensure_ascii* parameter, this module is defined strictly in terms of conversion between Python objects and -:class:`Unicode strings `, and thus does not otherwise address the issue -of character encodings. +:class:`Unicode strings `, and thus does not otherwise directly address +the issue of character encodings. +The RFC prohibits adding a byte order mark (BOM) to the start of a JSON text, +and this module's serializer does not add a BOM to its output. +The RFC permits, but does not require, JSON deserializers to ignore an initial +BOM in their input. This module's deserializer raises a :exc:`ValueError` +when an initial BOM is present. -Top-level Non-Object, Non-Array Values -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -The RFC specifies that the top-level value of a JSON text must be either a -JSON object or array (Python :class:`dict` or :class:`list`). This module's -deserializer also accepts input texts consisting solely of a -JSON null, boolean, number, or string value:: - - >>> just_a_json_string = '"spam and eggs"' # Not by itself a valid JSON text - >>> json.loads(just_a_json_string) - 'spam and eggs' - -This module itself does not include a way to request that such input texts be -regarded as illegal. Likewise, this module's serializer also accepts single -Python :data:`None`, :class:`bool`, numeric, and :class:`str` -values as input and will generate output texts consisting solely of a top-level -JSON null, boolean, number, or string value without raising an exception:: - - >>> neither_a_list_nor_a_dict = "spam and eggs" - >>> json.dumps(neither_a_list_nor_a_dict) # The result is not a valid JSON text - '"spam and eggs"' - -This module's serializer does not itself include a way to enforce the -aforementioned constraint. +The RFC does not explicitly forbid JSON strings which contain byte sequences +that don't correspond to valid Unicode characters (e.g. 
unpaired UTF-16 +surrogates), but it does note that they may cause interoperability problems. +By default, this module accepts and outputs (when present in the original +:class:`str`) codepoints for such sequences. Infinite and NaN Number Values @@ -554,7 +542,7 @@ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ The RFC specifies that the names within a JSON object should be unique, but -does not specify how repeated names in JSON objects should be handled. By +does not mandate how repeated names in JSON objects should be handled. By default, this module does not raise an exception; instead, it ignores all but the last name-value pair for a given name:: @@ -563,3 +551,48 @@ {'x': 3} The *object_pairs_hook* parameter can be used to alter this behavior. + + +Top-level Non-Object, Non-Array Values +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The old version of JSON specified by the obsolete :rfc:`4627` required that +the top-level value of a JSON text must be either a JSON object or array +(Python :class:`dict` or :class:`list`), and could not be a JSON null, +boolean, number, or string value. :rfc:`7159` removed that restriction, and +this module does not and has never implemented that restriction in either its +serializer or its deserializer. + +Regardless, for maximum interoperability, you may wish to voluntarily adhere +to the restriction yourself. + + +Implementation Limitations +^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Some JSON deserializer implementations may set limits on: + +* the size of accepted JSON texts +* the maximum level of nesting of JSON objects and arrays +* the range and precision of JSON numbers +* the content and maximum length of JSON strings + +This module does not impose any such limits beyond those of the relevant +Python datatypes themselves or the Python interpreter itself. + +When serializing to JSON, beware any such limitations in applications that may +consume your JSON. In particular, it is common for JSON numbers to be +deserialized into IEEE 754 double precision numbers and thus subject to that +representation's range and precision limitations. This is especially relevant +when serializing Python :class:`int` values of extremely large magnitude, or +when serializing instances of "exotic" numerical types such as +:class:`decimal.Decimal`. + + +.. rubric:: Footnotes + +.. [#rfc-errata] As noted in `the errata for RFC 7159 + `_, + JSON permits literal U+2028 (LINE SEPARATOR) and + U+2029 (PARAGRAPH SEPARATOR) characters in strings, whereas JavaScript + (as of ECMAScript Edition 5.1) does not. diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -175,6 +175,12 @@ - Issue #17219: Add library build dir for Python extension cross-builds. +Documentation +------------- + +- Issue #21514: The documentation of the json module now refers to new JSON RFC + 7159 instead of obsoleted RFC 4627. 
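To make the warning in the new "Implementation Limitations" subsection concrete, here is a hedged sketch of what a consumer that maps JSON numbers to IEEE 754 doubles would see; the float() round-trip below merely stands in for such a consumer, while the json module itself keeps Python ints exact:

    import json

    big = 2**60 + 1                  # exceeds the 53-bit mantissa of a double
    text = json.dumps(big)           # '1152921504606846977' -- exact
    assert json.loads(text) == big   # parsed back as an exact Python int

    # A double-based consumer silently loses the low bits:
    assert float(text) == 2.0**60
    assert int(float(text)) != big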
+ Windows ------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 18:51:14 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 17:51:14 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIxNTE0?= =?utf-8?q?=3A_The_documentation_of_the_json_module_now_refers_to_new_JSON?= =?utf-8?q?_RFC?= Message-ID: <20141127175112.116332.77812@psf.io> https://hg.python.org/cpython/rev/7e534e18a99a changeset: 93624:7e534e18a99a branch: 2.7 user: Serhiy Storchaka date: Thu Nov 27 19:41:34 2014 +0200 summary: Issue #21514: The documentation of the json module now refers to new JSON RFC 7159 instead of obsoleted RFC 4627. files: Doc/library/json.rst | 113 +++++++++++++++++++----------- Misc/NEWS | 6 + 2 files changed, 77 insertions(+), 42 deletions(-) diff --git a/Doc/library/json.rst b/Doc/library/json.rst --- a/Doc/library/json.rst +++ b/Doc/library/json.rst @@ -8,9 +8,11 @@ .. versionadded:: 2.6 `JSON (JavaScript Object Notation) `_, specified by -:rfc:`4627`, is a lightweight data interchange format based on a subset of -`JavaScript `_ syntax (`ECMA-262 3rd -edition `_). +:rfc:`7159` (which obsoletes :rfc:`4627`) and by +`ECMA-404 `_, +is a lightweight data interchange format inspired by +`JavaScript `_ object literal syntax +(although it is not a strict subset of JavaScript [#rfc-errata]_ ). :mod:`json` exposes an API familiar to users of the standard library :mod:`marshal` and :mod:`pickle` modules. @@ -485,18 +487,18 @@ mysocket.write(chunk) -Standard Compliance -------------------- +Standard Compliance and Interoperability +---------------------------------------- -The JSON format is specified by :rfc:`4627`. This section details this -module's level of compliance with the RFC. For simplicity, -:class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and parameters other -than those explicitly mentioned, are not considered. +The JSON format is specified by :rfc:`7159` and by +`ECMA-404 `_. +This section details this module's level of compliance with the RFC. +For simplicity, :class:`JSONEncoder` and :class:`JSONDecoder` subclasses, and +parameters other than those explicitly mentioned, are not considered. This module does not comply with the RFC in a strict fashion, implementing some extensions that are valid JavaScript but not valid JSON. In particular: -- Top-level non-object, non-array values are accepted and output; - Infinite and NaN number values are accepted and output; - Repeated names within an object are accepted, and only the value of the last name-value pair is used. @@ -508,48 +510,30 @@ Character Encodings ^^^^^^^^^^^^^^^^^^^ -The RFC recommends that JSON be represented using either UTF-8, UTF-16, or -UTF-32, with UTF-8 being the default. Accordingly, this module uses UTF-8 as -the default for its *encoding* parameter. +The RFC requires that JSON be represented using either UTF-8, UTF-16, or +UTF-32, with UTF-8 being the recommended default for maximum interoperability. +Accordingly, this module uses UTF-8 as the default for its *encoding* parameter. This module's deserializer only directly works with ASCII-compatible encodings; UTF-16, UTF-32, and other ASCII-incompatible encodings require the use of workarounds described in the documentation for the deserializer's *encoding* parameter. -The RFC also non-normatively describes a limited encoding detection technique -for JSON texts; this module's deserializer does not implement this or any other -kind of encoding detection. 
- As permitted, though not required, by the RFC, this module's serializer sets *ensure_ascii=True* by default, thus escaping the output so that the resulting strings only contain ASCII characters. +The RFC prohibits adding a byte order mark (BOM) to the start of a JSON text, +and this module's serializer does not add a BOM to its output. +The RFC permits, but does not require, JSON deserializers to ignore an initial +BOM in their input. This module's deserializer raises a :exc:`ValueError` +when an initial BOM is present. -Top-level Non-Object, Non-Array Values -^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ - -The RFC specifies that the top-level value of a JSON text must be either a -JSON object or array (Python :class:`dict` or :class:`list`). This module's -deserializer also accepts input texts consisting solely of a -JSON null, boolean, number, or string value:: - - >>> just_a_json_string = '"spam and eggs"' # Not by itself a valid JSON text - >>> json.loads(just_a_json_string) - u'spam and eggs' - -This module itself does not include a way to request that such input texts be -regarded as illegal. Likewise, this module's serializer also accepts single -Python :data:`None`, :class:`bool`, numeric, and :class:`str` -values as input and will generate output texts consisting solely of a top-level -JSON null, boolean, number, or string value without raising an exception:: - - >>> neither_a_list_nor_a_dict = u"spam and eggs" - >>> json.dumps(neither_a_list_nor_a_dict) # The result is not a valid JSON text - '"spam and eggs"' - -This module's serializer does not itself include a way to enforce the -aforementioned constraint. +The RFC does not explicitly forbid JSON strings which contain byte sequences +that don't correspond to valid Unicode characters (e.g. unpaired UTF-16 +surrogates), but it does note that they may cause interoperability problems. +By default, this module accepts and outputs (when present in the original +:class:`str`) codepoints for such sequences. Infinite and NaN Number Values @@ -579,7 +563,7 @@ ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ The RFC specifies that the names within a JSON object should be unique, but -does not specify how repeated names in JSON objects should be handled. By +does not mandate how repeated names in JSON objects should be handled. By default, this module does not raise an exception; instead, it ignores all but the last name-value pair for a given name:: @@ -588,3 +572,48 @@ {u'x': 3} The *object_pairs_hook* parameter can be used to alter this behavior. + + +Top-level Non-Object, Non-Array Values +^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ + +The old version of JSON specified by the obsolete :rfc:`4627` required that +the top-level value of a JSON text must be either a JSON object or array +(Python :class:`dict` or :class:`list`), and could not be a JSON null, +boolean, number, or string value. :rfc:`7159` removed that restriction, and +this module does not and has never implemented that restriction in either its +serializer or its deserializer. + +Regardless, for maximum interoperability, you may wish to voluntarily adhere +to the restriction yourself. 
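A brief, hedged sketch of the repeated-names behaviour described above and of using *object_pairs_hook* to override it (standard json API only; the same code runs on 2.7 and 3.x):

    import json

    weird_json = '{"x": 1, "x": 2, "x": 3}'

    # Default behaviour: the last name-value pair silently wins.
    assert json.loads(weird_json) == {'x': 3}

    # object_pairs_hook receives every pair, so duplicates can be rejected.
    def reject_duplicates(pairs):
        seen = {}
        for key, value in pairs:
            if key in seen:
                raise ValueError('duplicate key: %r' % key)
            seen[key] = value
        return seen

    try:
        json.loads(weird_json, object_pairs_hook=reject_duplicates)
    except ValueError:
        pass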
+ + +Implementation Limitations +^^^^^^^^^^^^^^^^^^^^^^^^^^ + +Some JSON deserializer implementations may set limits on: + +* the size of accepted JSON texts +* the maximum level of nesting of JSON objects and arrays +* the range and precision of JSON numbers +* the content and maximum length of JSON strings + +This module does not impose any such limits beyond those of the relevant +Python datatypes themselves or the Python interpreter itself. + +When serializing to JSON, beware any such limitations in applications that may +consume your JSON. In particular, it is common for JSON numbers to be +deserialized into IEEE 754 double precision numbers and thus subject to that +representation's range and precision limitations. This is especially relevant +when serializing Python :class:`int` values of extremely large magnitude, or +when serializing instances of "exotic" numerical types such as +:class:`decimal.Decimal`. + + +.. rubric:: Footnotes + +.. [#rfc-errata] As noted in `the errata for RFC 7159 + `_, + JSON permits literal U+2028 (LINE SEPARATOR) and + U+2029 (PARAGRAPH SEPARATOR) characters in strings, whereas JavaScript + (as of ECMAScript Edition 5.1) does not. diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -16,6 +16,12 @@ - Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. +Documentation +------------- + +- Issue #21514: The documentation of the json module now refers to new JSON RFC + 7159 instead of obsoleted RFC 4627. + What's New in Python 2.7.9 release candidate 1? =============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 21:17:10 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 20:17:10 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyOTE1?= =?utf-8?q?=3A_SAX_parser_now_supports_files_opened_with_file_descriptor_o?= =?utf-8?q?r?= Message-ID: <20141127201700.84279.1868@psf.io> https://hg.python.org/cpython/rev/27ae1a476ef7 changeset: 93627:27ae1a476ef7 branch: 3.4 parent: 93625:89bb4384f1e1 user: Serhiy Storchaka date: Thu Nov 27 22:13:16 2014 +0200 summary: Issue #22915: SAX parser now supports files opened with file descriptor or bytes path. 
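A hedged sketch of the call patterns this change enables (the file name and content are invented for illustration; the point is that a binary stream whose .name is an int or bytes no longer confuses the system-id handling in saxutils.prepare_input_source):

    import os
    import xml.sax
    from xml.sax.handler import ContentHandler

    with open('doc.xml', 'w') as f:        # hypothetical test document
        f.write('<root><child/></root>')

    handler = ContentHandler()             # no-op handler; we only parse

    # Bytes path: open the file under its os.fsencode()d name.
    with open(os.fsencode('doc.xml'), 'rb') as f:
        xml.sax.parse(f, handler)

    # File descriptor: f2.name is an int, which previously tripped up the parser.
    with open('doc.xml', 'rb') as f:
        with open(f.fileno(), 'rb', closefd=False) as f2:
            xml.sax.parse(f2, handler)

    os.remove('doc.xml')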
files: Lib/test/test_sax.py | 24 ++++++++++++++++++++++++ Lib/xml/sax/saxutils.py | 2 +- Misc/NEWS | 3 +++ 3 files changed, 28 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_sax.py b/Lib/test/test_sax.py --- a/Lib/test/test_sax.py +++ b/Lib/test/test_sax.py @@ -648,6 +648,30 @@ self.assertEqual(result.getvalue(), xml_test_out) + def test_expat_binary_file_bytes_name(self): + fname = os.fsencode(TEST_XMLFILE) + parser = create_parser() + result = BytesIO() + xmlgen = XMLGenerator(result) + + parser.setContentHandler(xmlgen) + with open(fname, 'rb') as f: + parser.parse(f) + + self.assertEqual(result.getvalue(), xml_test_out) + + def test_expat_binary_file_int_name(self): + parser = create_parser() + result = BytesIO() + xmlgen = XMLGenerator(result) + + parser.setContentHandler(xmlgen) + with open(TEST_XMLFILE, 'rb') as f: + with open(f.fileno(), 'rb', closefd=False) as f2: + parser.parse(f2) + + self.assertEqual(result.getvalue(), xml_test_out) + # ===== DTDHandler support class TestDTDHandler: diff --git a/Lib/xml/sax/saxutils.py b/Lib/xml/sax/saxutils.py --- a/Lib/xml/sax/saxutils.py +++ b/Lib/xml/sax/saxutils.py @@ -346,7 +346,7 @@ f = source source = xmlreader.InputSource() source.setByteStream(f) - if hasattr(f, "name"): + if hasattr(f, "name") and isinstance(f.name, str): source.setSystemId(f.name) if source.getByteStream() is None: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,9 @@ Library ------- +- Issue #22915: SAX parser now supports files opened with file descriptor or + bytes path. + - Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 21:17:10 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 20:17:10 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322915=3A_SAX_parser_now_supports_files_opened_w?= =?utf-8?q?ith_file_descriptor_or?= Message-ID: <20141127201700.126772.97775@psf.io> https://hg.python.org/cpython/rev/ce9881eecfb4 changeset: 93628:ce9881eecfb4 parent: 93626:aced2548345a parent: 93627:27ae1a476ef7 user: Serhiy Storchaka date: Thu Nov 27 22:14:30 2014 +0200 summary: Issue #22915: SAX parser now supports files opened with file descriptor or bytes path. 
files: Lib/test/test_sax.py | 24 ++++++++++++++++++++++++ Lib/xml/sax/saxutils.py | 2 +- Misc/NEWS | 3 +++ 3 files changed, 28 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_sax.py b/Lib/test/test_sax.py --- a/Lib/test/test_sax.py +++ b/Lib/test/test_sax.py @@ -648,6 +648,30 @@ self.assertEqual(result.getvalue(), xml_test_out) + def test_expat_binary_file_bytes_name(self): + fname = os.fsencode(TEST_XMLFILE) + parser = create_parser() + result = BytesIO() + xmlgen = XMLGenerator(result) + + parser.setContentHandler(xmlgen) + with open(fname, 'rb') as f: + parser.parse(f) + + self.assertEqual(result.getvalue(), xml_test_out) + + def test_expat_binary_file_int_name(self): + parser = create_parser() + result = BytesIO() + xmlgen = XMLGenerator(result) + + parser.setContentHandler(xmlgen) + with open(TEST_XMLFILE, 'rb') as f: + with open(f.fileno(), 'rb', closefd=False) as f2: + parser.parse(f2) + + self.assertEqual(result.getvalue(), xml_test_out) + # ===== DTDHandler support class TestDTDHandler: diff --git a/Lib/xml/sax/saxutils.py b/Lib/xml/sax/saxutils.py --- a/Lib/xml/sax/saxutils.py +++ b/Lib/xml/sax/saxutils.py @@ -346,7 +346,7 @@ f = source source = xmlreader.InputSource() source.setByteStream(f) - if hasattr(f, "name"): + if hasattr(f, "name") and isinstance(f.name, str): source.setSystemId(f.name) if source.getByteStream() is None: diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,9 @@ Library ------- +- Issue #22915: SAX parser now supports files opened with file descriptor or + bytes path. + - Issue #22609: Constructors and update methods of mapping classes in the collections module now accept the self keyword argument. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:15:45 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:15:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzE4OTA1?= =?utf-8?q?=3A_=22pydoc_-p_0=22_now_outputs_actually_used_port=2E__Based_o?= =?utf-8?q?n_patch_by?= Message-ID: <20141127221544.55107.24130@psf.io> https://hg.python.org/cpython/rev/ac7f3161aa53 changeset: 93629:ac7f3161aa53 branch: 2.7 parent: 93624:7e534e18a99a user: Serhiy Storchaka date: Thu Nov 27 23:45:37 2014 +0200 summary: Issue #18905: "pydoc -p 0" now outputs actually used port. Based on patch by Wieland Hoffmann. files: Lib/pydoc.py | 8 +++++--- Misc/NEWS | 6 ++++++ 2 files changed, 11 insertions(+), 3 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -17,7 +17,8 @@ of all available modules. Run "pydoc -p " to start an HTTP server on a given port on the -local machine to generate documentation web pages. +local machine to generate documentation web pages. Port number 0 can be +used to get an arbitrary unused port. For platforms without a command line, "pydoc -g" starts the HTTP server and also pops up a little window for controlling it. @@ -2098,7 +2099,6 @@ def __init__(self, port, callback): host = 'localhost' self.address = (host, port) - self.url = 'http://%s:%d/' % (host, port) self.callback = callback self.base.__init__(self, self.address, self.handler) @@ -2111,6 +2111,7 @@ def server_activate(self): self.base.server_activate(self) + self.url = 'http://%s:%d/' % (self.address[0], self.server_port) if self.callback: self.callback(self) DocServer.base = BaseHTTPServer.HTTPServer @@ -2384,7 +2385,8 @@ Search for a keyword in the synopsis lines of all available modules. 
%s -p - Start an HTTP server on the given port on the local machine. + Start an HTTP server on the given port on the local machine. Port + number 0 can be used to get an arbitrary unused port. %s -g Pop up a graphical interface for finding and serving documentation. diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -22,6 +22,12 @@ - Issue #21514: The documentation of the json module now refers to new JSON RFC 7159 instead of obsoleted RFC 4627. +Tools/Demos +----------- + +- Issue #18905: "pydoc -p 0" now outputs actually used port. Based on patch by + Wieland Hoffmann. + What's New in Python 2.7.9 release candidate 1? =============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:15:45 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:15:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyMzE0?= =?utf-8?q?=3A_pydoc_now_works_when_the_LINES_environment_variable_is_set?= =?utf-8?q?=2E?= Message-ID: <20141127221544.126764.96834@psf.io> https://hg.python.org/cpython/rev/c6182a7e75fa changeset: 93631:c6182a7e75fa branch: 3.4 parent: 93627:27ae1a476ef7 user: Serhiy Storchaka date: Fri Nov 28 00:09:29 2014 +0200 summary: Issue #22314: pydoc now works when the LINES environment variable is set. files: Lib/pydoc.py | 10 ++++++++-- Misc/NEWS | 5 +++++ 2 files changed, 13 insertions(+), 2 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -1479,12 +1479,18 @@ old = tty.tcgetattr(fd) tty.setcbreak(fd) getchar = lambda: sys.stdin.read(1) - except (ImportError, AttributeError): + except (ImportError, AttributeError, io.UnsupportedOperation): tty = None getchar = lambda: sys.stdin.readline()[:-1][:1] try: - r = inc = os.environ.get('LINES', 25) - 1 + try: + h = int(os.environ.get('LINES', 0)) + except ValueError: + h = 0 + if h <= 1: + h = 25 + r = inc = h - 1 sys.stdout.write('\n'.join(lines[:inc]) + '\n') while lines[r:]: sys.stdout.write('-- more --') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -184,6 +184,11 @@ - Issue #21514: The documentation of the json module now refers to new JSON RFC 7159 instead of obsoleted RFC 4627. +Tools/Demos +----------- + +- Issue #22314: pydoc now works when the LINES environment variable is set. + Windows ------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:15:45 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:15:45 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIyMzE0?= =?utf-8?q?=3A_pydoc_now_works_when_the_LINES_environment_variable_is_set?= =?utf-8?q?=2E?= Message-ID: <20141127221544.55119.88976@psf.io> https://hg.python.org/cpython/rev/50808dffd0bb changeset: 93630:50808dffd0bb branch: 2.7 user: Serhiy Storchaka date: Fri Nov 28 00:09:05 2014 +0200 summary: Issue #22314: pydoc now works when the LINES environment variable is set. 
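The LINES bug reduces to subtracting an int from the string that os.environ returns; the patch replaces that with a defensive parse. A hedged, stand-alone sketch of the same pattern:

    import os

    def screen_height(default=25):
        # os.environ values are strings; the old code did
        # os.environ.get('LINES', 25) - 1, a TypeError whenever LINES is set.
        try:
            h = int(os.environ.get('LINES', 0))
        except ValueError:
            h = 0
        return h if h > 1 else default

    os.environ['LINES'] = '40'
    assert screen_height() == 40
    os.environ['LINES'] = 'bogus'
    assert screen_height() == 25
    del os.environ['LINES']
    assert screen_height() == 25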
files: Lib/pydoc.py | 8 +++++++- Misc/NEWS | 2 ++ 2 files changed, 9 insertions(+), 1 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -1446,7 +1446,13 @@ getchar = lambda: sys.stdin.readline()[:-1][:1] try: - r = inc = os.environ.get('LINES', 25) - 1 + try: + h = int(os.environ.get('LINES', 0)) + except ValueError: + h = 0 + if h <= 1: + h = 25 + r = inc = h - 1 sys.stdout.write(join(lines[:inc], '\n') + '\n') while lines[r:]: sys.stdout.write('-- more --') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -25,6 +25,8 @@ Tools/Demos ----------- +- Issue #22314: pydoc now works when the LINES environment variable is set. + - Issue #18905: "pydoc -p 0" now outputs actually used port. Based on patch by Wieland Hoffmann. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:15:47 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:15:47 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2322314=3A_pydoc_now_works_when_the_LINES_environ?= =?utf-8?q?ment_variable_is_set=2E?= Message-ID: <20141127221545.126780.80304@psf.io> https://hg.python.org/cpython/rev/c8adee8a0ccb changeset: 93632:c8adee8a0ccb parent: 93628:ce9881eecfb4 parent: 93631:c6182a7e75fa user: Serhiy Storchaka date: Fri Nov 28 00:11:07 2014 +0200 summary: Issue #22314: pydoc now works when the LINES environment variable is set. files: Lib/pydoc.py | 10 ++++++++-- Misc/NEWS | 5 +++++ 2 files changed, 13 insertions(+), 2 deletions(-) diff --git a/Lib/pydoc.py b/Lib/pydoc.py --- a/Lib/pydoc.py +++ b/Lib/pydoc.py @@ -1477,12 +1477,18 @@ old = tty.tcgetattr(fd) tty.setcbreak(fd) getchar = lambda: sys.stdin.read(1) - except (ImportError, AttributeError): + except (ImportError, AttributeError, io.UnsupportedOperation): tty = None getchar = lambda: sys.stdin.readline()[:-1][:1] try: - r = inc = os.environ.get('LINES', 25) - 1 + try: + h = int(os.environ.get('LINES', 0)) + except ValueError: + h = 0 + if h <= 1: + h = 25 + r = inc = h - 1 sys.stdout.write('\n'.join(lines[:inc]) + '\n') while lines[r:]: sys.stdout.write('-- more --') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -383,6 +383,11 @@ - Issue #17442: InteractiveInterpreter now displays the full chained traceback in its showtraceback method, to match the built in interactive interpreter. +Tools/Demos +----------- + +- Issue #22314: pydoc now works when the LINES environment variable is set. + - Issue #10510: distutils register and upload methods now use HTML standards compliant CRLF line endings. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:53:11 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:53:11 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2321280=3A_Fixed_a_bug_in_shutil=2Emake=5Farchive?= =?utf-8?q?=28=29_when_create_an_archive_of?= Message-ID: <20141127225311.84285.51159@psf.io> https://hg.python.org/cpython/rev/c605dcf9786f changeset: 93634:c605dcf9786f parent: 93632:c8adee8a0ccb parent: 93633:8fa9097eadcb user: Serhiy Storchaka date: Fri Nov 28 00:49:50 2014 +0200 summary: Issue #21280: Fixed a bug in shutil.make_archive() when create an archive of current directory in current directory. 
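The root cause here is that os.path.dirname() of a bare archive name is the empty string, which the old code then passed to os.makedirs(). A hedged sketch of the failure mode, the guarded pattern the patch uses, and the now-working call:

    import os
    import shutil
    import tempfile

    # dirname of a name with no directory part is '', which os.makedirs rejects.
    assert os.path.dirname('test.tar') == ''

    # The fix: only create the directory when there actually is one.
    archive_dir = os.path.dirname('test.tar')
    if archive_dir and not os.path.exists(archive_dir):
        os.makedirs(archive_dir)

    # With the patch, archiving the current directory from inside it works:
    tmp = tempfile.mkdtemp()
    old = os.getcwd()
    try:
        os.chdir(tmp)
        assert shutil.make_archive('test', 'tar') == 'test.tar'
        assert os.path.isfile('test.tar')
    finally:
        os.chdir(old)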
files: Lib/shutil.py | 4 ++-- Lib/test/test_shutil.py | 15 +++++++++++++++ 2 files changed, 17 insertions(+), 2 deletions(-) diff --git a/Lib/shutil.py b/Lib/shutil.py --- a/Lib/shutil.py +++ b/Lib/shutil.py @@ -617,7 +617,7 @@ archive_name = base_name + '.tar' + compress_ext.get(compress, '') archive_dir = os.path.dirname(archive_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: @@ -662,7 +662,7 @@ zip_filename = base_name + ".zip" archive_dir = os.path.dirname(base_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: diff --git a/Lib/test/test_shutil.py b/Lib/test/test_shutil.py --- a/Lib/test/test_shutil.py +++ b/Lib/test/test_shutil.py @@ -1132,6 +1132,21 @@ finally: unregister_archive_format('xxx') + def test_make_tarfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + with support.change_cwd(root_dir): + self.assertEqual(make_archive('test', 'tar'), 'test.tar') + self.assertTrue(os.path.isfile('test.tar')) + + @requires_zlib + def test_make_zipfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + with support.change_cwd(root_dir): + self.assertEqual(make_archive('test', 'zip'), 'test.zip') + self.assertTrue(os.path.isfile('test.zip')) + def test_register_archive_format(self): self.assertRaises(TypeError, register_archive_format, 'xxx', 1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:53:12 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:53:12 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMi43KTogSXNzdWUgIzIxMjgw?= =?utf-8?q?=3A_Fixed_a_bug_in_shutil=2Emake=5Farchive=28=29_when_create_an?= =?utf-8?q?_archive_of?= Message-ID: <20141127225311.55111.51849@psf.io> https://hg.python.org/cpython/rev/c7d45da654ee changeset: 93635:c7d45da654ee branch: 2.7 parent: 93630:50808dffd0bb user: Serhiy Storchaka date: Fri Nov 28 00:50:06 2014 +0200 summary: Issue #21280: Fixed a bug in shutil.make_archive() when create an archive of current directory in current directory. 
files: Lib/shutil.py | 4 ++-- Lib/test/test_shutil.py | 23 +++++++++++++++++++++++ 2 files changed, 25 insertions(+), 2 deletions(-) diff --git a/Lib/shutil.py b/Lib/shutil.py --- a/Lib/shutil.py +++ b/Lib/shutil.py @@ -362,7 +362,7 @@ archive_name = base_name + '.tar' + compress_ext.get(compress, '') archive_dir = os.path.dirname(archive_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: @@ -426,7 +426,7 @@ zip_filename = base_name + ".zip" archive_dir = os.path.dirname(base_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: diff --git a/Lib/test/test_shutil.py b/Lib/test/test_shutil.py --- a/Lib/test/test_shutil.py +++ b/Lib/test/test_shutil.py @@ -581,6 +581,29 @@ finally: unregister_archive_format('xxx') + def test_make_tarfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + saved_dir = os.getcwd() + try: + os.chdir(root_dir) + self.assertEqual(make_archive('test', 'tar'), 'test.tar') + self.assertTrue(os.path.isfile('test.tar')) + finally: + os.chdir(saved_dir) + + @unittest.skipUnless(zlib, "Requires zlib") + def test_make_zipfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + saved_dir = os.getcwd() + try: + os.chdir(root_dir) + self.assertEqual(make_archive('test', 'zip'), 'test.zip') + self.assertTrue(os.path.isfile('test.zip')) + finally: + os.chdir(saved_dir) + def test_register_archive_format(self): self.assertRaises(TypeError, register_archive_format, 'xxx', 1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Thu Nov 27 23:53:11 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Thu, 27 Nov 2014 22:53:11 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIxMjgw?= =?utf-8?q?=3A_Fixed_a_bug_in_shutil=2Emake=5Farchive=28=29_when_create_an?= =?utf-8?q?_archive_of?= Message-ID: <20141127225310.126784.44831@psf.io> https://hg.python.org/cpython/rev/8fa9097eadcb changeset: 93633:8fa9097eadcb branch: 3.4 parent: 93631:c6182a7e75fa user: Serhiy Storchaka date: Fri Nov 28 00:48:46 2014 +0200 summary: Issue #21280: Fixed a bug in shutil.make_archive() when create an archive of current directory in current directory. 
files: Lib/shutil.py | 4 ++-- Lib/test/test_shutil.py | 15 +++++++++++++++ 2 files changed, 17 insertions(+), 2 deletions(-) diff --git a/Lib/shutil.py b/Lib/shutil.py --- a/Lib/shutil.py +++ b/Lib/shutil.py @@ -600,7 +600,7 @@ archive_name = base_name + '.tar' + compress_ext.get(compress, '') archive_dir = os.path.dirname(archive_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: @@ -660,7 +660,7 @@ zip_filename = base_name + ".zip" archive_dir = os.path.dirname(base_name) - if not os.path.exists(archive_dir): + if archive_dir and not os.path.exists(archive_dir): if logger is not None: logger.info("creating %s", archive_dir) if not dry_run: diff --git a/Lib/test/test_shutil.py b/Lib/test/test_shutil.py --- a/Lib/test/test_shutil.py +++ b/Lib/test/test_shutil.py @@ -1126,6 +1126,21 @@ finally: unregister_archive_format('xxx') + def test_make_tarfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + with support.change_cwd(root_dir): + self.assertEqual(make_archive('test', 'tar'), 'test.tar') + self.assertTrue(os.path.isfile('test.tar')) + + @requires_zlib + def test_make_zipfile_in_curdir(self): + # Issue #21280 + root_dir = self.mkdtemp() + with support.change_cwd(root_dir): + self.assertEqual(make_archive('test', 'zip'), 'test.zip') + self.assertTrue(os.path.isfile('test.zip')) + def test_register_archive_format(self): self.assertRaises(TypeError, register_archive_format, 'xxx', 1) -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 03:41:54 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 28 Nov 2014 02:41:54 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_give_a_nice_me?= =?utf-8?q?ssage_when_installer_is_launched_w/o_admin_rights_=28closes_=23?= =?utf-8?q?16561=29?= Message-ID: <20141128024151.55125.76086@psf.io> https://hg.python.org/cpython/rev/caee1eabba1e changeset: 93638:caee1eabba1e branch: 3.4 parent: 93633:8fa9097eadcb user: Benjamin Peterson date: Thu Nov 27 20:39:02 2014 -0600 summary: give a nice message when installer is launched w/o admin rights (closes #16561) files: PC/bdist_wininst/install.c | 10 ++++++++++ 1 files changed, 10 insertions(+), 0 deletions(-) diff --git a/PC/bdist_wininst/install.c b/PC/bdist_wininst/install.c --- a/PC/bdist_wininst/install.c +++ b/PC/bdist_wininst/install.c @@ -1774,6 +1774,16 @@ sprintf(buffer, "%s\\%s-wininst.log", dir, meta_name); logfile = fopen(buffer, "a"); + if (!logfile) { + char error[1024]; + + sprintf(error, "Can't create \"%s\" (%s).\n\n" + "Try to execute the installer as administrator.", + buffer, strerror(errno)); + MessageBox(GetFocus(), error, NULL, MB_OK | MB_ICONSTOP); + return FALSE; + } + time(<ime); now = localtime(<ime); strftime(buffer, sizeof(buffer), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 03:41:54 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 28 Nov 2014 02:41:54 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMTY1NjEp?= Message-ID: <20141128024151.84285.17601@psf.io> https://hg.python.org/cpython/rev/ef5bbdc81796 changeset: 93639:ef5bbdc81796 parent: 93634:c605dcf9786f parent: 93638:caee1eabba1e user: Benjamin Peterson date: Thu Nov 27 20:41:36 2014 -0600 summary: merge 3.4 (#16561) files: PC/bdist_wininst/install.c | 10 ++++++++++ 1 files changed, 
10 insertions(+), 0 deletions(-) diff --git a/PC/bdist_wininst/install.c b/PC/bdist_wininst/install.c --- a/PC/bdist_wininst/install.c +++ b/PC/bdist_wininst/install.c @@ -1774,6 +1774,16 @@ sprintf(buffer, "%s\\%s-wininst.log", dir, meta_name); logfile = fopen(buffer, "a"); + if (!logfile) { + char error[1024]; + + sprintf(error, "Can't create \"%s\" (%s).\n\n" + "Try to execute the installer as administrator.", + buffer, strerror(errno)); + MessageBox(GetFocus(), error, NULL, MB_OK | MB_ICONSTOP); + return FALSE; + } + time(<ime); now = localtime(<ime); strftime(buffer, sizeof(buffer), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 03:41:54 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 28 Nov 2014 02:41:54 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMi43IC0+IDIuNyk6?= =?utf-8?q?_merge_2=2E7=2E9_release_branch?= Message-ID: <20141128024151.116316.5203@psf.io> https://hg.python.org/cpython/rev/713e5814640d changeset: 93637:713e5814640d branch: 2.7 parent: 93635:c7d45da654ee parent: 93636:1ac5aec658f6 user: Benjamin Peterson date: Thu Nov 27 20:40:35 2014 -0600 summary: merge 2.7.9 release branch files: PC/bdist_wininst/install.c | 10 ++++++++++ 1 files changed, 10 insertions(+), 0 deletions(-) diff --git a/PC/bdist_wininst/install.c b/PC/bdist_wininst/install.c --- a/PC/bdist_wininst/install.c +++ b/PC/bdist_wininst/install.c @@ -1742,6 +1742,16 @@ sprintf(buffer, "%s\\%s-wininst.log", dir, meta_name); logfile = fopen(buffer, "a"); + if (!logfile) { + char error[1024]; + + sprintf(error, "Can't create \"%s\" (%s).\n\n" + "Try to execute the installer as administrator.", + buffer, strerror(errno)); + MessageBox(GetFocus(), error, NULL, MB_OK | MB_ICONSTOP); + return FALSE; + } + time(<ime); now = localtime(<ime); strftime(buffer, sizeof(buffer), -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 03:41:54 2014 From: python-checkins at python.org (benjamin.peterson) Date: Fri, 28 Nov 2014 02:41:54 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_give_a_nice_me?= =?utf-8?q?ssage_when_installer_is_launched_w/o_admin_rights_=28closes_=23?= =?utf-8?q?16561=29?= Message-ID: <20141128024151.116314.73252@psf.io> https://hg.python.org/cpython/rev/1ac5aec658f6 changeset: 93636:1ac5aec658f6 branch: 2.7 parent: 93595:080dba0e66e4 user: Benjamin Peterson date: Thu Nov 27 20:39:02 2014 -0600 summary: give a nice message when installer is launched w/o admin rights (closes #16561) files: PC/bdist_wininst/install.c | 10 ++++++++++ 1 files changed, 10 insertions(+), 0 deletions(-) diff --git a/PC/bdist_wininst/install.c b/PC/bdist_wininst/install.c --- a/PC/bdist_wininst/install.c +++ b/PC/bdist_wininst/install.c @@ -1742,6 +1742,16 @@ sprintf(buffer, "%s\\%s-wininst.log", dir, meta_name); logfile = fopen(buffer, "a"); + if (!logfile) { + char error[1024]; + + sprintf(error, "Can't create \"%s\" (%s).\n\n" + "Try to execute the installer as administrator.", + buffer, strerror(errno)); + MessageBox(GetFocus(), error, NULL, MB_OK | MB_ICONSTOP); + return FALSE; + } + time(<ime); now = localtime(<ime); strftime(buffer, sizeof(buffer), -- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Fri Nov 28 10:32:01 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Fri, 28 Nov 2014 10:32:01 +0100 Subject: [Python-checkins] Daily reference leaks (c605dcf9786f): sum=58 Message-ID: results for c605dcf9786f on branch "default" 
-------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 test_multiprocessing_forkserver leaked [0, 38, 0] references, sum=38 test_multiprocessing_forkserver leaked [0, 17, 0] memory blocks, sum=17 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogjYWIIn', '-x'] From python-checkins at python.org Fri Nov 28 13:16:34 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 12:16:34 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbyBkb2M6?= =?utf-8?q?_explain_how_to_pass_keywords_to_callbacks_=28functools=2Eparti?= =?utf-8?b?YWwp?= Message-ID: <20141128121629.69779.42561@psf.io> https://hg.python.org/cpython/rev/8dacb1a21793 changeset: 93640:8dacb1a21793 branch: 3.4 parent: 93638:caee1eabba1e user: Victor Stinner date: Fri Nov 28 13:15:41 2014 +0100 summary: asyncio doc: explain how to pass keywords to callbacks (functools.partial) files: Doc/library/asyncio-eventloop.rst | 33 +++++++++++++++++++ Doc/library/asyncio-task.rst | 5 ++ 2 files changed, 38 insertions(+), 0 deletions(-) diff --git a/Doc/library/asyncio-eventloop.rst b/Doc/library/asyncio-eventloop.rst --- a/Doc/library/asyncio-eventloop.rst +++ b/Doc/library/asyncio-eventloop.rst @@ -67,10 +67,22 @@ This is idempotent and irreversible. No other methods should be called after this one. +.. _asyncio-pass-keywords: Calls ----- +Most :mod:`asyncio` functions don't accept keywords. If you want to pass +keywords to your callback, use :func:`functools.partial`. For example, +``loop.call_soon(functools.partial(print, "Hello", flush=True))`` will call +``print("Hello", flush=True)``. + +.. note:: + :func:`functools.partial` is better than ``lambda`` functions, because + :mod:`asyncio` can inspect :func:`functools.partial` object to display + parameters in debug mode, whereas ``lambda`` functions have a poor + representation. + .. method:: BaseEventLoop.call_soon(callback, \*args) Arrange for a callback to be called as soon as possible. @@ -83,6 +95,9 @@ An instance of :class:`asyncio.Handle` is returned. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.call_soon_threadsafe(callback, \*args) Like :meth:`call_soon`, but thread safe. @@ -118,6 +133,9 @@ is called. If you want the callback to be called with some named arguments, use a closure or :func:`functools.partial`. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.call_at(when, callback, *args) Arrange for the *callback* to be called at the given absolute timestamp @@ -126,6 +144,9 @@ This method's behavior is the same as :meth:`call_later`. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.time() Return the current time, as a :class:`float` value, according to the @@ -334,6 +355,9 @@ Start watching the file descriptor for read availability and then call the *callback* with specified arguments. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_reader(fd) Stop watching the file descriptor for read availability. @@ -343,6 +367,9 @@ Start watching the file descriptor for write availability and then call the *callback* with specified arguments. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_writer(fd) Stop watching the file descriptor for write availability. 
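A minimal, hedged sketch of the pattern the new documentation recommends: call_soon() forwards only positional arguments, so keyword arguments have to travel inside a functools.partial:

    import asyncio
    import functools

    loop = asyncio.get_event_loop()

    # loop.call_soon(print, "Hello", flush=True) would raise TypeError,
    # because the extra keyword is not forwarded to the callback.
    loop.call_soon(functools.partial(print, "Hello", flush=True))

    # Let the scheduled callback run once, then shut the loop down.
    loop.run_until_complete(asyncio.sleep(0))
    loop.close()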
@@ -493,6 +520,9 @@ Raise :exc:`ValueError` if the signal number is invalid or uncatchable. Raise :exc:`RuntimeError` if there is a problem setting up the handler. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_signal_handler(sig) Remove a handler for a signal. @@ -518,6 +548,9 @@ The *executor* argument should be an :class:`~concurrent.futures.Executor` instance. The default executor is used if *executor* is ``None``. + :ref:`Use functools.partial to pass keywords to the callback + `. + This method is a :ref:`coroutine `. .. method:: BaseEventLoop.set_default_executor(executor) diff --git a/Doc/library/asyncio-task.rst b/Doc/library/asyncio-task.rst --- a/Doc/library/asyncio-task.rst +++ b/Doc/library/asyncio-task.rst @@ -253,6 +253,11 @@ future is already done when this is called, the callback is scheduled with :meth:`~BaseEventLoop.call_soon`. + :ref:`Use functools.partial to pass parameters to the callback + `. For example, + ``fut.add_done_callback(functools.partial(print, "Future:", + flush=True))`` will call ``print("Future:", fut, flush=True)``. + .. method:: remove_done_callback(fn) Remove all instances of a callback from the "call when done" list. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 13:16:34 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 12:16:34 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_asyncio_doc=3A_explain_how_to_pass_key?= =?utf-8?q?words_to_callbacks?= Message-ID: <20141128121629.84297.23955@psf.io> https://hg.python.org/cpython/rev/29645775b75c changeset: 93641:29645775b75c parent: 93639:ef5bbdc81796 parent: 93640:8dacb1a21793 user: Victor Stinner date: Fri Nov 28 13:16:03 2014 +0100 summary: (Merge 3.4) asyncio doc: explain how to pass keywords to callbacks (functools.partial) files: Doc/library/asyncio-eventloop.rst | 33 +++++++++++++++++++ Doc/library/asyncio-task.rst | 5 ++ 2 files changed, 38 insertions(+), 0 deletions(-) diff --git a/Doc/library/asyncio-eventloop.rst b/Doc/library/asyncio-eventloop.rst --- a/Doc/library/asyncio-eventloop.rst +++ b/Doc/library/asyncio-eventloop.rst @@ -67,10 +67,22 @@ This is idempotent and irreversible. No other methods should be called after this one. +.. _asyncio-pass-keywords: Calls ----- +Most :mod:`asyncio` functions don't accept keywords. If you want to pass +keywords to your callback, use :func:`functools.partial`. For example, +``loop.call_soon(functools.partial(print, "Hello", flush=True))`` will call +``print("Hello", flush=True)``. + +.. note:: + :func:`functools.partial` is better than ``lambda`` functions, because + :mod:`asyncio` can inspect :func:`functools.partial` object to display + parameters in debug mode, whereas ``lambda`` functions have a poor + representation. + .. method:: BaseEventLoop.call_soon(callback, \*args) Arrange for a callback to be called as soon as possible. @@ -83,6 +95,9 @@ An instance of :class:`asyncio.Handle` is returned. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.call_soon_threadsafe(callback, \*args) Like :meth:`call_soon`, but thread safe. @@ -118,6 +133,9 @@ is called. If you want the callback to be called with some named arguments, use a closure or :func:`functools.partial`. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. 
method:: BaseEventLoop.call_at(when, callback, *args) Arrange for the *callback* to be called at the given absolute timestamp @@ -126,6 +144,9 @@ This method's behavior is the same as :meth:`call_later`. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.time() Return the current time, as a :class:`float` value, according to the @@ -334,6 +355,9 @@ Start watching the file descriptor for read availability and then call the *callback* with specified arguments. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_reader(fd) Stop watching the file descriptor for read availability. @@ -343,6 +367,9 @@ Start watching the file descriptor for write availability and then call the *callback* with specified arguments. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_writer(fd) Stop watching the file descriptor for write availability. @@ -493,6 +520,9 @@ Raise :exc:`ValueError` if the signal number is invalid or uncatchable. Raise :exc:`RuntimeError` if there is a problem setting up the handler. + :ref:`Use functools.partial to pass keywords to the callback + `. + .. method:: BaseEventLoop.remove_signal_handler(sig) Remove a handler for a signal. @@ -518,6 +548,9 @@ The *executor* argument should be an :class:`~concurrent.futures.Executor` instance. The default executor is used if *executor* is ``None``. + :ref:`Use functools.partial to pass keywords to the callback + `. + This method is a :ref:`coroutine `. .. method:: BaseEventLoop.set_default_executor(executor) diff --git a/Doc/library/asyncio-task.rst b/Doc/library/asyncio-task.rst --- a/Doc/library/asyncio-task.rst +++ b/Doc/library/asyncio-task.rst @@ -253,6 +253,11 @@ future is already done when this is called, the callback is scheduled with :meth:`~BaseEventLoop.call_soon`. + :ref:`Use functools.partial to pass parameters to the callback + `. For example, + ``fut.add_done_callback(functools.partial(print, "Future:", + flush=True))`` will call ``print("Future:", fut, flush=True)``. + .. method:: remove_done_callback(fn) Remove all instances of a callback from the "call when done" list. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 13:31:08 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 12:31:08 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2321356=3A_Make_ssl?= =?utf-8?q?=2ERAND=5Fegd=28=29_optional_to_support_LibreSSL=2E_The?= Message-ID: <20141128123102.126772.53727@psf.io> https://hg.python.org/cpython/rev/6f23bc5d480e changeset: 93642:6f23bc5d480e user: Victor Stinner date: Fri Nov 28 13:28:25 2014 +0100 summary: Issue #21356: Make ssl.RAND_egd() optional to support LibreSSL. The availability of the function is checked during the compilation. Patch written by Bernard Spil. 
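Since RAND_egd() becomes optional with this change, calling code should probe for it rather than assume it exists. A hedged sketch of that pattern; the EGD socket path and the fallback seed material are hypothetical:

    import ssl

    # ssl.RAND_egd is absent when Python is linked against LibreSSL.
    egd = getattr(ssl, "RAND_egd", None)
    if egd is None:
        # No EGD support compiled in: mix entropy into the PRNG by hand.
        ssl.RAND_add(b"application-provided seed material", 75.0)
    else:
        egd("/tmp/entropy")  # hypothetical EGD socket path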
files: Lib/ssl.py | 7 ++++- Lib/test/test_ssl.py | 5 ++- Misc/NEWS | 4 +++ Modules/_ssl.c | 4 +++ configure | 42 ++++++++++++++++++++++++++++++++ configure.ac | 3 ++ pyconfig.h.in | 3 ++ 7 files changed, 65 insertions(+), 3 deletions(-) diff --git a/Lib/ssl.py b/Lib/ssl.py --- a/Lib/ssl.py +++ b/Lib/ssl.py @@ -106,7 +106,12 @@ from _ssl import (VERIFY_DEFAULT, VERIFY_CRL_CHECK_LEAF, VERIFY_CRL_CHECK_CHAIN, VERIFY_X509_STRICT) from _ssl import txt2obj as _txt2obj, nid2obj as _nid2obj -from _ssl import RAND_status, RAND_egd, RAND_add, RAND_bytes, RAND_pseudo_bytes +from _ssl import RAND_status, RAND_add, RAND_bytes, RAND_pseudo_bytes +try: + from _ssl import RAND_egd +except ImportError: + # LibreSSL does not provide RAND_egd + pass def _import_symbols(prefix): for n in dir(_ssl): diff --git a/Lib/test/test_ssl.py b/Lib/test/test_ssl.py --- a/Lib/test/test_ssl.py +++ b/Lib/test/test_ssl.py @@ -168,8 +168,9 @@ self.assertRaises(ValueError, ssl.RAND_bytes, -5) self.assertRaises(ValueError, ssl.RAND_pseudo_bytes, -5) - self.assertRaises(TypeError, ssl.RAND_egd, 1) - self.assertRaises(TypeError, ssl.RAND_egd, 'foo', 1) + if hasattr(ssl, 'RAND_egd'): + self.assertRaises(TypeError, ssl.RAND_egd, 1) + self.assertRaises(TypeError, ssl.RAND_egd, 'foo', 1) ssl.RAND_add("this is a random string", 75.0) @unittest.skipUnless(os.name == 'posix', 'requires posix') diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,10 @@ Library ------- +- Issue #21356: Make ssl.RAND_egd() optional to support LibreSSL. The + availability of the function is checked during the compilation. Patch written + by Bernard Spil. + - Issue #22915: SAX parser now supports files opened with file descriptor or bytes path. diff --git a/Modules/_ssl.c b/Modules/_ssl.c --- a/Modules/_ssl.c +++ b/Modules/_ssl.c @@ -3713,6 +3713,7 @@ It is necessary to seed the PRNG with RAND_add() on some platforms before\n\ using the ssl() function."); +#ifdef HAVE_RAND_EGD static PyObject * PySSL_RAND_egd(PyObject *self, PyObject *args) { @@ -3740,6 +3741,7 @@ Queries the entropy gather daemon (EGD) on the socket named by 'path'.\n\ Returns number of bytes read. Raises SSLError if connection to EGD\n\ fails or if it does not provide enough data to seed PRNG."); +#endif /* HAVE_RAND_EGD */ #endif /* HAVE_OPENSSL_RAND */ @@ -4135,8 +4137,10 @@ PySSL_RAND_bytes_doc}, {"RAND_pseudo_bytes", PySSL_RAND_pseudo_bytes, METH_VARARGS, PySSL_RAND_pseudo_bytes_doc}, +#ifdef HAVE_RAND_EGD {"RAND_egd", PySSL_RAND_egd, METH_VARARGS, PySSL_RAND_egd_doc}, +#endif {"RAND_status", (PyCFunction)PySSL_RAND_status, METH_NOARGS, PySSL_RAND_status_doc}, #endif diff --git a/configure b/configure --- a/configure +++ b/configure @@ -9046,6 +9046,48 @@ fi # Dynamic linking for HP-UX +{ $as_echo "$as_me:${as_lineno-$LINENO}: checking for RAND_egd in -lcrypto" >&5 +$as_echo_n "checking for RAND_egd in -lcrypto... " >&6; } +if ${ac_cv_lib_crypto_RAND_egd+:} false; then : + $as_echo_n "(cached) " >&6 +else + ac_check_lib_save_LIBS=$LIBS +LIBS="-lcrypto $LIBS" +cat confdefs.h - <<_ACEOF >conftest.$ac_ext +/* end confdefs.h. */ + +/* Override any GCC internal prototype to avoid an error. + Use char because int might match the return type of a GCC + builtin and then its argument prototype would still apply. 
*/ +#ifdef __cplusplus +extern "C" +#endif +char RAND_egd (); +int +main () +{ +return RAND_egd (); + ; + return 0; +} +_ACEOF +if ac_fn_c_try_link "$LINENO"; then : + ac_cv_lib_crypto_RAND_egd=yes +else + ac_cv_lib_crypto_RAND_egd=no +fi +rm -f core conftest.err conftest.$ac_objext \ + conftest$ac_exeext conftest.$ac_ext +LIBS=$ac_check_lib_save_LIBS +fi +{ $as_echo "$as_me:${as_lineno-$LINENO}: result: $ac_cv_lib_crypto_RAND_egd" >&5 +$as_echo "$ac_cv_lib_crypto_RAND_egd" >&6; } +if test "x$ac_cv_lib_crypto_RAND_egd" = xyes; then : + +$as_echo "#define HAVE_RAND_EGD 1" >>confdefs.h + +fi + # only check for sem_init if thread support is requested if test "$with_threads" = "yes" -o -z "$with_threads"; then diff --git a/configure.ac b/configure.ac --- a/configure.ac +++ b/configure.ac @@ -2293,6 +2293,9 @@ AC_CHECK_LIB(sendfile, sendfile) AC_CHECK_LIB(dl, dlopen) # Dynamic linking for SunOS/Solaris and SYSV AC_CHECK_LIB(dld, shl_load) # Dynamic linking for HP-UX +AC_CHECK_LIB(crypto, RAND_egd, + AC_DEFINE(HAVE_RAND_EGD, 1, + [Define if the libcrypto has RAND_egd])) # only check for sem_init if thread support is requested if test "$with_threads" = "yes" -o -z "$with_threads"; then diff --git a/pyconfig.h.in b/pyconfig.h.in --- a/pyconfig.h.in +++ b/pyconfig.h.in @@ -675,6 +675,9 @@ /* Define to 1 if you have the `pwrite' function. */ #undef HAVE_PWRITE +/* Define if the libcrypto has RAND_egd */ +#undef HAVE_RAND_EGD + /* Define to 1 if you have the `readlink' function. */ #undef HAVE_READLINK -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 17:46:19 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 16:46:19 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogYXN5bmNpbyBkb2M6?= =?utf-8?q?_reformat_event_loop_policy_doc?= Message-ID: <20141128164616.69805.41683@psf.io> https://hg.python.org/cpython/rev/c90fe355ac43 changeset: 93643:c90fe355ac43 branch: 3.4 parent: 93640:8dacb1a21793 user: Victor Stinner date: Fri Nov 28 13:58:28 2014 +0100 summary: asyncio doc: reformat event loop policy doc files: Doc/library/asyncio-eventloops.rst | 26 ++++++++++++----- 1 files changed, 18 insertions(+), 8 deletions(-) diff --git a/Doc/library/asyncio-eventloops.rst b/Doc/library/asyncio-eventloops.rst --- a/Doc/library/asyncio-eventloops.rst +++ b/Doc/library/asyncio-eventloops.rst @@ -150,6 +150,7 @@ :func:`get_event_loop` and :func:`set_event_loop` provide convenient access to event loops managed by the default policy. + Event loop policy interface --------------------------- @@ -157,22 +158,31 @@ .. class:: AbstractEventLoopPolicy + Event loop policy. + .. method:: get_event_loop() - Get the event loop for the current context. Returns an event loop object - implementing the :class:`BaseEventLoop` interface, or raises an exception in case - no event loop has been set for the current context and the current policy - does not specify to create one. It should never return ``None``. + Get the event loop for the current context. + + Returns an event loop object implementing the :class:`BaseEventLoop` + interface. + + Raises an exception in case no event loop has been set for the current + context and the current policy does not specify to create one. It must + never return ``None``. .. method:: set_event_loop(loop) - Set the event loop for the current context to *loop*. + Set the event loop for the current context to *loop*. .. 
method:: new_event_loop() - Create and return a new event loop object according to this policy's rules. - If there's need to set this loop as the event loop for the current context, - :meth:`set_event_loop` must be called explicitly. + Create and return a new event loop object according to this policy's + rules. + + If there's need to set this loop as the event loop for the current + context, :meth:`set_event_loop` must be called explicitly. + Access to the global loop policy -------------------------------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 17:46:19 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 16:46:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_asyncio_doc=3A_reformat_event_loop_pol?= =?utf-8?q?icy_doc?= Message-ID: <20141128164616.84285.8501@psf.io> https://hg.python.org/cpython/rev/2ab452a0c5c6 changeset: 93644:2ab452a0c5c6 parent: 93642:6f23bc5d480e parent: 93643:c90fe355ac43 user: Victor Stinner date: Fri Nov 28 13:58:53 2014 +0100 summary: (Merge 3.4) asyncio doc: reformat event loop policy doc files: Doc/library/asyncio-eventloops.rst | 26 ++++++++++++----- 1 files changed, 18 insertions(+), 8 deletions(-) diff --git a/Doc/library/asyncio-eventloops.rst b/Doc/library/asyncio-eventloops.rst --- a/Doc/library/asyncio-eventloops.rst +++ b/Doc/library/asyncio-eventloops.rst @@ -150,6 +150,7 @@ :func:`get_event_loop` and :func:`set_event_loop` provide convenient access to event loops managed by the default policy. + Event loop policy interface --------------------------- @@ -157,22 +158,31 @@ .. class:: AbstractEventLoopPolicy + Event loop policy. + .. method:: get_event_loop() - Get the event loop for the current context. Returns an event loop object - implementing the :class:`BaseEventLoop` interface, or raises an exception in case - no event loop has been set for the current context and the current policy - does not specify to create one. It should never return ``None``. + Get the event loop for the current context. + + Returns an event loop object implementing the :class:`BaseEventLoop` + interface. + + Raises an exception in case no event loop has been set for the current + context and the current policy does not specify to create one. It must + never return ``None``. .. method:: set_event_loop(loop) - Set the event loop for the current context to *loop*. + Set the event loop for the current context to *loop*. .. method:: new_event_loop() - Create and return a new event loop object according to this policy's rules. - If there's need to set this loop as the event loop for the current context, - :meth:`set_event_loop` must be called explicitly. + Create and return a new event loop object according to this policy's + rules. + + If there's need to set this loop as the event loop for the current + context, :meth:`set_event_loop` must be called explicitly. 
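As the reworded policy documentation above notes, new_event_loop() only creates a loop; installing it is a separate step. A small illustrative sketch, not part of the patch:

    import asyncio

    policy = asyncio.get_event_loop_policy()
    loop = policy.new_event_loop()
    # new_event_loop() does not make the loop current; install it explicitly.
    asyncio.set_event_loop(loop)
    try:
        loop.call_soon(loop.stop)
        loop.run_forever()
    finally:
        loop.close()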
+ Access to the global loop policy -------------------------------- -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 17:46:19 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 16:46:19 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogQ2xvc2VzICMyMjM0?= =?utf-8?q?8=3A_Rephrase_asyncio=2EStreamWriter=2Edrain=28=29_documentatio?= =?utf-8?q?n?= Message-ID: <20141128164616.69799.78159@psf.io> https://hg.python.org/cpython/rev/8224253ef4b7 changeset: 93645:8224253ef4b7 branch: 3.4 parent: 93643:c90fe355ac43 user: Victor Stinner date: Fri Nov 28 17:45:41 2014 +0100 summary: Closes #22348: Rephrase asyncio.StreamWriter.drain() documentation Patch written by Martin Richard. files: Doc/library/asyncio-stream.rst | 14 ++++++++++---- Misc/ACKS | 1 + 2 files changed, 11 insertions(+), 4 deletions(-) diff --git a/Doc/library/asyncio-stream.rst b/Doc/library/asyncio-stream.rst --- a/Doc/library/asyncio-stream.rst +++ b/Doc/library/asyncio-stream.rst @@ -170,16 +170,22 @@ .. method:: drain() - Wait until the write buffer of the underlying transport is flushed. + Let the write buffer of the underlying transport a chance to be flushed. The intended use is to write:: w.write(data) yield from w.drain() - When the transport buffer is full (the protocol is paused), block until - the buffer is (partially) drained and the protocol is resumed. When there - is nothing to wait for, the yield-from continues immediately. + When the size of the transport buffer reaches the high-water limit (the + protocol is paused), block until the size of the buffer is drained down + to the low-water limit and the protocol is resumed. When there is nothing + to wait for, the yield-from continues immediately. + + Yielding from :meth:`drain` gives the opportunity for the loop to + schedule the write operation and flush the buffer. It should especially + be used when a possibly large amount of data is written to the transport, + and the coroutine does not yield-from between calls to :meth:`write`. This method is a :ref:`coroutine `. diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -1125,6 +1125,7 @@ Tim Rice Jan Pieter Riegel Armin Rigo +Martin Richard Arc Riley Nicholas Riley Jean-Claude Rimbault -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 17:46:19 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 16:46:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_=28Merge_3=2E4=29_Closes_=2322348=3A_Rephrase_asyncio=2E?= =?utf-8?q?StreamWriter=2Edrain=28=29_documentation?= Message-ID: <20141128164617.126792.42196@psf.io> https://hg.python.org/cpython/rev/1cad9e4bba40 changeset: 93646:1cad9e4bba40 parent: 93644:2ab452a0c5c6 parent: 93645:8224253ef4b7 user: Victor Stinner date: Fri Nov 28 17:46:05 2014 +0100 summary: (Merge 3.4) Closes #22348: Rephrase asyncio.StreamWriter.drain() documentation Patch written by Martin Richard. files: Doc/library/asyncio-stream.rst | 14 ++++++++++---- Misc/ACKS | 1 + 2 files changed, 11 insertions(+), 4 deletions(-) diff --git a/Doc/library/asyncio-stream.rst b/Doc/library/asyncio-stream.rst --- a/Doc/library/asyncio-stream.rst +++ b/Doc/library/asyncio-stream.rst @@ -170,16 +170,22 @@ .. method:: drain() - Wait until the write buffer of the underlying transport is flushed. + Let the write buffer of the underlying transport a chance to be flushed. 
The intended use is to write:: w.write(data) yield from w.drain() - When the transport buffer is full (the protocol is paused), block until - the buffer is (partially) drained and the protocol is resumed. When there - is nothing to wait for, the yield-from continues immediately. + When the size of the transport buffer reaches the high-water limit (the + protocol is paused), block until the size of the buffer is drained down + to the low-water limit and the protocol is resumed. When there is nothing + to wait for, the yield-from continues immediately. + + Yielding from :meth:`drain` gives the opportunity for the loop to + schedule the write operation and flush the buffer. It should especially + be used when a possibly large amount of data is written to the transport, + and the coroutine does not yield-from between calls to :meth:`write`. This method is a :ref:`coroutine `. diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -1140,6 +1140,7 @@ Tim Rice Jan Pieter Riegel Armin Rigo +Martin Richard Arc Riley Nicholas Riley Jean-Claude Rimbault -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 18:03:20 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 17:03:20 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Merge_3=2E4_=28asyncio=29?= Message-ID: <20141128170259.116320.13268@psf.io> https://hg.python.org/cpython/rev/c9b03ff2ab10 changeset: 93648:c9b03ff2ab10 parent: 93646:1cad9e4bba40 parent: 93647:737355f61ba2 user: Victor Stinner date: Fri Nov 28 18:02:16 2014 +0100 summary: Merge 3.4 (asyncio) files: Lib/test/test_asyncio/test_subprocess.py | 17 +++++++---- 1 files changed, 10 insertions(+), 7 deletions(-) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -163,13 +163,14 @@ self.loop.run_until_complete(proc.wait()) def test_pause_reading(self): + limit = 10 + size = (limit * 2 + 1) + @asyncio.coroutine def test_pause_reading(): - limit = 100 - code = '\n'.join(( 'import sys', - 'sys.stdout.write("x" * %s)' % (limit * 2 + 1), + 'sys.stdout.write("x" * %s)' % size, 'sys.stdout.flush()', )) proc = yield from asyncio.create_subprocess_exec( @@ -181,17 +182,19 @@ stdout_transport = proc._transport.get_pipe_transport(1) stdout_transport.pause_reading = mock.Mock() - yield from proc.wait() + stdout, stderr = yield from proc.communicate() # The child process produced more than limit bytes of output, # the stream reader transport should pause the protocol to not # allocate too much memory. 
- return stdout_transport.pause_reading.called + return (stdout, stdout_transport) # Issue #22685: Ensure that the stream reader pauses the protocol # when the child process produces too much data - called = self.loop.run_until_complete(test_pause_reading()) - self.assertTrue(called) + stdout, transport = self.loop.run_until_complete(test_pause_reading()) + + self.assertEqual(stdout, b'x' * size) + self.assertTrue(transport.pause_reading.called) if sys.platform != 'win32': -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 18:03:20 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 17:03:20 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzIyNjg1?= =?utf-8?q?=3A_Debug_test=5Fpause=5Freading=28=29_on_FreeBSD?= Message-ID: <20141128170259.116306.22361@psf.io> https://hg.python.org/cpython/rev/737355f61ba2 changeset: 93647:737355f61ba2 branch: 3.4 parent: 93645:8224253ef4b7 user: Victor Stinner date: Fri Nov 28 18:02:03 2014 +0100 summary: Issue #22685: Debug test_pause_reading() on FreeBSD files: Lib/test/test_asyncio/test_subprocess.py | 17 +++++++---- 1 files changed, 10 insertions(+), 7 deletions(-) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -163,13 +163,14 @@ self.loop.run_until_complete(proc.wait()) def test_pause_reading(self): + limit = 10 + size = (limit * 2 + 1) + @asyncio.coroutine def test_pause_reading(): - limit = 100 - code = '\n'.join(( 'import sys', - 'sys.stdout.write("x" * %s)' % (limit * 2 + 1), + 'sys.stdout.write("x" * %s)' % size, 'sys.stdout.flush()', )) proc = yield from asyncio.create_subprocess_exec( @@ -181,17 +182,19 @@ stdout_transport = proc._transport.get_pipe_transport(1) stdout_transport.pause_reading = mock.Mock() - yield from proc.wait() + stdout, stderr = yield from proc.communicate() # The child process produced more than limit bytes of output, # the stream reader transport should pause the protocol to not # allocate too much memory. - return stdout_transport.pause_reading.called + return (stdout, stdout_transport) # Issue #22685: Ensure that the stream reader pauses the protocol # when the child process produces too much data - called = self.loop.run_until_complete(test_pause_reading()) - self.assertTrue(called) + stdout, transport = self.loop.run_until_complete(test_pause_reading()) + + self.assertEqual(stdout, b'x' * size) + self.assertTrue(transport.pause_reading.called) if sys.platform != 'win32': -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 22:27:35 2014 From: python-checkins at python.org (berker.peksag) Date: Fri, 28 Nov 2014 21:27:35 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322389=3A_Add_cont?= =?utf-8?q?extlib=2Eredirect=5Fstderr=28=29=2E?= Message-ID: <20141128212731.126778.97265@psf.io> https://hg.python.org/cpython/rev/7f12c9c09fb6 changeset: 93649:7f12c9c09fb6 user: Berker Peksag date: Fri Nov 28 23:28:06 2014 +0200 summary: Issue #22389: Add contextlib.redirect_stderr(). 
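A short usage sketch for the new context manager (requires Python 3.5+, where redirect_stderr() exists); the message text is illustrative only:

    import contextlib
    import io
    import sys

    buf = io.StringIO()
    # Temporarily send writes to sys.stderr into an in-memory buffer.
    with contextlib.redirect_stderr(buf):
        print("warning: something happened", file=sys.stderr)
    assert buf.getvalue() == "warning: something happened\n"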
files: Doc/library/contextlib.rst | 10 ++++ Doc/whatsnew/3.5.rst | 9 +++ Lib/contextlib.py | 40 +++++++++++----- Lib/test/test_contextlib.py | 58 +++++++++++++++--------- Misc/NEWS | 2 + 5 files changed, 85 insertions(+), 34 deletions(-) diff --git a/Doc/library/contextlib.rst b/Doc/library/contextlib.rst --- a/Doc/library/contextlib.rst +++ b/Doc/library/contextlib.rst @@ -172,6 +172,16 @@ .. versionadded:: 3.4 +.. function:: redirect_stderr(new_target) + + Similar to :func:`~contextlib.redirect_stdout` but redirecting + :data:`sys.stderr` to another file or file-like object. + + This context manager is :ref:`reentrant `. + + .. versionadded:: 3.5 + + .. class:: ContextDecorator() A base class that enables a context manager to also be used as a decorator. diff --git a/Doc/whatsnew/3.5.rst b/Doc/whatsnew/3.5.rst --- a/Doc/whatsnew/3.5.rst +++ b/Doc/whatsnew/3.5.rst @@ -148,6 +148,15 @@ can now do parallel bytecode compilation. (Contributed by Claudiu Popa in :issue:`16104`.) +contextlib +---------- + +* The new :func:`contextlib.redirect_stderr` context manager(similar to + :func:`contextlib.redirect_stdout`) makes it easier for utility scripts to + handle inflexible APIs that write their output to :data:`sys.stderr` and + don't provide any options to redirect it. + (Contributed by Berker Peksag in :issue:`22389`.) + doctest ------- diff --git a/Lib/contextlib.py b/Lib/contextlib.py --- a/Lib/contextlib.py +++ b/Lib/contextlib.py @@ -5,7 +5,7 @@ from functools import wraps __all__ = ["contextmanager", "closing", "ContextDecorator", "ExitStack", - "redirect_stdout", "suppress"] + "redirect_stdout", "redirect_stderr", "suppress"] class ContextDecorator(object): @@ -151,8 +151,27 @@ def __exit__(self, *exc_info): self.thing.close() -class redirect_stdout: - """Context manager for temporarily redirecting stdout to another file + +class _RedirectStream: + + _stream = None + + def __init__(self, new_target): + self._new_target = new_target + # We use a list of old targets to make this CM re-entrant + self._old_targets = [] + + def __enter__(self): + self._old_targets.append(getattr(sys, self._stream)) + setattr(sys, self._stream, self._new_target) + return self._new_target + + def __exit__(self, exctype, excinst, exctb): + setattr(sys, self._stream, self._old_targets.pop()) + + +class redirect_stdout(_RedirectStream): + """Context manager for temporarily redirecting stdout to another file. 
# How to send help() to stderr with redirect_stdout(sys.stderr): @@ -164,18 +183,13 @@ help(pow) """ - def __init__(self, new_target): - self._new_target = new_target - # We use a list of old targets to make this CM re-entrant - self._old_targets = [] + _stream = "stdout" - def __enter__(self): - self._old_targets.append(sys.stdout) - sys.stdout = self._new_target - return self._new_target - def __exit__(self, exctype, excinst, exctb): - sys.stdout = self._old_targets.pop() +class redirect_stderr(_RedirectStream): + """Context manager for temporarily redirecting stderr to another file.""" + + _stream = "stderr" class suppress: diff --git a/Lib/test/test_contextlib.py b/Lib/test/test_contextlib.py --- a/Lib/test/test_contextlib.py +++ b/Lib/test/test_contextlib.py @@ -718,60 +718,76 @@ stack.push(cm) self.assertIs(stack._exit_callbacks[-1], cm) -class TestRedirectStdout(unittest.TestCase): + +class TestRedirectStream: + + redirect_stream = None + orig_stream = None @support.requires_docstrings def test_instance_docs(self): # Issue 19330: ensure context manager instances have good docstrings - cm_docstring = redirect_stdout.__doc__ - obj = redirect_stdout(None) + cm_docstring = self.redirect_stream.__doc__ + obj = self.redirect_stream(None) self.assertEqual(obj.__doc__, cm_docstring) def test_no_redirect_in_init(self): - orig_stdout = sys.stdout - redirect_stdout(None) - self.assertIs(sys.stdout, orig_stdout) + orig_stdout = getattr(sys, self.orig_stream) + self.redirect_stream(None) + self.assertIs(getattr(sys, self.orig_stream), orig_stdout) def test_redirect_to_string_io(self): f = io.StringIO() msg = "Consider an API like help(), which prints directly to stdout" - orig_stdout = sys.stdout - with redirect_stdout(f): - print(msg) - self.assertIs(sys.stdout, orig_stdout) + orig_stdout = getattr(sys, self.orig_stream) + with self.redirect_stream(f): + print(msg, file=getattr(sys, self.orig_stream)) + self.assertIs(getattr(sys, self.orig_stream), orig_stdout) s = f.getvalue().strip() self.assertEqual(s, msg) def test_enter_result_is_target(self): f = io.StringIO() - with redirect_stdout(f) as enter_result: + with self.redirect_stream(f) as enter_result: self.assertIs(enter_result, f) def test_cm_is_reusable(self): f = io.StringIO() - write_to_f = redirect_stdout(f) - orig_stdout = sys.stdout + write_to_f = self.redirect_stream(f) + orig_stdout = getattr(sys, self.orig_stream) with write_to_f: - print("Hello", end=" ") + print("Hello", end=" ", file=getattr(sys, self.orig_stream)) with write_to_f: - print("World!") - self.assertIs(sys.stdout, orig_stdout) + print("World!", file=getattr(sys, self.orig_stream)) + self.assertIs(getattr(sys, self.orig_stream), orig_stdout) s = f.getvalue() self.assertEqual(s, "Hello World!\n") def test_cm_is_reentrant(self): f = io.StringIO() - write_to_f = redirect_stdout(f) - orig_stdout = sys.stdout + write_to_f = self.redirect_stream(f) + orig_stdout = getattr(sys, self.orig_stream) with write_to_f: - print("Hello", end=" ") + print("Hello", end=" ", file=getattr(sys, self.orig_stream)) with write_to_f: - print("World!") - self.assertIs(sys.stdout, orig_stdout) + print("World!", file=getattr(sys, self.orig_stream)) + self.assertIs(getattr(sys, self.orig_stream), orig_stdout) s = f.getvalue() self.assertEqual(s, "Hello World!\n") +class TestRedirectStdout(TestRedirectStream, unittest.TestCase): + + redirect_stream = redirect_stdout + orig_stream = "stdout" + + +class TestRedirectStderr(TestRedirectStream, unittest.TestCase): + + redirect_stream = 
redirect_stderr + orig_stream = "stderr" + + class TestSuppress(unittest.TestCase): @support.requires_docstrings diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,8 @@ Library ------- +- Issue #22389: Add contextlib.redirect_stderr(). + - Issue #21356: Make ssl.RAND_egd() optional to support LibreSSL. The availability of the function is checked during the compilation. Patch written by Bernard Spil. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 22:40:13 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 21:40:13 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322685=2C_asyncio?= =?utf-8?q?=3A_mock_also_resume=5Freading_in_test=5Fpause=5Freading=28=29?= Message-ID: <20141128214007.69779.94281@psf.io> https://hg.python.org/cpython/rev/0dd91298eb17 changeset: 93650:0dd91298eb17 user: Victor Stinner date: Fri Nov 28 22:37:16 2014 +0100 summary: Issue #22685, asyncio: mock also resume_reading in test_pause_reading() files: Lib/test/test_asyncio/test_subprocess.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -181,6 +181,7 @@ loop=self.loop) stdout_transport = proc._transport.get_pipe_transport(1) stdout_transport.pause_reading = mock.Mock() + stdout_transport.resume_reading = mock.Mock() stdout, stderr = yield from proc.communicate() -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 22:42:19 2014 From: python-checkins at python.org (victor.stinner) Date: Fri, 28 Nov 2014 21:42:19 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322685=2C_asyncio?= =?utf-8?q?=3A_resume=5Freading=28=29_must_also_be_called_in?= Message-ID: <20141128214213.55125.33983@psf.io> https://hg.python.org/cpython/rev/276515d2ceed changeset: 93651:276515d2ceed user: Victor Stinner date: Fri Nov 28 22:42:06 2014 +0100 summary: Issue #22685, asyncio: resume_reading() must also be called in test_pause_reading() files: Lib/test/test_asyncio/test_subprocess.py | 1 + 1 files changed, 1 insertions(+), 0 deletions(-) diff --git a/Lib/test/test_asyncio/test_subprocess.py b/Lib/test/test_asyncio/test_subprocess.py --- a/Lib/test/test_asyncio/test_subprocess.py +++ b/Lib/test/test_asyncio/test_subprocess.py @@ -196,6 +196,7 @@ self.assertEqual(stdout, b'x' * size) self.assertTrue(transport.pause_reading.called) + self.assertTrue(transport.resume_reading.called) if sys.platform != 'win32': -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Fri Nov 28 23:52:27 2014 From: python-checkins at python.org (raymond.hettinger) Date: Fri, 28 Nov 2014 22:52:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Minor_code_cleanup=2E?= Message-ID: <20141128225227.55105.75378@psf.io> https://hg.python.org/cpython/rev/70163e18da87 changeset: 93652:70163e18da87 user: Raymond Hettinger date: Fri Nov 28 14:52:14 2014 -0800 summary: Minor code cleanup. files: Lib/xml/etree/ElementPath.py | 5 +---- 1 files changed, 1 insertions(+), 4 deletions(-) diff --git a/Lib/xml/etree/ElementPath.py b/Lib/xml/etree/ElementPath.py --- a/Lib/xml/etree/ElementPath.py +++ b/Lib/xml/etree/ElementPath.py @@ -295,10 +295,7 @@ # Find first matching object. 
def find(elem, path, namespaces=None): - try: - return next(iterfind(elem, path, namespaces)) - except StopIteration: - return None + return next(iterfind(elem, path, namespaces), None) ## # Find all matching objects. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 29 00:22:50 2014 From: python-checkins at python.org (ned.deily) Date: Fri, 28 Nov 2014 23:22:50 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAoMy40KTogSXNzdWUgIzE2MTEz?= =?utf-8?q?=3A_Also_remove_test=5Fcase=5Fsha3=5F224=5Fhuge?= Message-ID: <20141128232238.116312.74854@psf.io> https://hg.python.org/cpython/rev/21257f916668 changeset: 93653:21257f916668 branch: 3.4 parent: 93647:737355f61ba2 user: Ned Deily date: Fri Nov 28 15:21:12 2014 -0800 summary: Issue #16113: Also remove test_case_sha3_224_huge files: Lib/test/test_hashlib.py | 6 ------ 1 files changed, 0 insertions(+), 6 deletions(-) diff --git a/Lib/test/test_hashlib.py b/Lib/test/test_hashlib.py --- a/Lib/test/test_hashlib.py +++ b/Lib/test/test_hashlib.py @@ -373,12 +373,6 @@ "e718483d0ce769644e2e42c7bc15b4638e1f98b13b2044285632a803afa973eb"+ "de0ff244877ea60a4cb0432ce577c31beb009c5c2c49aa2e4eadb217ad8cc09b") - @unittest.skipIf(sys.maxsize < _4G + 5, 'test cannot run on 32-bit systems') - @bigmemtest(size=_4G + 5, memuse=1, dry_run=False) - def test_case_sha3_224_huge(self, size): - self.check('sha3_224', b'A'*size, - '58ef60057c9dddb6a87477e9ace5a26f0d9db01881cf9b10a9f8c224') - def test_gil(self): # Check things work fine with an input larger than the size required # for multithreaded operation (which is hardwired to 2048). -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 29 00:22:51 2014 From: python-checkins at python.org (ned.deily) Date: Fri, 28 Nov 2014 23:22:51 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Issue_=2316113=3A_Also_remove_test=5Fcase=5Fsha3=5F224?= =?utf-8?q?=5Fhuge?= Message-ID: <20141128232238.55123.93330@psf.io> https://hg.python.org/cpython/rev/bd97eab25c70 changeset: 93654:bd97eab25c70 parent: 93652:70163e18da87 parent: 93653:21257f916668 user: Ned Deily date: Fri Nov 28 15:22:15 2014 -0800 summary: Issue #16113: Also remove test_case_sha3_224_huge files: Lib/test/test_hashlib.py | 6 ------ 1 files changed, 0 insertions(+), 6 deletions(-) diff --git a/Lib/test/test_hashlib.py b/Lib/test/test_hashlib.py --- a/Lib/test/test_hashlib.py +++ b/Lib/test/test_hashlib.py @@ -373,12 +373,6 @@ "e718483d0ce769644e2e42c7bc15b4638e1f98b13b2044285632a803afa973eb"+ "de0ff244877ea60a4cb0432ce577c31beb009c5c2c49aa2e4eadb217ad8cc09b") - @unittest.skipIf(sys.maxsize < _4G + 5, 'test cannot run on 32-bit systems') - @bigmemtest(size=_4G + 5, memuse=1, dry_run=False) - def test_case_sha3_224_huge(self, size): - self.check('sha3_224', b'A'*size, - '58ef60057c9dddb6a87477e9ace5a26f0d9db01881cf9b10a9f8c224') - def test_gil(self): # Check things work fine with an input larger than the size required # for multithreaded operation (which is hardwired to 2048). 
-- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 29 02:37:14 2014 From: python-checkins at python.org (guido.van.rossum) Date: Sat, 29 Nov 2014 01:37:14 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Elaborate_transaction=28=29_m?= =?utf-8?q?anager_example_=28Chris_A=29=2E?= Message-ID: <20141129013709.116314.23132@psf.io> https://hg.python.org/peps/rev/4803b0829533 changeset: 5624:4803b0829533 user: Guido van Rossum date: Fri Nov 28 17:26:33 2014 -0800 summary: Elaborate transaction() manager example (Chris A). files: pep-0479.txt | 31 ++++++++++++++++++++++--------- 1 files changed, 22 insertions(+), 9 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -44,26 +44,39 @@ existent". Unfortunately while intentional use is rare, it is easy to stumble on these cases by accident:: + import contextlib + @contextlib.contextmanager def transaction(): - begin() + print('begin') try: yield from do_it() except: - rollback() + print('rollback') raise else: - commit() - + print('commit') + def do_it(): - initial_preparations() - yield - finishing_touches() + print('Refactored preparations') + yield # Body of with-statement is executed here + print('Refactored finalization') + + def gene(): + for i in range(2): + with transaction(): + yield i + # return + raise StopIteration # This is wrong + print('Should not be reached') + + for i in gene(): + print('main: i =', i) Here factoring out ``do_it`` into a subgenerator has introduced a subtle bug: if the wrapped block raises ``StopIteration``, under the -current behavior ``do_it`` will fail but report success by returning -normally, causing the failed transaction to be committed! Similarly +current behavior this exception will be swallowed by the context +manager; and, worse, the finalization is silently skipped! Similarly problematic behavior occurs when an ``asyncio`` coroutine raises ``StopIteration``, causing it to terminate silently. -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sat Nov 29 05:11:28 2014 From: python-checkins at python.org (guido.van.rossum) Date: Sat, 29 Nov 2014 04:11:28 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Two_new_sections_=28more_moti?= =?utf-8?q?vation=2C_rejected_=40allow=5Fimplicit=5Fstop=29=2E?= Message-ID: <20141129041127.116306.58337@psf.io> https://hg.python.org/peps/rev/2cb6c16d7d2a changeset: 5625:2cb6c16d7d2a user: Guido van Rossum date: Fri Nov 28 20:11:11 2014 -0800 summary: Two new sections (more motivation, rejected @allow_implicit_stop). files: pep-0479.txt | 56 ++++++++++++++++++++++++++++++++++++++++ 1 files changed, 56 insertions(+), 0 deletions(-) diff --git a/pep-0479.txt b/pep-0479.txt --- a/pep-0479.txt +++ b/pep-0479.txt @@ -100,6 +100,16 @@ terminate a generator: the proper way is ``return``, not ``raise StopIteration``. +As an added bonus, the above changes bring generator functions much +more in line with regular functions. If you wish to take a piece of +code presented as a generator and turn it into something else, you +can usually do this fairly simply, by replacing every ``yield`` with +a call to ``print()`` or ``list.append()``; however, if there are any +bare ``next()`` calls in the code, you have to be aware of them. If +the code was originally written without relying on ``StopIteration`` +terminating the function, the transformation would be that much +easier. 
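A compact illustration of the silent-truncation pitfall described above, using a hypothetical generator rather than the PEP's transaction() example:

    def first_two(source):
        it = iter(source)
        # Under pre-PEP 479 semantics, a StopIteration escaping from next()
        # silently terminates this generator instead of being reported.
        yield next(it)
        yield next(it)

    print(list(first_two([1, 2])))   # [1, 2]
    print(list(first_two([1])))      # [1] before PEP 479; RuntimeError once
                                     # generator_stop semantics are in effect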
+ Background information ====================== @@ -433,6 +443,7 @@ bubble out would still be potentially wrong, depending on the use made of the distinction between the two exception types. + Converting the exception inside next() -------------------------------------- @@ -449,6 +460,45 @@ would help this; however, all code would still need to be rewritten.) +Sub-proposal: decorator to explicitly request current behaviour +--------------------------------------------------------------- + +Nick Coghlan suggested [13]_ that the situations where the current +behaviour is desired could be supported by means of a decorator:: + + from itertools import allow_implicit_stop + + @allow_implicit_stop + def my_generator(): + ... + yield next(it) + ... + +Which would be semantically equivalent to:: + + def my_generator(): + try: + ... + yield next(it) + ... + except StopIteration + return + +but be faster, as it could be implemented by simply permitting the +``StopIteration`` to bubble up directly. + +Single-source Python 2/3 code would also benefit in a 3.7+ world, +since libraries like six and python-future could just define their own +version of "allow_implicit_stop" that referred to the new builtin in +3.5+, and was implemented as an identity function in other versions. + +However, due to the implementation complexities required, the ongoing +compatibility issues created, the subtlety of the decorator's effect, +and the fact that it would encourage the "quick-fix" solution of just +slapping the decorator onto all generators instead of properly fixing +the code in question, this sub-proposal has been rejected. [14]_ + + Criticism ========= @@ -516,6 +566,12 @@ .. [12] Post from Mark Shannon with alternate proposal (https://mail.python.org/pipermail/python-dev/2014-November/137129.html) +.. [13] Idea from Nick Coghlan + (https://mail.python.org/pipermail/python-dev/2014-November/137201.html) + +.. [14] Rejection by GvR + (https://mail.python.org/pipermail/python-dev/2014-November/137243.html) + Copyright ========= -- Repository URL: https://hg.python.org/peps From solipsis at pitrou.net Sat Nov 29 10:33:28 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sat, 29 Nov 2014 10:33:28 +0100 Subject: [Python-checkins] Daily reference leaks (bd97eab25c70): sum=3 Message-ID: results for bd97eab25c70 on branch "default" -------------------------------------------- test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflogWR_tSy', '-x'] From python-checkins at python.org Sat Nov 29 15:56:48 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sat, 29 Nov 2014 14:56:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?q?=29=3A_Close_issue_=2322895=3A_fix_test_failure_introduced_by_t?= =?utf-8?q?he_fix_for_issue_=2322462=2E?= Message-ID: <20141129145647.126780.56962@psf.io> https://hg.python.org/cpython/rev/4990157343c6 changeset: 93656:4990157343c6 parent: 93654:bd97eab25c70 parent: 93655:e4b986350feb user: Antoine Pitrou date: Sat Nov 29 15:56:38 2014 +0100 summary: Close issue #22895: fix test failure introduced by the fix for issue #22462. 
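A hedged sketch of the guard pattern this fix applies, with a hypothetical test and captured line, since the exact C source text is only available when running from a source build:

    import sysconfig
    import unittest

    class TracebackEntryTest(unittest.TestCase):
        def test_c_source_line(self):
            captured_line = 'call_with_frame("StartElement", ...)'  # hypothetical
            # Only assert on C source details when built from a checkout.
            if sysconfig.is_python_build():
                self.assertIn('call_with_frame("StartElement"', captured_line)

    if __name__ == "__main__":
        unittest.main()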
files: Lib/test/test_pyexpat.py | 4 +++- 1 files changed, 3 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_pyexpat.py b/Lib/test/test_pyexpat.py --- a/Lib/test/test_pyexpat.py +++ b/Lib/test/test_pyexpat.py @@ -3,6 +3,7 @@ from io import BytesIO import os +import sysconfig import unittest import traceback @@ -444,7 +445,8 @@ "pyexpat.c", "StartElement") self.check_traceback_entry(entries[2], "test_pyexpat.py", "StartElementHandler") - self.assertIn('call_with_frame("StartElement"', entries[1][3]) + if sysconfig.is_python_build(): + self.assertIn('call_with_frame("StartElement"', entries[1][3]) # Test Current* members: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sat Nov 29 15:56:48 2014 From: python-checkins at python.org (antoine.pitrou) Date: Sat, 29 Nov 2014 14:56:48 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_Close_issue_?= =?utf-8?q?=2322895=3A_fix_test_failure_introduced_by_the_fix_for_issue_?= =?utf-8?q?=2322462=2E?= Message-ID: <20141129145647.116318.67899@psf.io> https://hg.python.org/cpython/rev/e4b986350feb changeset: 93655:e4b986350feb branch: 3.4 parent: 93653:21257f916668 user: Antoine Pitrou date: Sat Nov 29 15:56:07 2014 +0100 summary: Close issue #22895: fix test failure introduced by the fix for issue #22462. files: Lib/test/test_pyexpat.py | 4 +++- 1 files changed, 3 insertions(+), 1 deletions(-) diff --git a/Lib/test/test_pyexpat.py b/Lib/test/test_pyexpat.py --- a/Lib/test/test_pyexpat.py +++ b/Lib/test/test_pyexpat.py @@ -3,6 +3,7 @@ from io import BytesIO import os +import sysconfig import unittest import traceback @@ -444,7 +445,8 @@ "pyexpat.c", "StartElement") self.check_traceback_entry(entries[2], "test_pyexpat.py", "StartElementHandler") - self.assertIn('call_with_frame("StartElement"', entries[1][3]) + if sysconfig.is_python_build(): + self.assertIn('call_with_frame("StartElement"', entries[1][3]) # Test Current* members: -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 00:12:25 2014 From: python-checkins at python.org (donald.stufft) Date: Sat, 29 Nov 2014 23:12:25 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_PEP_481_-_Migrate_Some_Su?= =?utf-8?q?pporting_Repositories_to_Git_and_Github?= Message-ID: <20141129231225.116316.27726@psf.io> https://hg.python.org/peps/rev/f394fde562b2 changeset: 5626:f394fde562b2 user: Donald Stufft date: Sat Nov 29 18:12:06 2014 -0500 summary: Add PEP 481 - Migrate Some Supporting Repositories to Git and Github files: pep-0481.txt | 284 +++++++++++++++++++++++++++++++++++++++ 1 files changed, 284 insertions(+), 0 deletions(-) diff --git a/pep-0481.txt b/pep-0481.txt new file mode 100644 --- /dev/null +++ b/pep-0481.txt @@ -0,0 +1,284 @@ +PEP: 481 +Title: Migrate Some Supporting Repositories to Git and Github +Version: $Revision$ +Last-Modified: $Date$ +Author: Donald Stufft +Status: Draft +Type: Process +Content-Type: text/x-rst +Created: 29-Nov-2014 +Post-History: 29-Nov-2014 + + +Abstract +======== + +This PEP proposes migrating to Git and Github for certain supporting +repositories (such as the repository for Python Enhancement Proposals) in a way +that is more accessible to new contributors, and easier to manage for core +developers. This is offered as an alternative to PEP 474 which aims to achieve +the same overall benefits but while continuing to use the Mercurial DVCS and +without relying on a commerical entity. 
+ +In particular this PEP proposes changes to the following repositories: + +* https://hg.python.org/devguide/ +* https://hg.python.org/devinabox/ +* https://hg.python.org/peps/ + + +This PEP does not propose any changes to the core development workflow for +CPython itself. + + +Rationale +========= + +As PEP 474 mentions, there are currently a number of repositories hosted on +hg.python.org which are not directly used for the development of CPython but +instead are supporting or ancillary repositories. These supporting repositories +do not typically have complex workflows or often branches at all other than the +primary integration branch. This simplicity makes them very good targets for +the "Pull Request" workflow that is commonly found on sites like Github. + +However where PEP 474 wants to continue to use Mercurial and wishes to use an +OSS and self-hosted and therefore restricts itself to only those solutions this +PEP expands the scope of that to include migrating to Git and using Github. + +The existing method of contributing to these repositories generally includes +generating a patch and either uploading them to bugs.python.org or emailing +them to peps at python.org. This process is unfriendly towards non-comitter +contributors as well as making the process harder than it needs to be for +comitters to accept the patches sent by users. In addition to the benefits +in the pull request workflow itself, this style of workflow also enables +non techincal contributors, especially those who do not know their way around +the DVCS of choice, to contribute using the web based editor. On the committer +side the Pull Requests enable them to tell, before merging, whether or not +a particular Pull Request will break anything. It also enables them to do a +simple "push button" merge which does not require them to check out the +changes locally. Another such feature that is useful in particular for docs, +is the ability to view a "prose" diff. This Github specific feature enables +a committer to view a diff of the rendered output which will hide things like +reformatting a paragraph and show you what the actual "meat" of the change +actually is. + + +Why Git? +-------- + +Looking at the variety of DVCS which are available today it becomes fairly +clear that git has gotten the vast mindshare of people who are currently using +it. The Open Hub (Previously Ohloh) statistics [#openhub-stats]_ show that +currently 37% of the repositories Open Hub is indexing is using git which is +second only to SVN (which has 48%) while Mercurial has just 2% of the indexed +repositories (beating only bazaar which has 1%). In additon to the Open Hub +statistics a look at the top 100 projects on PyPI (ordered by total download +counts) shows us that within the Python space itself there is a majority of +projects using git: + +=== ========= ========== ====== === ==== +Git Mercurial Subversion Bazaar CVS None +=== ========= ========== ====== === ==== +62 22 7 4 1 1 +=== ========= ========== ====== === ==== + + +Chosing a DVCS which has the larger mindshare will make it more likely that any +particular person who has experience with DVCS at all will be able to +meaningfully use the DVCS that we have chosen without having to learn a new +tool. 
+ +In addition to simply making it more likely that any individual will already +know how to use git, the number of projects and people using it means that the +resources for learning the tool are likely to be more fully fleshed out and +when you run into problems the liklihood that someone else had that problem +and posted a question and recieved an answer is also far likelier. + +Thirdly by using a more popular tool you also increase your options for tooling +*around* the DVCS itself. Looking at the various options for hosting +repositories it's extremely rare to find a hosting solution (whether OSS or +commerical) that supports Mercurial but does not support Git, on the flip side +there are a number of tools which support Git but do not support Mercurial. +Therefore the popularity of git increases the flexibility of our options going +into the future for what toolchain these projects use. + +Also by moving to the more popular DVCS we increase the likelhood that the +knowledge that the person has learned in contributing to these support +repositories will transfer to projects outside of the immediate CPython project +such as to the larger Python community which is primarily using Git hosted on +Github. + +In previous years there was concern about how well supported git was on Windows +in comparison to Mercurial. However git has grown to support Windows as a first +class citizen. In addition to that, for Windows users who are not well aquanted +with the Windows command line there are GUI options as well. + +On a techincal level git and Mercurial are fairly similar, however the git +branching model is signifcantly better than Mercurial "Named Branches" for +non-comitter contributors. Mercurial does have a "Bookmarks" extension however +this isn't quite as good as git's branching model. All bookmarks live in the +same namespace so it requires individual users to ensure that they namespace +the branchnames themselves lest the risk collision. It also is an extension +which requires new users to first discover they need an extension at all and +then figure out what they need to do in order to enable that extension. Since +it is an extension it also means that in general support for them outside of +Mercurial core is going to be less than 100% in comparison to git where the +feature is built in and core to using git at all. Finally users who are not +used to Mercurial are unlikely to discover bookmarks on their own, instead they +will likely attempt to use Mercurial's "Named Branches" which, given the fact +they live "forever", are not often what a project wants their contributors to +use. + + +Why Github? +----------- + +There are a number of software projects or web services which offer +functionality similar to that of Github. These range from commerical web +services such as a Bitbucket to self-hosted OSS solutions such as Kallithea or +Gitlab. This PEP proposes that we move these repositories to Github. + +There are two primary reasons for selecting Github: Popularity and +Quality/Polish. + +Github is currently the most popular hosted repository hosting according to +Alexa where it currently has a global rank of 121. Much like for Git itself by +choosing the most popular tool we gain benefits in increasing the likelhood +that a new contributor will have already experienced the toolchain, the quality +and availablity of the help, more and better tooling being built around it, and +the knowledge transfer to other projects. 
A look again at the top 100 projects +by download counts on PyPI shows the following hosting locations: + +====== ========= =========== ========= =========== ========== +GitHub BitBucket Google Code Launchpad SourceForge Other/Self +====== ========= =========== ========= =========== ========== +62 18 6 4 3 7 +====== ========= =========== ========= =========== ========== + +In addition to all of those reasons, Github also has the benefit that while +many of the options have similar features when you look at them in a feature +matrix the Github version of each of those features tend to work better and be +far more polished. This is hard to quantify objectively however it is a fairly +common sentiment if you go around and ask people who are using these services +often. + +Finally a reason to choose a web service at all over something that is +self-hosted is to be able to more efficiently use volunteer time and donated +resources. Every additional service hosted on the PSF infrastruture by the +PSF infrastructure team further spreads out the amount of time that the +volunteers on that team have to spend and uses some chunk of resources that +could potentionally be used for something where there is no free or affordable +hosted solution available. + +One concern that people do have with using a hosted service is that there is a +lack of control and that at some point in the future the service may no longer +be suitable. It is the opinion of this PEP that Github does not currently and +has not in the past engaged in any attempts to lock people into their platform +and that if at some point in the future Github is no longer suitable for one +reason or another than at that point we can look at migrating away from Github +onto a different solution. In other words, we'll cross that bridge if and when +we come to it. + + +Example: Scientific Python +-------------------------- + +One of the key ideas behind the move to both git and Github is that a feature +of a DVCS, the repository hosting, and the workflow used is the social network +and size of the community using said tools. We can see this is true by looking +at an example from a sub-community of the Python community: The Scientific +Python community. They have already migrated most of the key pieces of the +SciPy stack onto Github using the Pull Request based workflow starting with +IPython and as more projects moved over it became a natural default for new +projects. + +They claim to have seen a great benefit from this move, where it enables casual +contributors to easily move between different projects within their +sub-community without having to learn a special, bespoke workflow and a +different toolchain for each project. They've found that when people can use +their limited time on actually contributing instead of learning the different +tools and workflows that not only do they contribute more to one project, that +they also expand out and contribute to other projects. This move is also +attributed to making it commonplace for members of that community to go so far +as publishing their research and educational materials on Github as well. + +This showcases the real power behind moving to a highly popular toolchain and +workflow, as each variance introduces yet another hurdle for new and casual +contributors to get past and it makes the time spent learning that workflow +less reusable with other projects. 
+ + +Migration +========= + +Through the use of hg-git [#hg-git]_ we can easily convert a Mercurial +repository to a Git repository by simply pushing the Mercurial repository to +the Git repository. People who wish to continue to use Mercurual locally can +then use hg-git going into the future using the new Github URL, however they +will need to re-clone their repositories as using Git as the server seems to +trigger a one time change of the changeset ids. + +As none of the selected repositories have any tags, branches, or bookmarks +other than the ``default`` branch the migration will simply map the ``default`` +branch in Mercurial to the ``master`` branch in git. + +In addition since none of the selected projects have any great need of a +complex bug tracker, they will also migrate their issue handling to using the +GitHub issues. + +In addition to the migration of the repository hosting itself there are a +number of locations for each particular repository which will require updating. +The bulk of these will simply be changing commands from the hg equivilant to +the git equivilant. + +In particular this will include: + +* Updating www.python.org to generate PEPs using a git clone and link to + Github. +* Updating docs.python.org to pull from Github instead of hg.python.org for the + devguide. +* Enabling the ability to send an email to python-checkins at python.org for each + push. +* Enabling the ability to send an IRC message to #python-dev on Freenode for + each push. +* Migrate any issues for these projects to their respective bug tracker on + Github. + +This will restore these repositories to similar functionality as they currently +have. In addition to this the migration will also include enabling testing for +each pull request using Travis CI [#travisci]_ where possible to ensure that +a new PR does not break the ability to render the documentation or PEPs. + + +User Access +=========== + +Moving to Github would involve adding an additional user account that will need +to be managed, however it also offers finer grained control, allowing the +ability to grant someone access to only one particular repository instead of +the coarser grained ACLs available on hg.python.org. + + +References +========== + +.. [#openhub-stats] `Open Hub Statistics ` +.. [#hg-git] `hg-git ` +.. [#travisci] `Travis CI ` + + +Copyright +========= + +This document has been placed in the public domain. + + + +.. + Local Variables: + mode: indented-text + indent-tabs-mode: nil + sentence-end-double-space: t + fill-column: 70 + coding: utf-8 + End: -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 01:21:28 2014 From: python-checkins at python.org (donald.stufft) Date: Sun, 30 Nov 2014 00:21:28 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Some_gramatical_fixes_and_sli?= =?utf-8?q?ght_rewordings?= Message-ID: <20141130002127.84303.84705@psf.io> https://hg.python.org/peps/rev/6c6947dbd13f changeset: 5627:6c6947dbd13f user: Donald Stufft date: Sat Nov 29 19:21:23 2014 -0500 summary: Some gramatical fixes and slight rewordings files: pep-0481.txt | 117 +++++++++++++++++++-------------------- 1 files changed, 57 insertions(+), 60 deletions(-) diff --git a/pep-0481.txt b/pep-0481.txt --- a/pep-0481.txt +++ b/pep-0481.txt @@ -41,23 +41,22 @@ primary integration branch. This simplicity makes them very good targets for the "Pull Request" workflow that is commonly found on sites like Github. 
-However where PEP 474 wants to continue to use Mercurial and wishes to use an -OSS and self-hosted and therefore restricts itself to only those solutions this -PEP expands the scope of that to include migrating to Git and using Github. +However whereas PEP 474 proposes to continue to use Mercurial and restricts +itself to only solutions which are OSS and self-hosted, this PEP expands the +scope of that to include migrating to Git and using Github. The existing method of contributing to these repositories generally includes generating a patch and either uploading them to bugs.python.org or emailing them to peps at python.org. This process is unfriendly towards non-comitter -contributors as well as making the process harder than it needs to be for -comitters to accept the patches sent by users. In addition to the benefits -in the pull request workflow itself, this style of workflow also enables -non techincal contributors, especially those who do not know their way around -the DVCS of choice, to contribute using the web based editor. On the committer -side the Pull Requests enable them to tell, before merging, whether or not +contributors as well as cumbersome for comitters seeking to accept the patches +sent by users. In contrast, the Pull Request workflow style enables non +techincal contributors, especially those who do not know their way around the +DVCS of choice, to contribute using the web based editor. On the committer +side, the Pull Requests enable them to tell, before merging, whether or not a particular Pull Request will break anything. It also enables them to do a simple "push button" merge which does not require them to check out the changes locally. Another such feature that is useful in particular for docs, -is the ability to view a "prose" diff. This Github specific feature enables +is the ability to view a "prose" diff. This Github-specific feature enables a committer to view a diff of the rendered output which will hide things like reformatting a paragraph and show you what the actual "meat" of the change actually is. @@ -66,15 +65,14 @@ Why Git? -------- -Looking at the variety of DVCS which are available today it becomes fairly -clear that git has gotten the vast mindshare of people who are currently using -it. The Open Hub (Previously Ohloh) statistics [#openhub-stats]_ show that -currently 37% of the repositories Open Hub is indexing is using git which is -second only to SVN (which has 48%) while Mercurial has just 2% of the indexed -repositories (beating only bazaar which has 1%). In additon to the Open Hub -statistics a look at the top 100 projects on PyPI (ordered by total download -counts) shows us that within the Python space itself there is a majority of -projects using git: +Looking at the variety of DVCS which are available today, it becomes fairly +clear that git has the largest mindshare. The Open Hub (Previously Ohloh) +statistics [#openhub-stats]_ show that currently 37% of the repositories +indexed by Open Hub are using git which is second only to SVN (which has 48%), +while Mercurial has just 2% of the indexed repositories (beating only bazaar +which has 1%). In additon to the Open Hub statistics, a look at the top 100 +projects on PyPI (ordered by total download counts) shows that within the +Python space itself, the majority of projects use git. 
=== ========= ========== ====== === ==== Git Mercurial Subversion Bazaar CVS None @@ -85,49 +83,47 @@ Chosing a DVCS which has the larger mindshare will make it more likely that any particular person who has experience with DVCS at all will be able to -meaningfully use the DVCS that we have chosen without having to learn a new -tool. +meaningfully contribute without having to learn a new tool. In addition to simply making it more likely that any individual will already know how to use git, the number of projects and people using it means that the -resources for learning the tool are likely to be more fully fleshed out and -when you run into problems the liklihood that someone else had that problem +resources for learning the tool are likely to be more fully fleshed out. +When you run into problems, the liklihood that someone else had that problem and posted a question and recieved an answer is also far likelier. -Thirdly by using a more popular tool you also increase your options for tooling -*around* the DVCS itself. Looking at the various options for hosting -repositories it's extremely rare to find a hosting solution (whether OSS or -commerical) that supports Mercurial but does not support Git, on the flip side +Thirdly, by using a more popular tool you also increase your options for +tooling *around* the DVCS itself. Looking at the various options for hosting +repositories, it's extremely rare to find a hosting solution (whether OSS or +commerical) that supports Mercurial but does not support Git. On the flip side, there are a number of tools which support Git but do not support Mercurial. Therefore the popularity of git increases the flexibility of our options going into the future for what toolchain these projects use. -Also by moving to the more popular DVCS we increase the likelhood that the +Also, by moving to the more popular DVCS, we increase the likelhood that the knowledge that the person has learned in contributing to these support repositories will transfer to projects outside of the immediate CPython project such as to the larger Python community which is primarily using Git hosted on Github. In previous years there was concern about how well supported git was on Windows -in comparison to Mercurial. However git has grown to support Windows as a first -class citizen. In addition to that, for Windows users who are not well aquanted -with the Windows command line there are GUI options as well. +in comparison to Mercurial. However, git has grown to support Windows as a +first class citizen. In addition to that, for Windows users who are not well +aquanted with the Windows command line, there are GUI options as well. On a techincal level git and Mercurial are fairly similar, however the git branching model is signifcantly better than Mercurial "Named Branches" for -non-comitter contributors. Mercurial does have a "Bookmarks" extension however +non-comitter contributors. Mercurial does have a "Bookmarks" extension, however this isn't quite as good as git's branching model. All bookmarks live in the same namespace so it requires individual users to ensure that they namespace the branchnames themselves lest the risk collision. It also is an extension -which requires new users to first discover they need an extension at all and -then figure out what they need to do in order to enable that extension. 
Since -it is an extension it also means that in general support for them outside of -Mercurial core is going to be less than 100% in comparison to git where the -feature is built in and core to using git at all. Finally users who are not -used to Mercurial are unlikely to discover bookmarks on their own, instead they -will likely attempt to use Mercurial's "Named Branches" which, given the fact -they live "forever", are not often what a project wants their contributors to -use. +which requires new users to first discover they need an extension at all, and +then figure out what they need to do in order to enable that extension. Since, +in contrast to the branching feature in git, this feature is a Mercurial +extension, in general, its support outside the Mercurial core is less +extensive. Finally, users who are not used to Mercurial are unlikely to +discover bookmarks on their own, instead they will likely attempt to use +Mercurial's "Named Branches" which, given the fact they live "forever", are not +often what a project wants their contributors to use. Why Github? @@ -142,8 +138,8 @@ Quality/Polish. Github is currently the most popular hosted repository hosting according to -Alexa where it currently has a global rank of 121. Much like for Git itself by -choosing the most popular tool we gain benefits in increasing the likelhood +Alexa, where it currently has a global rank of 121. Much like for Git itself, +by choosing the most popular tool we gain benefits in increasing the likelhood that a new contributor will have already experienced the toolchain, the quality and availablity of the help, more and better tooling being built around it, and the knowledge transfer to other projects. A look again at the top 100 projects @@ -162,7 +158,7 @@ common sentiment if you go around and ask people who are using these services often. -Finally a reason to choose a web service at all over something that is +Finally, a reason to choose a web service at all over something that is self-hosted is to be able to more efficiently use volunteer time and donated resources. Every additional service hosted on the PSF infrastruture by the PSF infrastructure team further spreads out the amount of time that the @@ -175,7 +171,7 @@ be suitable. It is the opinion of this PEP that Github does not currently and has not in the past engaged in any attempts to lock people into their platform and that if at some point in the future Github is no longer suitable for one -reason or another than at that point we can look at migrating away from Github +reason or another, then at that point we can look at migrating away from Github onto a different solution. In other words, we'll cross that bridge if and when we come to it. @@ -188,24 +184,25 @@ and size of the community using said tools. We can see this is true by looking at an example from a sub-community of the Python community: The Scientific Python community. They have already migrated most of the key pieces of the -SciPy stack onto Github using the Pull Request based workflow starting with -IPython and as more projects moved over it became a natural default for new -projects. +SciPy stack onto Github using the Pull Request based workflow. This process +started with IPython, and as more projects moved over it became a natural +default for new projects in the community. 
-They claim to have seen a great benefit from this move, where it enables casual -contributors to easily move between different projects within their +They claim to have seen a great benefit from this move, in that it enables +casual contributors to easily move between different projects within their sub-community without having to learn a special, bespoke workflow and a different toolchain for each project. They've found that when people can use their limited time on actually contributing instead of learning the different -tools and workflows that not only do they contribute more to one project, that -they also expand out and contribute to other projects. This move is also -attributed to making it commonplace for members of that community to go so far -as publishing their research and educational materials on Github as well. +tools and workflows that, not only do they contribute more to one project, but +that they also expand out and contribute to other projects. This move has also +been attributed to the increased tendency for members of that community to go +so far as publishing their research and educational materials on Github as +well. -This showcases the real power behind moving to a highly popular toolchain and -workflow, as each variance introduces yet another hurdle for new and casual -contributors to get past and it makes the time spent learning that workflow -less reusable with other projects. +This example showcases the real power behind moving to a highly popular +toolchain and workflow, as each variance introduces yet another hurdle for new +and casual contributors to get past and it makes the time spent learning that +workflow less reusable with other projects. Migration @@ -214,7 +211,7 @@ Through the use of hg-git [#hg-git]_ we can easily convert a Mercurial repository to a Git repository by simply pushing the Mercurial repository to the Git repository. People who wish to continue to use Mercurual locally can -then use hg-git going into the future using the new Github URL, however they +then use hg-git going into the future using the new Github URL. However they will need to re-clone their repositories as using Git as the server seems to trigger a one time change of the changeset ids. @@ -222,7 +219,7 @@ other than the ``default`` branch the migration will simply map the ``default`` branch in Mercurial to the ``master`` branch in git. -In addition since none of the selected projects have any great need of a +In addition, since none of the selected projects have any great need of a complex bug tracker, they will also migrate their issue handling to using the GitHub issues. -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 04:01:32 2014 From: python-checkins at python.org (guido.van.rossum) Date: Sun, 30 Nov 2014 03:01:32 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_PEP_8_section_on_string_quote?= =?utf-8?q?s_by_Akira_Li=2E?= Message-ID: <20141130030129.84297.25841@psf.io> https://hg.python.org/peps/rev/d3d6128fa91e changeset: 5628:d3d6128fa91e user: Guido van Rossum date: Sat Nov 29 19:01:24 2014 -0800 summary: PEP 8 section on string quotes by Akira Li. files: pep-0008.txt | 13 +++++++++++++ 1 files changed, 13 insertions(+), 0 deletions(-) diff --git a/pep-0008.txt b/pep-0008.txt --- a/pep-0008.txt +++ b/pep-0008.txt @@ -390,6 +390,19 @@ public and internal interfaces still apply. +String Quotes +============= + +In Python, single-quoted strings and double-quoted strings are the +same. 
This PEP do not make a recommendation for this. Pick a rule +and stick to it. When a string contains single or double quote +characters, however, use the other one to avoid backslashes in the +string. It improves readability. + +For triple-quoted strings, always use double quote characters to be +consistent with the docstring convention in PEP 257. + + Whitespace in Expressions and Statements ======================================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 04:02:41 2014 From: python-checkins at python.org (guido.van.rossum) Date: Sun, 30 Nov 2014 03:02:41 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Last_patch_was_by_Akira_Kitad?= =?utf-8?q?a=2C_not_Akira_Li=2E?= Message-ID: <20141130030240.126788.48691@psf.io> https://hg.python.org/peps/rev/c9cd9f3cc044 changeset: 5629:c9cd9f3cc044 user: Guido van Rossum date: Sat Nov 29 19:02:36 2014 -0800 summary: Last patch was by Akira Kitada, not Akira Li. files: pep-0008.txt | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/pep-0008.txt b/pep-0008.txt --- a/pep-0008.txt +++ b/pep-0008.txt @@ -397,7 +397,7 @@ same. This PEP do not make a recommendation for this. Pick a rule and stick to it. When a string contains single or double quote characters, however, use the other one to avoid backslashes in the -string. It improves readability. +string. It improves readability. For triple-quoted strings, always use double quote characters to be consistent with the docstring convention in PEP 257. -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 04:57:22 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 03:57:22 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_add_context_pa?= =?utf-8?q?rameter_to_xmlrpclib=2EServerProxy_=28=2322960=29?= Message-ID: <20141130035722.84297.90825@psf.io> https://hg.python.org/cpython/rev/62bd574e95d5 changeset: 93657:62bd574e95d5 branch: 2.7 parent: 93636:1ac5aec658f6 user: Benjamin Peterson date: Sat Nov 29 22:55:35 2014 -0500 summary: add context parameter to xmlrpclib.ServerProxy (#22960) Patch from Alex Gaynor. files: Doc/library/xmlrpclib.rst | 11 ++++++++--- Lib/xmlrpclib.py | 10 +++++++--- Misc/NEWS | 11 +++++++++++ 3 files changed, 26 insertions(+), 6 deletions(-) diff --git a/Doc/library/xmlrpclib.rst b/Doc/library/xmlrpclib.rst --- a/Doc/library/xmlrpclib.rst +++ b/Doc/library/xmlrpclib.rst @@ -39,7 +39,7 @@ For https URIs, :mod:`xmlrpclib` now performs all the necessary certificate and hostname checks by default -.. class:: ServerProxy(uri[, transport[, encoding[, verbose[, allow_none[, use_datetime]]]]]) +.. class:: ServerProxy(uri[, transport[, encoding[, verbose[, allow_none[, use_datetime[, context]]]]]]) A :class:`ServerProxy` instance is an object that manages communication with a remote XML-RPC server. The required first argument is a URI (Uniform Resource @@ -57,11 +57,13 @@ :class:`datetime.datetime` objects may be passed to calls. Both the HTTP and HTTPS transports support the URL syntax extension for HTTP - Basic Authentication: ``http://user:pass at host:port/path``. The ``user:pass`` + Basic Authentication: ``http://user:pass at host:port/path``. The ``user:pass`` portion will be base64-encoded as an HTTP 'Authorization' header, and sent to the remote server as part of the connection process when invoking an XML-RPC method. You only need to use this if the remote server requires a Basic - Authentication user and password. 
+ Authentication user and password. If an HTTPS url is provided, *context* may + be :class:`ssl.SSLContext` and configures the SSL settings of the underlying + HTTPS connection. The returned instance is a proxy object with methods that can be used to invoke corresponding RPC calls on the remote server. If the remote server supports the @@ -131,6 +133,9 @@ *__dict__* attribute and don't have a base class that is marshalled in a special way. + .. versionchanged:: 2.7.9 + Added the *context* argument. + .. seealso:: diff --git a/Lib/xmlrpclib.py b/Lib/xmlrpclib.py --- a/Lib/xmlrpclib.py +++ b/Lib/xmlrpclib.py @@ -1478,6 +1478,10 @@ class SafeTransport(Transport): """Handles an HTTPS transaction to an XML-RPC server.""" + def __init__(self, use_datetime=0, context=None): + Transport.__init__(self, use_datetime=use_datetime) + self.context = context + # FIXME: mostly untested def make_connection(self, host): @@ -1493,7 +1497,7 @@ ) else: chost, self._extra_headers, x509 = self.get_host_info(host) - self._connection = host, HTTPS(chost, None, **(x509 or {})) + self._connection = host, HTTPS(chost, None, context=context, **(x509 or {})) return self._connection[1] ## @@ -1536,7 +1540,7 @@ """ def __init__(self, uri, transport=None, encoding=None, verbose=0, - allow_none=0, use_datetime=0): + allow_none=0, use_datetime=0, context=None): # establish a "logical" server connection if isinstance(uri, unicode): @@ -1553,7 +1557,7 @@ if transport is None: if type == "https": - transport = SafeTransport(use_datetime=use_datetime) + transport = SafeTransport(use_datetime=use_datetime, context=context) else: transport = Transport(use_datetime=use_datetime) self.__transport = transport diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -2,6 +2,17 @@ Python News +++++++++++ +What's New in Python 2.7.9? +=========================== + +*Release date: 2014-12-XX* + +Library +------- + +- Issue #22960: Add a context argument to xmlrpclib.ServerProxy. + + What's New in Python 2.7.9 release candidate 1? =============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 04:57:22 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 03:57:22 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMi43IC0+IDIuNyk6?= =?utf-8?q?_merge_2=2E7=2E9_release_branch?= Message-ID: <20141130035722.84303.63657@psf.io> https://hg.python.org/cpython/rev/f55ab5c2420f changeset: 93658:f55ab5c2420f branch: 2.7 parent: 93637:713e5814640d parent: 93657:62bd574e95d5 user: Benjamin Peterson date: Sat Nov 29 22:57:15 2014 -0500 summary: merge 2.7.9 release branch files: Doc/library/xmlrpclib.rst | 11 ++++++++--- Lib/xmlrpclib.py | 10 +++++++--- Misc/NEWS | 11 +++++++++++ 3 files changed, 26 insertions(+), 6 deletions(-) diff --git a/Doc/library/xmlrpclib.rst b/Doc/library/xmlrpclib.rst --- a/Doc/library/xmlrpclib.rst +++ b/Doc/library/xmlrpclib.rst @@ -39,7 +39,7 @@ For https URIs, :mod:`xmlrpclib` now performs all the necessary certificate and hostname checks by default -.. class:: ServerProxy(uri[, transport[, encoding[, verbose[, allow_none[, use_datetime]]]]]) +.. class:: ServerProxy(uri[, transport[, encoding[, verbose[, allow_none[, use_datetime[, context]]]]]]) A :class:`ServerProxy` instance is an object that manages communication with a remote XML-RPC server. The required first argument is a URI (Uniform Resource @@ -57,11 +57,13 @@ :class:`datetime.datetime` objects may be passed to calls. 
Both the HTTP and HTTPS transports support the URL syntax extension for HTTP - Basic Authentication: ``http://user:pass at host:port/path``. The ``user:pass`` + Basic Authentication: ``http://user:pass at host:port/path``. The ``user:pass`` portion will be base64-encoded as an HTTP 'Authorization' header, and sent to the remote server as part of the connection process when invoking an XML-RPC method. You only need to use this if the remote server requires a Basic - Authentication user and password. + Authentication user and password. If an HTTPS url is provided, *context* may + be :class:`ssl.SSLContext` and configures the SSL settings of the underlying + HTTPS connection. The returned instance is a proxy object with methods that can be used to invoke corresponding RPC calls on the remote server. If the remote server supports the @@ -131,6 +133,9 @@ *__dict__* attribute and don't have a base class that is marshalled in a special way. + .. versionchanged:: 2.7.9 + Added the *context* argument. + .. seealso:: diff --git a/Lib/xmlrpclib.py b/Lib/xmlrpclib.py --- a/Lib/xmlrpclib.py +++ b/Lib/xmlrpclib.py @@ -1478,6 +1478,10 @@ class SafeTransport(Transport): """Handles an HTTPS transaction to an XML-RPC server.""" + def __init__(self, use_datetime=0, context=None): + Transport.__init__(self, use_datetime=use_datetime) + self.context = context + # FIXME: mostly untested def make_connection(self, host): @@ -1493,7 +1497,7 @@ ) else: chost, self._extra_headers, x509 = self.get_host_info(host) - self._connection = host, HTTPS(chost, None, **(x509 or {})) + self._connection = host, HTTPS(chost, None, context=context, **(x509 or {})) return self._connection[1] ## @@ -1536,7 +1540,7 @@ """ def __init__(self, uri, transport=None, encoding=None, verbose=0, - allow_none=0, use_datetime=0): + allow_none=0, use_datetime=0, context=None): # establish a "logical" server connection if isinstance(uri, unicode): @@ -1553,7 +1557,7 @@ if transport is None: if type == "https": - transport = SafeTransport(use_datetime=use_datetime) + transport = SafeTransport(use_datetime=use_datetime, context=context) else: transport = Transport(use_datetime=use_datetime) self.__transport = transport diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -31,6 +31,17 @@ Wieland Hoffmann. +What's New in Python 2.7.9? +=========================== + +*Release date: 2014-12-XX* + +Library +------- + +- Issue #22960: Add a context argument to xmlrpclib.ServerProxy. + + What's New in Python 2.7.9 release candidate 1? 
=============================================== -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:06:26 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:06:26 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=282=2E7=29=3A_this_is_why_te?= =?utf-8?q?sts_are_great?= Message-ID: <20141130040626.84277.62484@psf.io> https://hg.python.org/cpython/rev/fee117d5c894 changeset: 93659:fee117d5c894 branch: 2.7 parent: 93657:62bd574e95d5 user: Benjamin Peterson date: Sat Nov 29 23:06:06 2014 -0500 summary: this is why tests are great files: Lib/xmlrpclib.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/xmlrpclib.py b/Lib/xmlrpclib.py --- a/Lib/xmlrpclib.py +++ b/Lib/xmlrpclib.py @@ -1497,7 +1497,7 @@ ) else: chost, self._extra_headers, x509 = self.get_host_info(host) - self._connection = host, HTTPS(chost, None, context=context, **(x509 or {})) + self._connection = host, HTTPS(chost, None, context=self.context, **(x509 or {})) return self._connection[1] ## -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:06:26 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:06:26 +0000 Subject: [Python-checkins] =?utf-8?b?Y3B5dGhvbiAobWVyZ2UgMi43IC0+IDIuNyk6?= =?utf-8?q?_merge_2=2E7=2E9_release_branch?= Message-ID: <20141130040626.126782.57435@psf.io> https://hg.python.org/cpython/rev/24f86799e9d3 changeset: 93660:24f86799e9d3 branch: 2.7 parent: 93658:f55ab5c2420f parent: 93659:fee117d5c894 user: Benjamin Peterson date: Sat Nov 29 23:06:22 2014 -0500 summary: merge 2.7.9 release branch files: Lib/xmlrpclib.py | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Lib/xmlrpclib.py b/Lib/xmlrpclib.py --- a/Lib/xmlrpclib.py +++ b/Lib/xmlrpclib.py @@ -1497,7 +1497,7 @@ ) else: chost, self._extra_headers, x509 = self.get_host_info(host) - self._connection = host, HTTPS(chost, None, context=context, **(x509 or {})) + self._connection = host, HTTPS(chost, None, context=self.context, **(x509 or {})) return self._connection[1] ## -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:34:34 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:34:34 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_add_context_pa?= =?utf-8?q?rameter_to_xmlrpclib=2EServerProxy_=28=2322960=29?= Message-ID: <20141130043434.126770.93330@psf.io> https://hg.python.org/cpython/rev/4b00430388ad changeset: 93661:4b00430388ad branch: 3.4 parent: 93655:e4b986350feb user: Benjamin Peterson date: Sat Nov 29 23:32:57 2014 -0500 summary: add context parameter to xmlrpclib.ServerProxy (#22960) Patch by Alex Gaynor. files: Doc/library/xmlrpc.client.rst | 9 +++++++-- Lib/xmlrpc/client.py | 15 ++++++++++++--- Misc/NEWS | 2 ++ 3 files changed, 21 insertions(+), 5 deletions(-) diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -34,7 +34,7 @@ .. class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ - use_builtin_types=False) + use_builtin_types=False, context=None) .. versionchanged:: 3.3 The *use_builtin_types* flag was added. @@ -63,7 +63,9 @@ portion will be base64-encoded as an HTTP 'Authorization' header, and sent to the remote server as part of the connection process when invoking an XML-RPC method. 
You only need to use this if the remote server requires a Basic - Authentication user and password. + Authentication user and password. If an HTTPS url is provided, *context* may + be :class:`ssl.SSLContext` and configures the SSL settings of the underlying + HTTPS connection. The returned instance is a proxy object with methods that can be used to invoke corresponding RPC calls on the remote server. If the remote server supports the @@ -127,6 +129,9 @@ :class:`Server` is retained as an alias for :class:`ServerProxy` for backwards compatibility. New code should use :class:`ServerProxy`. + .. versionchanged:: 3.4.3 + Added the *context* argument. + .. seealso:: diff --git a/Lib/xmlrpc/client.py b/Lib/xmlrpc/client.py --- a/Lib/xmlrpc/client.py +++ b/Lib/xmlrpc/client.py @@ -1323,6 +1323,11 @@ class SafeTransport(Transport): """Handles an HTTPS transaction to an XML-RPC server.""" + def __init__(self, use_datetime=False, use_builtin_types=False, *, + context=None): + super().__init__(use_datetime=use_datetime, use_builtin_types=use_builtin_types) + self.context = context + # FIXME: mostly untested def make_connection(self, host): @@ -1336,7 +1341,7 @@ # host may be a string, or a (host, x509-dict) tuple chost, self._extra_headers, x509 = self.get_host_info(host) self._connection = host, http.client.HTTPSConnection(chost, - None, **(x509 or {})) + None, context=self.context, **(x509 or {})) return self._connection[1] ## @@ -1379,7 +1384,8 @@ """ def __init__(self, uri, transport=None, encoding=None, verbose=False, - allow_none=False, use_datetime=False, use_builtin_types=False): + allow_none=False, use_datetime=False, use_builtin_types=False, + *, context=None): # establish a "logical" server connection # get the url @@ -1393,10 +1399,13 @@ if transport is None: if type == "https": handler = SafeTransport + extra_kwargs = {"context": context} else: handler = Transport + extra_kwargs = {} transport = handler(use_datetime=use_datetime, - use_builtin_types=use_builtin_types) + use_builtin_types=use_builtin_types, + **extra_kwargs) self.__transport = transport self.__encoding = encoding or 'utf-8' diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -36,6 +36,8 @@ Library ------- +- Issue #22960: Add a context argument to xmlrpclib.ServerProxy constructor. + - Issue #22915: SAX parser now supports files opened with file descriptor or bytes path. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:34:34 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:34:34 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjMjI5NjAp?= Message-ID: <20141130043434.84297.47166@psf.io> https://hg.python.org/cpython/rev/2a126ce6f83e changeset: 93662:2a126ce6f83e parent: 93656:4990157343c6 parent: 93661:4b00430388ad user: Benjamin Peterson date: Sat Nov 29 23:34:30 2014 -0500 summary: merge 3.4 (#22960) files: Doc/library/xmlrpc.client.rst | 11 ++++++++--- Lib/xmlrpc/client.py | 15 ++++++++++++--- Misc/NEWS | 2 ++ 3 files changed, 22 insertions(+), 6 deletions(-) diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -27,14 +27,14 @@ constructed data. If you need to parse untrusted or unauthenticated data see :ref:`xml-vulnerabilities`. -.. versionchanged:: 3.4.3 +.. 
versionchanged:: 3.5 For https URIs, :mod:`xmlrpc.client` now performs all the necessary certificate and hostname checks by default .. class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ - use_builtin_types=False) + use_builtin_types=False, context=None) .. versionchanged:: 3.3 The *use_builtin_types* flag was added. @@ -63,7 +63,9 @@ portion will be base64-encoded as an HTTP 'Authorization' header, and sent to the remote server as part of the connection process when invoking an XML-RPC method. You only need to use this if the remote server requires a Basic - Authentication user and password. + Authentication user and password. If an HTTPS url is provided, *context* may + be :class:`ssl.SSLContext` and configures the SSL settings of the underlying + HTTPS connection. The returned instance is a proxy object with methods that can be used to invoke corresponding RPC calls on the remote server. If the remote server supports the @@ -127,6 +129,9 @@ :class:`Server` is retained as an alias for :class:`ServerProxy` for backwards compatibility. New code should use :class:`ServerProxy`. + .. versionchanged:: 3.5 + Added the *context* argument. + .. seealso:: diff --git a/Lib/xmlrpc/client.py b/Lib/xmlrpc/client.py --- a/Lib/xmlrpc/client.py +++ b/Lib/xmlrpc/client.py @@ -1324,6 +1324,11 @@ class SafeTransport(Transport): """Handles an HTTPS transaction to an XML-RPC server.""" + def __init__(self, use_datetime=False, use_builtin_types=False, *, + context=None): + super().__init__(use_datetime=use_datetime, use_builtin_types=use_builtin_types) + self.context = context + # FIXME: mostly untested def make_connection(self, host): @@ -1337,7 +1342,7 @@ # host may be a string, or a (host, x509-dict) tuple chost, self._extra_headers, x509 = self.get_host_info(host) self._connection = host, http.client.HTTPSConnection(chost, - None, **(x509 or {})) + None, context=self.context, **(x509 or {})) return self._connection[1] ## @@ -1380,7 +1385,8 @@ """ def __init__(self, uri, transport=None, encoding=None, verbose=False, - allow_none=False, use_datetime=False, use_builtin_types=False): + allow_none=False, use_datetime=False, use_builtin_types=False, + *, context=None): # establish a "logical" server connection # get the url @@ -1394,10 +1400,13 @@ if transport is None: if type == "https": handler = SafeTransport + extra_kwargs = {"context": context} else: handler = Transport + extra_kwargs = {} transport = handler(use_datetime=use_datetime, - use_builtin_types=use_builtin_types) + use_builtin_types=use_builtin_types, + **extra_kwargs) self.__transport = transport self.__encoding = encoding or 'utf-8' diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,8 @@ Library ------- +- Issue #22960: Add a context argument to xmlrpclib.ServerProxy constructor. + - Issue #22389: Add contextlib.redirect_stderr(). - Issue #21356: Make ssl.RAND_egd() optional to support LibreSSL. 
The -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:38:26 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:38:26 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=283=2E4=29=3A_context_is_key?= =?utf-8?q?word-only?= Message-ID: <20141130043826.126766.33157@psf.io> https://hg.python.org/cpython/rev/086a21998db2 changeset: 93663:086a21998db2 branch: 3.4 parent: 93661:4b00430388ad user: Benjamin Peterson date: Sat Nov 29 23:38:17 2014 -0500 summary: context is keyword-only files: Doc/library/xmlrpc.client.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -34,7 +34,7 @@ .. class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ - use_builtin_types=False, context=None) + use_builtin_types=False, *, context=None) .. versionchanged:: 3.3 The *use_builtin_types* flag was added. -- Repository URL: https://hg.python.org/cpython From python-checkins at python.org Sun Nov 30 05:38:27 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 04:38:27 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40?= Message-ID: <20141130043827.116304.71758@psf.io> https://hg.python.org/cpython/rev/13e286c718cb changeset: 93664:13e286c718cb parent: 93662:2a126ce6f83e parent: 93663:086a21998db2 user: Benjamin Peterson date: Sat Nov 29 23:38:23 2014 -0500 summary: merge 3.4 files: Doc/library/xmlrpc.client.rst | 2 +- 1 files changed, 1 insertions(+), 1 deletions(-) diff --git a/Doc/library/xmlrpc.client.rst b/Doc/library/xmlrpc.client.rst --- a/Doc/library/xmlrpc.client.rst +++ b/Doc/library/xmlrpc.client.rst @@ -34,7 +34,7 @@ .. class:: ServerProxy(uri, transport=None, encoding=None, verbose=False, \ allow_none=False, use_datetime=False, \ - use_builtin_types=False, context=None) + use_builtin_types=False, *, context=None) .. versionchanged:: 3.3 The *use_builtin_types* flag was added. 
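
The changesets above add a *context* argument to ServerProxy in both branches
(xmlrpclib on 2.7.9, xmlrpc.client on 3.4.3/3.5, where it is keyword-only).
As a rough illustration only (not part of any changeset; the URL and CA file
are placeholders), the new argument would be used on Python 3.5 roughly like
this:

    import ssl
    import xmlrpc.client

    # Build an SSLContext that trusts a private CA (path is a placeholder).
    ctx = ssl.create_default_context(cafile="/path/to/private-ca.pem")

    # The context is handed to SafeTransport and from there to
    # http.client.HTTPSConnection, so it governs the TLS settings of the
    # XML-RPC connection.
    proxy = xmlrpc.client.ServerProxy("https://rpc.example.invalid/RPC2",
                                      context=ctx)

    # Remote calls now use the configured TLS settings, e.g.:
    # print(proxy.some_method())

On 2.7.9 the equivalent spelling is xmlrpclib.ServerProxy(uri, context=ctx).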
-- Repository URL: https://hg.python.org/cpython From solipsis at pitrou.net Sun Nov 30 10:33:26 2014 From: solipsis at pitrou.net (solipsis at pitrou.net) Date: Sun, 30 Nov 2014 10:33:26 +0100 Subject: [Python-checkins] Daily reference leaks (4990157343c6): sum=1 Message-ID: results for 4990157343c6 on branch "default" -------------------------------------------- test_collections leaked [-2, 0, 0] references, sum=-2 test_functools leaked [0, 0, 3] memory blocks, sum=3 Command line was: ['./python', '-m', 'test.regrtest', '-uall', '-R', '3:3:/home/antoine/cpython/refleaks/reflog2KIkcS', '-x'] From python-checkins at python.org Sun Nov 30 17:52:06 2014 From: python-checkins at python.org (benjamin.peterson) Date: Sun, 30 Nov 2014 16:52:06 +0000 Subject: [Python-checkins] =?utf-8?q?cpython_=28merge_3=2E4_-=3E_default?= =?utf-8?b?KTogbWVyZ2UgMy40ICgjOTE3OSk=?= Message-ID: <20141130165205.69799.64131@psf.io> https://hg.python.org/cpython/rev/f385bc6e6e09 changeset: 93666:f385bc6e6e09 parent: 93664:13e286c718cb parent: 93665:d1f7c3f45ffe user: Benjamin Peterson date: Sun Nov 30 11:51:16 2014 -0500 summary: merge 3.4 (#9179) files: Lib/re.py | 5 +-- Lib/sre_parse.py | 33 +++++++-------------------- Lib/test/test_re.py | 38 +-------------------------------- Misc/NEWS | 3 -- 4 files changed, 12 insertions(+), 67 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -351,11 +351,10 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: - gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), ])) - s.closegroup(gid, p[-1]) + s.groups = len(p)+1 p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -68,14 +68,12 @@ # master pattern object. 
keeps track of global attributes def __init__(self): self.flags = 0 + self.open = [] + self.groups = 1 self.groupdict = {} - self.subpatterns = [None] # group 0 - @property - def groups(self): - return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.subpatterns.append(None) + self.groups = gid + 1 if self.groups > MAXGROUPS: raise error("groups number is too large") if name is not None: @@ -84,11 +82,12 @@ raise error("redefinition of group name %r as group %d; " "was group %d" % (name, gid, ogid)) self.groupdict[name] = gid + self.open.append(gid) return gid - def closegroup(self, gid, p): - self.subpatterns[gid] = p + def closegroup(self, gid): + self.open.remove(gid) def checkgroup(self, gid): - return gid < self.groups and self.subpatterns[gid] is not None + return gid < self.groups and gid not in self.open class SubPattern: # a subpattern, in intermediate form @@ -184,21 +183,7 @@ elif op in _UNITCODES: lo = lo + 1 hi = hi + 1 - elif op is GROUPREF: - i, j = self.pattern.subpatterns[av].getwidth() - lo = lo + i - hi = hi + j - elif op is GROUPREF_EXISTS: - i, j = av[1].getwidth() - if av[2] is not None: - l, h = av[2].getwidth() - i = min(i, l) - j = max(j, h) - else: - i = 0 - lo = lo + i - hi = hi + j - elif op is SUCCESS: + elif op == SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -741,7 +726,7 @@ if not sourcematch(")"): raise source.error("unbalanced parenthesis") if group is not None: - state.closegroup(group, p) + state.closegroup(group) subpatternappend((SUBPATTERN, (group, p))) else: while True: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -589,7 +589,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_lookahead(self): + def test_non_consuming(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -603,42 +603,6 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") - # Group reference. - self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) - self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) - # Conditional group reference. - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) - # Group used before defined. - self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) - self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) - self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) - - def test_lookbehind(self): - self.assertTrue(re.match('ab(?<=b)c', 'abc')) - self.assertIsNone(re.match('ab(?<=c)c', 'abc')) - self.assertIsNone(re.match('ab(? 
https://hg.python.org/cpython/rev/961145c548e2 changeset: 93668:961145c548e2 branch: 2.7 parent: 93660:24f86799e9d3 parent: 93667:8a3807e15a1f user: Benjamin Peterson date: Sun Nov 30 11:51:48 2014 -0500 summary: merge 2.7.9 release branch files: Lib/re.py | 5 +-- Lib/sre_parse.py | 33 +++++++-------------------- Lib/test/test_re.py | 38 +-------------------------------- Misc/NEWS | 3 -- 4 files changed, 12 insertions(+), 67 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -312,11 +312,10 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: - gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), ])) - s.closegroup(gid, p[-1]) + s.groups = len(p)+1 p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -66,25 +66,24 @@ # master pattern object. keeps track of global attributes def __init__(self): self.flags = 0 + self.open = [] + self.groups = 1 self.groupdict = {} - self.subpatterns = [None] # group 0 - @property - def groups(self): - return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.subpatterns.append(None) + self.groups = gid + 1 if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: raise error, ("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid + self.open.append(gid) return gid - def closegroup(self, gid, p): - self.subpatterns[gid] = p + def closegroup(self, gid): + self.open.remove(gid) def checkgroup(self, gid): - return gid < self.groups and self.subpatterns[gid] is not None + return gid < self.groups and gid not in self.open class SubPattern: # a subpattern, in intermediate form @@ -179,21 +178,7 @@ elif op in UNITCODES: lo = lo + 1 hi = hi + 1 - elif op is GROUPREF: - i, j = self.pattern.subpatterns[av].getwidth() - lo = lo + i - hi = hi + j - elif op is GROUPREF_EXISTS: - i, j = av[1].getwidth() - if av[2] is not None: - l, h = av[2].getwidth() - i = min(i, l) - j = max(j, h) - else: - i = 0 - lo = lo + i - hi = hi + j - elif op is SUCCESS: + elif op == SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -672,7 +657,7 @@ if not sourcematch(")"): raise error, "unbalanced parenthesis" if group is not None: - state.closegroup(group, p) + state.closegroup(group) subpatternappend((SUBPATTERN, (group, p))) else: while 1: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -449,7 +449,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_lookahead(self): + def test_non_consuming(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -463,42 +463,6 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") - # Group reference. - self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) - self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) - # Conditional group reference. 
- self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) - # Group used before defined. - self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) - self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) - self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) - - def test_lookbehind(self): - self.assertTrue(re.match('ab(?<=b)c', 'abc')) - self.assertIsNone(re.match('ab(?<=c)c', 'abc')) - self.assertIsNone(re.match('ab(? https://hg.python.org/cpython/rev/8a3807e15a1f changeset: 93667:8a3807e15a1f branch: 2.7 parent: 93659:fee117d5c894 user: Benjamin Peterson date: Sun Nov 30 11:47:54 2014 -0500 summary: backout fac649bf2d10 (#9179) for further consideration files: Lib/re.py | 5 +-- Lib/sre_parse.py | 33 +++++++-------------------- Lib/test/test_re.py | 38 +-------------------------------- Misc/NEWS | 3 -- 4 files changed, 12 insertions(+), 67 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -312,11 +312,10 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: - gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), ])) - s.closegroup(gid, p[-1]) + s.groups = len(p)+1 p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -66,25 +66,24 @@ # master pattern object. 
keeps track of global attributes def __init__(self): self.flags = 0 + self.open = [] + self.groups = 1 self.groupdict = {} - self.subpatterns = [None] # group 0 - @property - def groups(self): - return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.subpatterns.append(None) + self.groups = gid + 1 if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: raise error, ("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid + self.open.append(gid) return gid - def closegroup(self, gid, p): - self.subpatterns[gid] = p + def closegroup(self, gid): + self.open.remove(gid) def checkgroup(self, gid): - return gid < self.groups and self.subpatterns[gid] is not None + return gid < self.groups and gid not in self.open class SubPattern: # a subpattern, in intermediate form @@ -179,21 +178,7 @@ elif op in UNITCODES: lo = lo + 1 hi = hi + 1 - elif op is GROUPREF: - i, j = self.pattern.subpatterns[av].getwidth() - lo = lo + i - hi = hi + j - elif op is GROUPREF_EXISTS: - i, j = av[1].getwidth() - if av[2] is not None: - l, h = av[2].getwidth() - i = min(i, l) - j = max(j, h) - else: - i = 0 - lo = lo + i - hi = hi + j - elif op is SUCCESS: + elif op == SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -672,7 +657,7 @@ if not sourcematch(")"): raise error, "unbalanced parenthesis" if group is not None: - state.closegroup(group, p) + state.closegroup(group) subpatternappend((SUBPATTERN, (group, p))) else: while 1: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -449,7 +449,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_lookahead(self): + def test_non_consuming(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -463,42 +463,6 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") - # Group reference. - self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) - self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) - # Conditional group reference. - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) - # Group used before defined. - self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) - self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) - self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) - - def test_lookbehind(self): - self.assertTrue(re.match('ab(?<=b)c', 'abc')) - self.assertIsNone(re.match('ab(?<=c)c', 'abc')) - self.assertIsNone(re.match('ab(? 
https://hg.python.org/cpython/rev/d1f7c3f45ffe changeset: 93665:d1f7c3f45ffe branch: 3.4 parent: 93663:086a21998db2 user: Benjamin Peterson date: Sun Nov 30 11:49:00 2014 -0500 summary: backout 9fcf4008b626 (#9179) for further consideration files: Lib/re.py | 5 +-- Lib/sre_parse.py | 33 +++++++-------------------- Lib/test/test_re.py | 38 +-------------------------------- Misc/NEWS | 3 -- 4 files changed, 12 insertions(+), 67 deletions(-) diff --git a/Lib/re.py b/Lib/re.py --- a/Lib/re.py +++ b/Lib/re.py @@ -352,11 +352,10 @@ s = sre_parse.Pattern() s.flags = flags for phrase, action in lexicon: - gid = s.opengroup() p.append(sre_parse.SubPattern(s, [ - (SUBPATTERN, (gid, sre_parse.parse(phrase, flags))), + (SUBPATTERN, (len(p)+1, sre_parse.parse(phrase, flags))), ])) - s.closegroup(gid, p[-1]) + s.groups = len(p)+1 p = sre_parse.SubPattern(s, [(BRANCH, (None, p))]) self.scanner = sre_compile.compile(p) def scan(self, string): diff --git a/Lib/sre_parse.py b/Lib/sre_parse.py --- a/Lib/sre_parse.py +++ b/Lib/sre_parse.py @@ -66,25 +66,24 @@ # master pattern object. keeps track of global attributes def __init__(self): self.flags = 0 + self.open = [] + self.groups = 1 self.groupdict = {} - self.subpatterns = [None] # group 0 - @property - def groups(self): - return len(self.subpatterns) def opengroup(self, name=None): gid = self.groups - self.subpatterns.append(None) + self.groups = gid + 1 if name is not None: ogid = self.groupdict.get(name, None) if ogid is not None: raise error("redefinition of group name %s as group %d; " "was group %d" % (repr(name), gid, ogid)) self.groupdict[name] = gid + self.open.append(gid) return gid - def closegroup(self, gid, p): - self.subpatterns[gid] = p + def closegroup(self, gid): + self.open.remove(gid) def checkgroup(self, gid): - return gid < self.groups and self.subpatterns[gid] is not None + return gid < self.groups and gid not in self.open class SubPattern: # a subpattern, in intermediate form @@ -182,21 +181,7 @@ elif op in UNITCODES: lo = lo + 1 hi = hi + 1 - elif op is GROUPREF: - i, j = self.pattern.subpatterns[av].getwidth() - lo = lo + i - hi = hi + j - elif op is GROUPREF_EXISTS: - i, j = av[1].getwidth() - if av[2] is not None: - l, h = av[2].getwidth() - i = min(i, l) - j = max(j, h) - else: - i = 0 - lo = lo + i - hi = hi + j - elif op is SUCCESS: + elif op == SUCCESS: break self.width = min(lo, MAXREPEAT - 1), min(hi, MAXREPEAT) return self.width @@ -724,7 +709,7 @@ if not sourcematch(")"): raise error("unbalanced parenthesis") if group is not None: - state.closegroup(group, p) + state.closegroup(group) subpatternappend((SUBPATTERN, (group, p))) else: while 1: diff --git a/Lib/test/test_re.py b/Lib/test/test_re.py --- a/Lib/test/test_re.py +++ b/Lib/test/test_re.py @@ -557,7 +557,7 @@ self.assertEqual(re.match("a.*b", "a\n\nb", re.DOTALL).group(0), "a\n\nb") - def test_lookahead(self): + def test_non_consuming(self): self.assertEqual(re.match("(a(?=\s[^a]))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[^a]*))", "a b").group(1), "a") self.assertEqual(re.match("(a(?=\s[abc]))", "a b").group(1), "a") @@ -571,42 +571,6 @@ self.assertEqual(re.match(r"(a)(?!\s\1)", "a b").group(1), "a") self.assertEqual(re.match(r"(a)(?!\s(abc|a))", "a b").group(1), "a") - # Group reference. - self.assertTrue(re.match(r'(a)b(?=\1)a', 'aba')) - self.assertIsNone(re.match(r'(a)b(?=\1)c', 'abac')) - # Conditional group reference. 
- self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(2)c|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(2)x|c))c', 'abc')) - self.assertIsNone(re.match('(?:(a)|(x))b(?=(?(1)b|x))c', 'abc')) - self.assertTrue(re.match('(?:(a)|(x))b(?=(?(1)c|x))c', 'abc')) - # Group used before defined. - self.assertTrue(re.match('(a)b(?=(?(2)x|c))(c)', 'abc')) - self.assertIsNone(re.match('(a)b(?=(?(2)b|x))(c)', 'abc')) - self.assertTrue(re.match('(a)b(?=(?(1)c|x))(c)', 'abc')) - - def test_lookbehind(self): - self.assertTrue(re.match('ab(?<=b)c', 'abc')) - self.assertIsNone(re.match('ab(?<=c)c', 'abc')) - self.assertIsNone(re.match('ab(? https://hg.python.org/peps/rev/baf5957cb698 changeset: 5631:baf5957cb698 parent: 5630:d31fe28e2766 parent: 5629:c9cd9f3cc044 user: Donald Stufft date: Sun Nov 30 12:27:25 2014 -0500 summary: merge files: pep-0008.txt | 13 +++++++++++++ 1 files changed, 13 insertions(+), 0 deletions(-) diff --git a/pep-0008.txt b/pep-0008.txt --- a/pep-0008.txt +++ b/pep-0008.txt @@ -390,6 +390,19 @@ public and internal interfaces still apply. +String Quotes +============= + +In Python, single-quoted strings and double-quoted strings are the +same. This PEP do not make a recommendation for this. Pick a rule +and stick to it. When a string contains single or double quote +characters, however, use the other one to avoid backslashes in the +string. It improves readability. + +For triple-quoted strings, always use double quote characters to be +consistent with the docstring convention in PEP 257. + + Whitespace in Expressions and Statements ======================================== -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 18:27:30 2014 From: python-checkins at python.org (donald.stufft) Date: Sun, 30 Nov 2014 17:27:30 +0000 Subject: [Python-checkins] =?utf-8?q?peps=3A_Add_a_read-only_mirror_and_re?= =?utf-8?q?move_the_techincal_arguments?= Message-ID: <20141130172729.69799.4306@psf.io> https://hg.python.org/peps/rev/d31fe28e2766 changeset: 5630:d31fe28e2766 parent: 5627:6c6947dbd13f user: Donald Stufft date: Sun Nov 30 12:27:06 2014 -0500 summary: Add a read-only mirror and remove the techincal arguments files: pep-0481.txt | 18 +++--------------- 1 files changed, 3 insertions(+), 15 deletions(-) diff --git a/pep-0481.txt b/pep-0481.txt --- a/pep-0481.txt +++ b/pep-0481.txt @@ -110,21 +110,6 @@ first class citizen. In addition to that, for Windows users who are not well aquanted with the Windows command line, there are GUI options as well. -On a techincal level git and Mercurial are fairly similar, however the git -branching model is signifcantly better than Mercurial "Named Branches" for -non-comitter contributors. Mercurial does have a "Bookmarks" extension, however -this isn't quite as good as git's branching model. All bookmarks live in the -same namespace so it requires individual users to ensure that they namespace -the branchnames themselves lest the risk collision. It also is an extension -which requires new users to first discover they need an extension at all, and -then figure out what they need to do in order to enable that extension. Since, -in contrast to the branching feature in git, this feature is a Mercurial -extension, in general, its support outside the Mercurial core is less -extensive. 
Finally, users who are not used to Mercurial are unlikely to -discover bookmarks on their own, instead they will likely attempt to use -Mercurial's "Named Branches" which, given the fact they live "forever", are not -often what a project wants their contributors to use. - Why Github? ----------- @@ -240,6 +225,9 @@ each push. * Migrate any issues for these projects to their respective bug tracker on Github. +* Use hg-git to provide a read-only mirror on hg.python.org which will enable + read-only uses of the hg.python.org instances of the specified repositories + to remain the same. This will restore these repositories to similar functionality as they currently have. In addition to this the migration will also include enabling testing for -- Repository URL: https://hg.python.org/peps From python-checkins at python.org Sun Nov 30 19:41:15 2014 From: python-checkins at python.org (serhiy.storchaka) Date: Sun, 30 Nov 2014 18:41:15 +0000 Subject: [Python-checkins] =?utf-8?q?cpython=3A_Issue_=2322902=3A_The_=22i?= =?utf-8?q?p=22_command_is_now_used_on_Linux_to_determine_MAC_address?= Message-ID: <20141130184114.116316.59514@psf.io> https://hg.python.org/cpython/rev/64bb01bce12c changeset: 93669:64bb01bce12c parent: 93666:f385bc6e6e09 user: Serhiy Storchaka date: Sun Nov 30 20:39:04 2014 +0200 summary: Issue #22902: The "ip" command is now used on Linux to determine MAC address in uuid.getnode(). Pach by Bruno Cauet. files: Lib/test/test_uuid.py | 6 ++++++ Lib/uuid.py | 11 +++++++++-- Misc/ACKS | 1 + Misc/NEWS | 3 +++ 4 files changed, 19 insertions(+), 2 deletions(-) diff --git a/Lib/test/test_uuid.py b/Lib/test/test_uuid.py --- a/Lib/test/test_uuid.py +++ b/Lib/test/test_uuid.py @@ -321,6 +321,12 @@ self.check_node(node, 'ifconfig') @unittest.skipUnless(os.name == 'posix', 'requires Posix') + def test_ip_getnode(self): + node = uuid._ip_getnode() + if node is not None: + self.check_node(node, 'ip') + + @unittest.skipUnless(os.name == 'posix', 'requires Posix') def test_arp_getnode(self): node = uuid._arp_getnode() if node is not None: diff --git a/Lib/uuid.py b/Lib/uuid.py --- a/Lib/uuid.py +++ b/Lib/uuid.py @@ -356,6 +356,13 @@ if mac: return mac +def _ip_getnode(): + """Get the hardware address on Unix by running ip.""" + # This works on Linux with iproute2. + mac = _find_mac('ip', 'link list', [b'link/ether'], lambda i: i+1) + if mac: + return mac + def _arp_getnode(): """Get the hardware address on Unix by running arp.""" import os, socket @@ -538,8 +545,8 @@ if sys.platform == 'win32': getters = [_windll_getnode, _netbios_getnode, _ipconfig_getnode] else: - getters = [_unixdll_getnode, _ifconfig_getnode, _arp_getnode, - _lanscan_getnode, _netstat_getnode] + getters = [_unixdll_getnode, _ifconfig_getnode, _ip_getnode, + _arp_getnode, _lanscan_getnode, _netstat_getnode] for getter in getters + [_random_getnode]: try: diff --git a/Misc/ACKS b/Misc/ACKS --- a/Misc/ACKS +++ b/Misc/ACKS @@ -217,6 +217,7 @@ Terry Carroll Edward Catmur Lorenzo M. Catucci +Bruno Cauet Donn Cave Charles Cazabon Jes?s Cea Avi?n diff --git a/Misc/NEWS b/Misc/NEWS --- a/Misc/NEWS +++ b/Misc/NEWS @@ -191,6 +191,9 @@ Library ------- +- Issue #22902: The "ip" command is now used on Linux to determine MAC address + in uuid.getnode(). Pach by Bruno Cauet. + - Issue #22960: Add a context argument to xmlrpclib.ServerProxy constructor. - Issue #22389: Add contextlib.redirect_stderr(). -- Repository URL: https://hg.python.org/cpython