[Python-checkins] cpython (merge 3.3 -> default): Issue #16564: Fixed a performance regression relative to Python 3.1 in the

serhiy.storchaka python-checkins at python.org
Sat Mar 16 21:56:40 CET 2013


http://hg.python.org/cpython/rev/9d458ded8304
changeset:   82705:9d458ded8304
parent:      82702:5da005db8166
parent:      82704:4b4dddd670d0
user:        Serhiy Storchaka <storchaka at gmail.com>
date:        Sat Mar 16 22:55:04 2013 +0200
summary:
  Issue #16564: Fixed a performance regression relative to Python 3.1 in the
caching of compiled regular expressions.

files:
  Lib/re.py |  30 ++++++++++++++++++++++++------
  Misc/NEWS |   3 +++
  2 files changed, 27 insertions(+), 6 deletions(-)


diff --git a/Lib/re.py b/Lib/re.py
--- a/Lib/re.py
+++ b/Lib/re.py
@@ -215,8 +215,8 @@
 
 def purge():
     "Clear the regular expression caches"
-    _compile.cache_clear()
-    _compile_repl.cache_clear()
+    _cache.clear()
+    _cache_repl.clear()
 
 def template(pattern, flags=0):
     "Compile a template pattern, returning a pattern object"
@@ -259,11 +259,18 @@
 # --------------------------------------------------------------------
 # internals
 
+_cache = {}
+_cache_repl = {}
+
 _pattern_type = type(sre_compile.compile("", 0))
 
- at functools.lru_cache(maxsize=512, typed=True)
+_MAXCACHE = 512
 def _compile(pattern, flags):
     # internal: compile pattern
+    try:
+        return _cache[type(pattern), pattern, flags]
+    except KeyError:
+        pass
     if isinstance(pattern, _pattern_type):
         if flags:
             raise ValueError(
@@ -271,12 +278,23 @@
         return pattern
     if not sre_compile.isstring(pattern):
         raise TypeError("first argument must be string or compiled pattern")
-    return sre_compile.compile(pattern, flags)
+    p = sre_compile.compile(pattern, flags)
+    if len(_cache) >= _MAXCACHE:
+        _cache.clear()
+    _cache[type(pattern), pattern, flags] = p
+    return p
 
- at functools.lru_cache(maxsize=512)
 def _compile_repl(repl, pattern):
     # internal: compile replacement pattern
-    return sre_parse.parse_template(repl, pattern)
+    try:
+        return _cache_repl[repl, pattern]
+    except KeyError:
+        pass
+    p = sre_parse.parse_template(repl, pattern)
+    if len(_cache_repl) >= _MAXCACHE:
+        _cache_repl.clear()
+    _cache_repl[repl, pattern] = p
+    return p
 
 def _expand(pattern, match, template):
     # internal: match.expand implementation hook
diff --git a/Misc/NEWS b/Misc/NEWS
--- a/Misc/NEWS
+++ b/Misc/NEWS
@@ -283,6 +283,9 @@
 Library
 -------
 
+- Issue #16564: Fixed a performance regression relative to Python 3.1 in the
+  caching of compiled regular expressions.
+
 - Added missing FeedParser and BytesFeedParser to email.parser.__all__.
 
 - Issue #17431: Fix missing import of BytesFeedParser in email.parser.

-- 
Repository URL: http://hg.python.org/cpython


More information about the Python-checkins mailing list