forked from pool/python312
383 lines
13 KiB
Diff
383 lines
13 KiB
Diff
|
|
From 122a417f8000eb904a3cac9aacf4de8d288d7148 Mon Sep 17 00:00:00 2001
|
||
|
|
From: Serhiy Storchaka <storchaka@gmail.com>
|
||
|
|
Date: Fri, 31 Oct 2025 15:49:51 +0200
|
||
|
|
Subject: [PATCH 1/2] [3.12] gh-136065: Fix quadratic complexity in
|
||
|
|
os.path.expandvars() (GH-134952) (cherry picked from commit
|
||
|
|
f029e8db626ddc6e3a3beea4eff511a71aaceb5c)
|
||
|
|
MIME-Version: 1.0
|
||
|
|
Content-Type: text/plain; charset=UTF-8
|
||
|
|
Content-Transfer-Encoding: 8bit
|
||
|
|
|
||
|
|
Co-authored-by: Serhiy Storchaka <storchaka@gmail.com>
|
||
|
|
Co-authored-by: Łukasz Langa <lukasz@langa.pl>
|
||
|
|
---
|
||
|
|
Lib/ntpath.py | 126 ++++++------------
|
||
|
|
Lib/posixpath.py | 43 +++---
|
||
|
|
Lib/test/test_genericpath.py | 14 ++
|
||
|
|
Lib/test/test_ntpath.py | 22 ++-
|
||
|
|
...-05-30-22-33-27.gh-issue-136065.bu337o.rst | 1 +
|
||
|
|
5 files changed, 93 insertions(+), 113 deletions(-)
|
||
|
|
create mode 100644 Misc/NEWS.d/next/Security/2025-05-30-22-33-27.gh-issue-136065.bu337o.rst
|
||
|
|
|
||
|
|
diff --git a/Lib/ntpath.py b/Lib/ntpath.py
|
||
|
|
index 1bef630bd9c0ff..393d358b0afb8c 100644
|
||
|
|
--- a/Lib/ntpath.py
|
||
|
|
+++ b/Lib/ntpath.py
|
||
|
|
@@ -409,17 +409,23 @@ def expanduser(path):
|
||
|
|
# XXX With COMMAND.COM you can use any characters in a variable name,
|
||
|
|
# XXX except '^|<>='.
|
||
|
|
|
||
|
|
+_varpattern = r"'[^']*'?|%(%|[^%]*%?)|\$(\$|[-\w]+|\{[^}]*\}?)"
|
||
|
|
+_varsub = None
|
||
|
|
+_varsubb = None
|
||
|
|
+
|
||
|
|
def expandvars(path):
|
||
|
|
"""Expand shell variables of the forms $var, ${var} and %var%.
|
||
|
|
|
||
|
|
Unknown variables are left unchanged."""
|
||
|
|
path = os.fspath(path)
|
||
|
|
+ global _varsub, _varsubb
|
||
|
|
if isinstance(path, bytes):
|
||
|
|
if b'$' not in path and b'%' not in path:
|
||
|
|
return path
|
||
|
|
- import string
|
||
|
|
- varchars = bytes(string.ascii_letters + string.digits + '_-', 'ascii')
|
||
|
|
- quote = b'\''
|
||
|
|
+ if not _varsubb:
|
||
|
|
+ import re
|
||
|
|
+ _varsubb = re.compile(_varpattern.encode(), re.ASCII).sub
|
||
|
|
+ sub = _varsubb
|
||
|
|
percent = b'%'
|
||
|
|
brace = b'{'
|
||
|
|
rbrace = b'}'
|
||
|
|
@@ -428,94 +434,44 @@ def expandvars(path):
|
||
|
|
else:
|
||
|
|
if '$' not in path and '%' not in path:
|
||
|
|
return path
|
||
|
|
- import string
|
||
|
|
- varchars = string.ascii_letters + string.digits + '_-'
|
||
|
|
- quote = '\''
|
||
|
|
+ if not _varsub:
|
||
|
|
+ import re
|
||
|
|
+ _varsub = re.compile(_varpattern, re.ASCII).sub
|
||
|
|
+ sub = _varsub
|
||
|
|
percent = '%'
|
||
|
|
brace = '{'
|
||
|
|
rbrace = '}'
|
||
|
|
dollar = '$'
|
||
|
|
environ = os.environ
|
||
|
|
- res = path[:0]
|
||
|
|
- index = 0
|
||
|
|
- pathlen = len(path)
|
||
|
|
- while index < pathlen:
|
||
|
|
- c = path[index:index+1]
|
||
|
|
- if c == quote: # no expansion within single quotes
|
||
|
|
- path = path[index + 1:]
|
||
|
|
- pathlen = len(path)
|
||
|
|
- try:
|
||
|
|
- index = path.index(c)
|
||
|
|
- res += c + path[:index + 1]
|
||
|
|
- except ValueError:
|
||
|
|
- res += c + path
|
||
|
|
- index = pathlen - 1
|
||
|
|
- elif c == percent: # variable or '%'
|
||
|
|
- if path[index + 1:index + 2] == percent:
|
||
|
|
- res += c
|
||
|
|
- index += 1
|
||
|
|
- else:
|
||
|
|
- path = path[index+1:]
|
||
|
|
- pathlen = len(path)
|
||
|
|
- try:
|
||
|
|
- index = path.index(percent)
|
||
|
|
- except ValueError:
|
||
|
|
- res += percent + path
|
||
|
|
- index = pathlen - 1
|
||
|
|
- else:
|
||
|
|
- var = path[:index]
|
||
|
|
- try:
|
||
|
|
- if environ is None:
|
||
|
|
- value = os.fsencode(os.environ[os.fsdecode(var)])
|
||
|
|
- else:
|
||
|
|
- value = environ[var]
|
||
|
|
- except KeyError:
|
||
|
|
- value = percent + var + percent
|
||
|
|
- res += value
|
||
|
|
- elif c == dollar: # variable or '$$'
|
||
|
|
- if path[index + 1:index + 2] == dollar:
|
||
|
|
- res += c
|
||
|
|
- index += 1
|
||
|
|
- elif path[index + 1:index + 2] == brace:
|
||
|
|
- path = path[index+2:]
|
||
|
|
- pathlen = len(path)
|
||
|
|
- try:
|
||
|
|
- index = path.index(rbrace)
|
||
|
|
- except ValueError:
|
||
|
|
- res += dollar + brace + path
|
||
|
|
- index = pathlen - 1
|
||
|
|
- else:
|
||
|
|
- var = path[:index]
|
||
|
|
- try:
|
||
|
|
- if environ is None:
|
||
|
|
- value = os.fsencode(os.environ[os.fsdecode(var)])
|
||
|
|
- else:
|
||
|
|
- value = environ[var]
|
||
|
|
- except KeyError:
|
||
|
|
- value = dollar + brace + var + rbrace
|
||
|
|
- res += value
|
||
|
|
- else:
|
||
|
|
- var = path[:0]
|
||
|
|
- index += 1
|
||
|
|
- c = path[index:index + 1]
|
||
|
|
- while c and c in varchars:
|
||
|
|
- var += c
|
||
|
|
- index += 1
|
||
|
|
- c = path[index:index + 1]
|
||
|
|
- try:
|
||
|
|
- if environ is None:
|
||
|
|
- value = os.fsencode(os.environ[os.fsdecode(var)])
|
||
|
|
- else:
|
||
|
|
- value = environ[var]
|
||
|
|
- except KeyError:
|
||
|
|
- value = dollar + var
|
||
|
|
- res += value
|
||
|
|
- if c:
|
||
|
|
- index -= 1
|
||
|
|
+
|
||
|
|
+ def repl(m):
|
||
|
|
+ lastindex = m.lastindex
|
||
|
|
+ if lastindex is None:
|
||
|
|
+ return m[0]
|
||
|
|
+ name = m[lastindex]
|
||
|
|
+ if lastindex == 1:
|
||
|
|
+ if name == percent:
|
||
|
|
+ return name
|
||
|
|
+ if not name.endswith(percent):
|
||
|
|
+ return m[0]
|
||
|
|
+ name = name[:-1]
|
||
|
|
else:
|
||
|
|
- res += c
|
||
|
|
- index += 1
|
||
|
|
- return res
|
||
|
|
+ if name == dollar:
|
||
|
|
+ return name
|
||
|
|
+ if name.startswith(brace):
|
||
|
|
+ if not name.endswith(rbrace):
|
||
|
|
+ return m[0]
|
||
|
|
+ name = name[1:-1]
|
||
|
|
+
|
||
|
|
+ try:
|
||
|
|
+ if environ is None:
|
||
|
|
+ return os.fsencode(os.environ[os.fsdecode(name)])
|
||
|
|
+ else:
|
||
|
|
+ return environ[name]
|
||
|
|
+ except KeyError:
|
||
|
|
+ return m[0]
|
||
|
|
+
|
||
|
|
+ return sub(repl, path)
|
||
|
|
|
||
|
|
|
||
|
|
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A\B.
|
||
|
|
diff --git a/Lib/posixpath.py b/Lib/posixpath.py
|
||
|
|
index 90a6f545f90529..6306f14f53491b 100644
|
||
|
|
--- a/Lib/posixpath.py
|
||
|
|
+++ b/Lib/posixpath.py
|
||
|
|
@@ -314,42 +314,41 @@ def expanduser(path):
|
||
|
|
# This expands the forms $variable and ${variable} only.
|
||
|
|
# Non-existent variables are left unchanged.
|
||
|
|
|
||
|
|
-_varprog = None
|
||
|
|
-_varprogb = None
|
||
|
|
+_varpattern = r'\$(\w+|\{[^}]*\}?)'
|
||
|
|
+_varsub = None
|
||
|
|
+_varsubb = None
|
||
|
|
|
||
|
|
def expandvars(path):
|
||
|
|
"""Expand shell variables of form $var and ${var}. Unknown variables
|
||
|
|
are left unchanged."""
|
||
|
|
path = os.fspath(path)
|
||
|
|
- global _varprog, _varprogb
|
||
|
|
+ global _varsub, _varsubb
|
||
|
|
if isinstance(path, bytes):
|
||
|
|
if b'$' not in path:
|
||
|
|
return path
|
||
|
|
- if not _varprogb:
|
||
|
|
+ if not _varsubb:
|
||
|
|
import re
|
||
|
|
- _varprogb = re.compile(br'\$(\w+|\{[^}]*\})', re.ASCII)
|
||
|
|
- search = _varprogb.search
|
||
|
|
+ _varsubb = re.compile(_varpattern.encode(), re.ASCII).sub
|
||
|
|
+ sub = _varsubb
|
||
|
|
start = b'{'
|
||
|
|
end = b'}'
|
||
|
|
environ = getattr(os, 'environb', None)
|
||
|
|
else:
|
||
|
|
if '$' not in path:
|
||
|
|
return path
|
||
|
|
- if not _varprog:
|
||
|
|
+ if not _varsub:
|
||
|
|
import re
|
||
|
|
- _varprog = re.compile(r'\$(\w+|\{[^}]*\})', re.ASCII)
|
||
|
|
- search = _varprog.search
|
||
|
|
+ _varsub = re.compile(_varpattern, re.ASCII).sub
|
||
|
|
+ sub = _varsub
|
||
|
|
start = '{'
|
||
|
|
end = '}'
|
||
|
|
environ = os.environ
|
||
|
|
- i = 0
|
||
|
|
- while True:
|
||
|
|
- m = search(path, i)
|
||
|
|
- if not m:
|
||
|
|
- break
|
||
|
|
- i, j = m.span(0)
|
||
|
|
- name = m.group(1)
|
||
|
|
- if name.startswith(start) and name.endswith(end):
|
||
|
|
+
|
||
|
|
+ def repl(m):
|
||
|
|
+ name = m[1]
|
||
|
|
+ if name.startswith(start):
|
||
|
|
+ if not name.endswith(end):
|
||
|
|
+ return m[0]
|
||
|
|
name = name[1:-1]
|
||
|
|
try:
|
||
|
|
if environ is None:
|
||
|
|
@@ -357,13 +356,11 @@ def expandvars(path):
|
||
|
|
else:
|
||
|
|
value = environ[name]
|
||
|
|
except KeyError:
|
||
|
|
- i = j
|
||
|
|
+ return m[0]
|
||
|
|
else:
|
||
|
|
- tail = path[j:]
|
||
|
|
- path = path[:i] + value
|
||
|
|
- i = len(path)
|
||
|
|
- path += tail
|
||
|
|
- return path
|
||
|
|
+ return value
|
||
|
|
+
|
||
|
|
+ return sub(repl, path)
|
||
|
|
|
||
|
|
|
||
|
|
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A/B.
|
||
|
|
diff --git a/Lib/test/test_genericpath.py b/Lib/test/test_genericpath.py
|
||
|
|
index 3eefb722b81e55..1cec587e875888 100644
|
||
|
|
--- a/Lib/test/test_genericpath.py
|
||
|
|
+++ b/Lib/test/test_genericpath.py
|
||
|
|
@@ -7,6 +7,7 @@
|
||
|
|
import sys
|
||
|
|
import unittest
|
||
|
|
import warnings
|
||
|
|
+from test import support
|
||
|
|
from test.support import is_emscripten
|
||
|
|
from test.support import os_helper
|
||
|
|
from test.support import warnings_helper
|
||
|
|
@@ -443,6 +444,19 @@ def check(value, expected):
|
||
|
|
os.fsencode('$bar%s bar' % nonascii))
|
||
|
|
check(b'$spam}bar', os.fsencode('%s}bar' % nonascii))
|
||
|
|
|
||
|
|
+ @support.requires_resource('cpu')
|
||
|
|
+ def test_expandvars_large(self):
|
||
|
|
+ expandvars = self.pathmodule.expandvars
|
||
|
|
+ with os_helper.EnvironmentVarGuard() as env:
|
||
|
|
+ env.clear()
|
||
|
|
+ env["A"] = "B"
|
||
|
|
+ n = 100_000
|
||
|
|
+ self.assertEqual(expandvars('$A'*n), 'B'*n)
|
||
|
|
+ self.assertEqual(expandvars('${A}'*n), 'B'*n)
|
||
|
|
+ self.assertEqual(expandvars('$A!'*n), 'B!'*n)
|
||
|
|
+ self.assertEqual(expandvars('${A}A'*n), 'BA'*n)
|
||
|
|
+ self.assertEqual(expandvars('${'*10*n), '${'*10*n)
|
||
|
|
+
|
||
|
|
def test_abspath(self):
|
||
|
|
self.assertIn("foo", self.pathmodule.abspath("foo"))
|
||
|
|
with warnings.catch_warnings():
|
||
|
|
diff --git a/Lib/test/test_ntpath.py b/Lib/test/test_ntpath.py
|
||
|
|
index ced9dc4fffb41e..72f89ebb21c478 100644
|
||
|
|
--- a/Lib/test/test_ntpath.py
|
||
|
|
+++ b/Lib/test/test_ntpath.py
|
||
|
|
@@ -7,8 +7,7 @@
|
||
|
|
import unittest
|
||
|
|
import warnings
|
||
|
|
from ntpath import ALLOW_MISSING
|
||
|
|
-from test.support import cpython_only, os_helper
|
||
|
|
-from test.support import TestFailed, is_emscripten
|
||
|
|
+from test.support import os_helper, is_emscripten
|
||
|
|
from test.support.os_helper import FakePath
|
||
|
|
from test import test_genericpath
|
||
|
|
from tempfile import TemporaryFile
|
||
|
|
@@ -58,7 +57,7 @@ def tester(fn, wantResult):
|
||
|
|
fn = fn.replace("\\", "\\\\")
|
||
|
|
gotResult = eval(fn)
|
||
|
|
if wantResult != gotResult and _norm(wantResult) != _norm(gotResult):
|
||
|
|
- raise TestFailed("%s should return: %s but returned: %s" \
|
||
|
|
+ raise support.TestFailed("%s should return: %s but returned: %s" \
|
||
|
|
%(str(fn), str(wantResult), str(gotResult)))
|
||
|
|
|
||
|
|
# then with bytes
|
||
|
|
@@ -74,7 +73,7 @@ def tester(fn, wantResult):
|
||
|
|
warnings.simplefilter("ignore", DeprecationWarning)
|
||
|
|
gotResult = eval(fn)
|
||
|
|
if _norm(wantResult) != _norm(gotResult):
|
||
|
|
- raise TestFailed("%s should return: %s but returned: %s" \
|
||
|
|
+ raise support.TestFailed("%s should return: %s but returned: %s" \
|
||
|
|
%(str(fn), str(wantResult), repr(gotResult)))
|
||
|
|
|
||
|
|
|
||
|
|
@@ -882,6 +881,19 @@ def check(value, expected):
|
||
|
|
check('%spam%bar', '%sbar' % nonascii)
|
||
|
|
check('%{}%bar'.format(nonascii), 'ham%sbar' % nonascii)
|
||
|
|
|
||
|
|
+ @support.requires_resource('cpu')
|
||
|
|
+ def test_expandvars_large(self):
|
||
|
|
+ expandvars = ntpath.expandvars
|
||
|
|
+ with os_helper.EnvironmentVarGuard() as env:
|
||
|
|
+ env.clear()
|
||
|
|
+ env["A"] = "B"
|
||
|
|
+ n = 100_000
|
||
|
|
+ self.assertEqual(expandvars('%A%'*n), 'B'*n)
|
||
|
|
+ self.assertEqual(expandvars('%A%A'*n), 'BA'*n)
|
||
|
|
+ self.assertEqual(expandvars("''"*n + '%%'), "''"*n + '%')
|
||
|
|
+ self.assertEqual(expandvars("%%"*n), "%"*n)
|
||
|
|
+ self.assertEqual(expandvars("$$"*n), "$"*n)
|
||
|
|
+
|
||
|
|
def test_expanduser(self):
|
||
|
|
tester('ntpath.expanduser("test")', 'test')
|
||
|
|
|
||
|
|
@@ -1207,7 +1219,7 @@ def test_con_device(self):
|
||
|
|
self.assertTrue(os.path.exists(r"\\.\CON"))
|
||
|
|
|
||
|
|
@unittest.skipIf(sys.platform != 'win32', "Fast paths are only for win32")
|
||
|
|
- @cpython_only
|
||
|
|
+ @support.cpython_only
|
||
|
|
def test_fast_paths_in_use(self):
|
||
|
|
# There are fast paths of these functions implemented in posixmodule.c.
|
||
|
|
# Confirm that they are being used, and not the Python fallbacks in
|
||
|
|
diff --git a/Misc/NEWS.d/next/Security/2025-05-30-22-33-27.gh-issue-136065.bu337o.rst b/Misc/NEWS.d/next/Security/2025-05-30-22-33-27.gh-issue-136065.bu337o.rst
|
||
|
|
new file mode 100644
|
||
|
|
index 00000000000000..1d152bb5318380
|
||
|
|
--- /dev/null
|
||
|
|
+++ b/Misc/NEWS.d/next/Security/2025-05-30-22-33-27.gh-issue-136065.bu337o.rst
|
||
|
|
@@ -0,0 +1 @@
|
||
|
|
+Fix quadratic complexity in :func:`os.path.expandvars`.
|
||
|
|
|
||
|
|
From 27eb90f676ced2a2a6f2a3ea9d0555d045a0d976 Mon Sep 17 00:00:00 2001
|
||
|
|
From: =?UTF-8?q?=C5=81ukasz=20Langa?= <lukasz@langa.pl>
|
||
|
|
Date: Fri, 31 Oct 2025 17:32:52 +0100
|
||
|
|
Subject: [PATCH 2/2] Add missing "from test import support" import to test_ntpath.py
|
||
|
|
|
||
|
|
---
|
||
|
|
Lib/test/test_ntpath.py | 1 +
|
||
|
|
1 file changed, 1 insertion(+)
|
||
|
|
|
||
|
|
diff --git a/Lib/test/test_ntpath.py b/Lib/test/test_ntpath.py
|
||
|
|
index 72f89ebb21c478..7c42d4f5894788 100644
|
||
|
|
--- a/Lib/test/test_ntpath.py
|
||
|
|
+++ b/Lib/test/test_ntpath.py
|
||
|
|
@@ -7,6 +7,7 @@
|
||
|
|
import unittest
|
||
|
|
import warnings
|
||
|
|
from ntpath import ALLOW_MISSING
|
||
|
|
+from test import support
|
||
|
|
from test.support import os_helper, is_emscripten
|
||
|
|
from test.support.os_helper import FakePath
|
||
|
|
from test import test_genericpath
|