Issue #17998: Fix an internal error in regular expression engine.

This commit is contained in:
Serhiy Storchaka 2013-08-03 19:18:38 +03:00
parent 1dfb9180a7
commit 1f35ae0a3c
4 changed files with 19 additions and 7 deletions

View File

@ -1040,6 +1040,16 @@ class ReTests(unittest.TestCase):
with self.assertRaisesRegex(sre_constants.error, '\?foo'): with self.assertRaisesRegex(sre_constants.error, '\?foo'):
re.compile('(?P<?foo>)') re.compile('(?P<?foo>)')
def test_issue17998(self):
    """Regression test for issue #17998.

    Builds the patterns '.<reps><mod>yz' for every repeat in
    '*', '+', '?', '{1}' combined with every modifier in '', '?',
    compiles each with re.S, and checks that findall() on 'xyz'
    returns the whole input as its single match.  Every pattern is
    exercised twice: as str against 'xyz', then encoded to bytes
    against b'xyz'.
    """
    repeats = ('*', '+', '?', '{1}')
    modifiers = ('', '?')
    for repeat in repeats:
        for modifier in modifiers:
            # str pattern against a str subject
            text_pattern = '.' + repeat + modifier + 'yz'
            found = re.compile(text_pattern, re.S).findall('xyz')
            self.assertEqual(found, ['xyz'], msg=text_pattern)

            # the same pattern as bytes against a bytes subject
            bytes_pattern = text_pattern.encode()
            found = re.compile(bytes_pattern, re.S).findall(b'xyz')
            self.assertEqual(found, [b'xyz'], msg=bytes_pattern)
def run_re_tests(): def run_re_tests():
from test.re_tests import tests, SUCCEED, FAIL, SYNTAX_ERROR from test.re_tests import tests, SUCCEED, FAIL, SYNTAX_ERROR

View File

@ -59,6 +59,8 @@ Core and Builtins
Library Library
------- -------
- Issue #17998: Fix an internal error in regular expression engine.
- Issue #17557: Fix os.getgroups() to work with the modified behavior of - Issue #17557: Fix os.getgroups() to work with the modified behavior of
getgroups(2) on OS X 10.8. Original patch by Mateusz Lenik. getgroups(2) on OS X 10.8. Original patch by Mateusz Lenik.

View File

@ -997,7 +997,7 @@ entrance:
TRACE(("|%p|%p|REPEAT_ONE %d %d\n", ctx->pattern, ctx->ptr, TRACE(("|%p|%p|REPEAT_ONE %d %d\n", ctx->pattern, ctx->ptr,
ctx->pattern[1], ctx->pattern[2])); ctx->pattern[1], ctx->pattern[2]));
if (ctx->pattern[1] > (end - ctx->ptr) / state->charsize) if ((Py_ssize_t) ctx->pattern[1] > (end - ctx->ptr) / state->charsize)
RETURN_FAILURE; /* cannot match */ RETURN_FAILURE; /* cannot match */
state->ptr = ctx->ptr; state->ptr = ctx->ptr;
@ -1081,7 +1081,7 @@ entrance:
TRACE(("|%p|%p|MIN_REPEAT_ONE %d %d\n", ctx->pattern, ctx->ptr, TRACE(("|%p|%p|MIN_REPEAT_ONE %d %d\n", ctx->pattern, ctx->ptr,
ctx->pattern[1], ctx->pattern[2])); ctx->pattern[1], ctx->pattern[2]));
if (ctx->pattern[1] > (end - ctx->ptr) / state->charsize) if ((Py_ssize_t) ctx->pattern[1] > (end - ctx->ptr) / state->charsize)
RETURN_FAILURE; /* cannot match */ RETURN_FAILURE; /* cannot match */
state->ptr = ctx->ptr; state->ptr = ctx->ptr;
@ -1180,7 +1180,7 @@ entrance:
TRACE(("|%p|%p|MAX_UNTIL %d\n", ctx->pattern, TRACE(("|%p|%p|MAX_UNTIL %d\n", ctx->pattern,
ctx->ptr, ctx->count)); ctx->ptr, ctx->count));
if (ctx->count < ctx->u.rep->pattern[1]) { if (ctx->count < (Py_ssize_t) ctx->u.rep->pattern[1]) {
/* not enough matches */ /* not enough matches */
ctx->u.rep->count = ctx->count; ctx->u.rep->count = ctx->count;
DO_JUMP(JUMP_MAX_UNTIL_1, jump_max_until_1, DO_JUMP(JUMP_MAX_UNTIL_1, jump_max_until_1,
@ -1194,7 +1194,7 @@ entrance:
RETURN_FAILURE; RETURN_FAILURE;
} }
if ((ctx->count < ctx->u.rep->pattern[2] || if ((ctx->count < (Py_ssize_t) ctx->u.rep->pattern[2] ||
ctx->u.rep->pattern[2] == SRE_MAXREPEAT) && ctx->u.rep->pattern[2] == SRE_MAXREPEAT) &&
state->ptr != ctx->u.rep->last_ptr) { state->ptr != ctx->u.rep->last_ptr) {
/* we may have enough matches, but if we can /* we may have enough matches, but if we can
@ -1243,7 +1243,7 @@ entrance:
TRACE(("|%p|%p|MIN_UNTIL %d %p\n", ctx->pattern, TRACE(("|%p|%p|MIN_UNTIL %d %p\n", ctx->pattern,
ctx->ptr, ctx->count, ctx->u.rep->pattern)); ctx->ptr, ctx->count, ctx->u.rep->pattern));
if (ctx->count < ctx->u.rep->pattern[1]) { if (ctx->count < (Py_ssize_t) ctx->u.rep->pattern[1]) {
/* not enough matches */ /* not enough matches */
ctx->u.rep->count = ctx->count; ctx->u.rep->count = ctx->count;
DO_JUMP(JUMP_MIN_UNTIL_1, jump_min_until_1, DO_JUMP(JUMP_MIN_UNTIL_1, jump_min_until_1,
@ -1272,7 +1272,7 @@ entrance:
LASTMARK_RESTORE(); LASTMARK_RESTORE();
if ((ctx->count >= ctx->u.rep->pattern[2] if ((ctx->count >= (Py_ssize_t) ctx->u.rep->pattern[2]
&& ctx->u.rep->pattern[2] != SRE_MAXREPEAT) || && ctx->u.rep->pattern[2] != SRE_MAXREPEAT) ||
state->ptr == ctx->u.rep->last_ptr) state->ptr == ctx->u.rep->last_ptr)
RETURN_FAILURE; RETURN_FAILURE;

View File

@ -19,7 +19,7 @@
#if SIZEOF_SIZE_T > 4 #if SIZEOF_SIZE_T > 4
# define SRE_MAXREPEAT (~(SRE_CODE)0) # define SRE_MAXREPEAT (~(SRE_CODE)0)
#else #else
# define SRE_MAXREPEAT ((SRE_CODE)PY_SSIZE_T_MAX + 1u) # define SRE_MAXREPEAT ((SRE_CODE)PY_SSIZE_T_MAX)
#endif #endif
typedef struct { typedef struct {