mirror of https://github.com/python/cpython
439 lines
17 KiB
Python
439 lines
17 KiB
Python
import re
|
|
import sys
|
|
from test import support
|
|
|
|
from .util import (
|
|
BREAKPOINT_FN, GDB_VERSION,
|
|
run_gdb, setup_module, DebuggerTests)
|
|
|
|
|
|
def setUpModule():
|
|
setup_module()
|
|
|
|
|
|
class PrettyPrintTests(DebuggerTests):
|
|
def get_gdb_repr(self, source,
|
|
cmds_after_breakpoint=None,
|
|
import_site=False):
|
|
# Given an input python source representation of data,
|
|
# run "python -c'id(DATA)'" under gdb with a breakpoint on
|
|
# builtin_id and scrape out gdb's representation of the "op"
|
|
# parameter, and verify that the gdb displays the same string
|
|
#
|
|
# Verify that the gdb displays the expected string
|
|
#
|
|
# For a nested structure, the first time we hit the breakpoint will
|
|
# give us the top-level structure
|
|
|
|
# NOTE: avoid decoding too much of the traceback as some
|
|
# undecodable characters may lurk there in optimized mode
|
|
# (issue #19743).
|
|
cmds_after_breakpoint = cmds_after_breakpoint or ["backtrace 1"]
|
|
gdb_output = self.get_stack_trace(source, breakpoint=BREAKPOINT_FN,
|
|
cmds_after_breakpoint=cmds_after_breakpoint,
|
|
import_site=import_site)
|
|
# gdb can insert additional '\n' and space characters in various places
|
|
# in its output, depending on the width of the terminal it's connected
|
|
# to (using its "wrap_here" function)
|
|
m = re.search(
|
|
# Match '#0 builtin_id(self=..., v=...)'
|
|
r'#0\s+builtin_id\s+\(self\=.*,\s+v=\s*(.*?)?\)'
|
|
# Match ' at Python/bltinmodule.c'.
|
|
# bpo-38239: builtin_id() is defined in Python/bltinmodule.c,
|
|
# but accept any "Directory\file.c" to support Link Time
|
|
# Optimization (LTO).
|
|
r'\s+at\s+\S*[A-Za-z]+/[A-Za-z0-9_-]+\.c',
|
|
gdb_output, re.DOTALL)
|
|
if not m:
|
|
self.fail('Unexpected gdb output: %r\n%s' % (gdb_output, gdb_output))
|
|
return m.group(1), gdb_output
|
|
|
|
def test_getting_backtrace(self):
|
|
gdb_output = self.get_stack_trace('id(42)')
|
|
self.assertTrue(BREAKPOINT_FN in gdb_output)
|
|
|
|
def assertGdbRepr(self, val, exp_repr=None):
|
|
# Ensure that gdb's rendering of the value in a debugged process
|
|
# matches repr(value) in this process:
|
|
gdb_repr, gdb_output = self.get_gdb_repr('id(' + ascii(val) + ')')
|
|
if not exp_repr:
|
|
exp_repr = repr(val)
|
|
self.assertEqual(gdb_repr, exp_repr,
|
|
('%r did not equal expected %r; full output was:\n%s'
|
|
% (gdb_repr, exp_repr, gdb_output)))
|
|
|
|
@support.requires_resource('cpu')
|
|
def test_int(self):
|
|
'Verify the pretty-printing of various int values'
|
|
self.assertGdbRepr(42)
|
|
self.assertGdbRepr(0)
|
|
self.assertGdbRepr(-7)
|
|
self.assertGdbRepr(1000000000000)
|
|
self.assertGdbRepr(-1000000000000000)
|
|
|
|
def test_singletons(self):
|
|
'Verify the pretty-printing of True, False and None'
|
|
self.assertGdbRepr(True)
|
|
self.assertGdbRepr(False)
|
|
self.assertGdbRepr(None)
|
|
|
|
def test_dicts(self):
|
|
'Verify the pretty-printing of dictionaries'
|
|
self.assertGdbRepr({})
|
|
self.assertGdbRepr({'foo': 'bar'}, "{'foo': 'bar'}")
|
|
# Python preserves insertion order since 3.6
|
|
self.assertGdbRepr({'foo': 'bar', 'douglas': 42}, "{'foo': 'bar', 'douglas': 42}")
|
|
|
|
def test_lists(self):
|
|
'Verify the pretty-printing of lists'
|
|
self.assertGdbRepr([])
|
|
self.assertGdbRepr(list(range(5)))
|
|
|
|
@support.requires_resource('cpu')
|
|
def test_bytes(self):
|
|
'Verify the pretty-printing of bytes'
|
|
self.assertGdbRepr(b'')
|
|
self.assertGdbRepr(b'And now for something hopefully the same')
|
|
self.assertGdbRepr(b'string with embedded NUL here \0 and then some more text')
|
|
self.assertGdbRepr(b'this is a tab:\t'
|
|
b' this is a slash-N:\n'
|
|
b' this is a slash-R:\r'
|
|
)
|
|
|
|
self.assertGdbRepr(b'this is byte 255:\xff and byte 128:\x80')
|
|
|
|
self.assertGdbRepr(bytes([b for b in range(255)]))
|
|
|
|
@support.requires_resource('cpu')
|
|
def test_strings(self):
|
|
'Verify the pretty-printing of unicode strings'
|
|
# We cannot simply call locale.getpreferredencoding() here,
|
|
# as GDB might have been linked against a different version
|
|
# of Python with a different encoding and coercion policy
|
|
# with respect to PEP 538 and PEP 540.
|
|
stdout, stderr = run_gdb(
|
|
'--eval-command',
|
|
'python import locale; print(locale.getpreferredencoding())')
|
|
|
|
encoding = stdout
|
|
if stderr or not encoding:
|
|
raise RuntimeError(
|
|
f'unable to determine the Python locale preferred encoding '
|
|
f'of embedded Python in GDB\n'
|
|
f'stdout={stdout!r}\n'
|
|
f'stderr={stderr!r}')
|
|
|
|
def check_repr(text):
|
|
try:
|
|
text.encode(encoding)
|
|
except UnicodeEncodeError:
|
|
self.assertGdbRepr(text, ascii(text))
|
|
else:
|
|
self.assertGdbRepr(text)
|
|
|
|
self.assertGdbRepr('')
|
|
self.assertGdbRepr('And now for something hopefully the same')
|
|
self.assertGdbRepr('string with embedded NUL here \0 and then some more text')
|
|
|
|
# Test printing a single character:
|
|
# U+2620 SKULL AND CROSSBONES
|
|
check_repr('\u2620')
|
|
|
|
# Test printing a Japanese unicode string
|
|
# (I believe this reads "mojibake", using 3 characters from the CJK
|
|
# Unified Ideographs area, followed by U+3051 HIRAGANA LETTER KE)
|
|
check_repr('\u6587\u5b57\u5316\u3051')
|
|
|
|
# Test a character outside the BMP:
|
|
# U+1D121 MUSICAL SYMBOL C CLEF
|
|
# This is:
|
|
# UTF-8: 0xF0 0x9D 0x84 0xA1
|
|
# UTF-16: 0xD834 0xDD21
|
|
check_repr(chr(0x1D121))
|
|
|
|
def test_tuples(self):
|
|
'Verify the pretty-printing of tuples'
|
|
self.assertGdbRepr(tuple(), '()')
|
|
self.assertGdbRepr((1,), '(1,)')
|
|
self.assertGdbRepr(('foo', 'bar', 'baz'))
|
|
|
|
@support.requires_resource('cpu')
|
|
def test_sets(self):
|
|
'Verify the pretty-printing of sets'
|
|
if GDB_VERSION < (7, 3):
|
|
self.skipTest("pretty-printing of sets needs gdb 7.3 or later")
|
|
self.assertGdbRepr(set(), "set()")
|
|
self.assertGdbRepr(set(['a']), "{'a'}")
|
|
# PYTHONHASHSEED is need to get the exact frozenset item order
|
|
if not sys.flags.ignore_environment:
|
|
self.assertGdbRepr(set(['a', 'b']), "{'a', 'b'}")
|
|
self.assertGdbRepr(set([4, 5, 6]), "{4, 5, 6}")
|
|
|
|
# Ensure that we handle sets containing the "dummy" key value,
|
|
# which happens on deletion:
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''s = set(['a','b'])
|
|
s.remove('a')
|
|
id(s)''')
|
|
self.assertEqual(gdb_repr, "{'b'}")
|
|
|
|
@support.requires_resource('cpu')
|
|
def test_frozensets(self):
|
|
'Verify the pretty-printing of frozensets'
|
|
if GDB_VERSION < (7, 3):
|
|
self.skipTest("pretty-printing of frozensets needs gdb 7.3 or later")
|
|
self.assertGdbRepr(frozenset(), "frozenset()")
|
|
self.assertGdbRepr(frozenset(['a']), "frozenset({'a'})")
|
|
# PYTHONHASHSEED is need to get the exact frozenset item order
|
|
if not sys.flags.ignore_environment:
|
|
self.assertGdbRepr(frozenset(['a', 'b']), "frozenset({'a', 'b'})")
|
|
self.assertGdbRepr(frozenset([4, 5, 6]), "frozenset({4, 5, 6})")
|
|
|
|
def test_exceptions(self):
|
|
# Test a RuntimeError
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''
|
|
try:
|
|
raise RuntimeError("I am an error")
|
|
except RuntimeError as e:
|
|
id(e)
|
|
''')
|
|
self.assertEqual(gdb_repr,
|
|
"RuntimeError('I am an error',)")
|
|
|
|
|
|
# Test division by zero:
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''
|
|
try:
|
|
a = 1 / 0
|
|
except ZeroDivisionError as e:
|
|
id(e)
|
|
''')
|
|
self.assertEqual(gdb_repr,
|
|
"ZeroDivisionError('division by zero',)")
|
|
|
|
def test_modern_class(self):
|
|
'Verify the pretty-printing of new-style class instances'
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''
|
|
class Foo:
|
|
pass
|
|
foo = Foo()
|
|
foo.an_int = 42
|
|
id(foo)''')
|
|
m = re.match(r'<Foo\(an_int=42\) at remote 0x-?[0-9a-f]+>', gdb_repr)
|
|
self.assertTrue(m,
|
|
msg='Unexpected new-style class rendering %r' % gdb_repr)
|
|
|
|
def test_subclassing_list(self):
|
|
'Verify the pretty-printing of an instance of a list subclass'
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''
|
|
class Foo(list):
|
|
pass
|
|
foo = Foo()
|
|
foo += [1, 2, 3]
|
|
foo.an_int = 42
|
|
id(foo)''')
|
|
m = re.match(r'<Foo\(an_int=42\) at remote 0x-?[0-9a-f]+>', gdb_repr)
|
|
|
|
self.assertTrue(m,
|
|
msg='Unexpected new-style class rendering %r' % gdb_repr)
|
|
|
|
def test_subclassing_tuple(self):
|
|
'Verify the pretty-printing of an instance of a tuple subclass'
|
|
# This should exercise the negative tp_dictoffset code in the
|
|
# new-style class support
|
|
gdb_repr, gdb_output = self.get_gdb_repr('''
|
|
class Foo(tuple):
|
|
pass
|
|
foo = Foo((1, 2, 3))
|
|
foo.an_int = 42
|
|
id(foo)''')
|
|
m = re.match(r'<Foo\(an_int=42\) at remote 0x-?[0-9a-f]+>', gdb_repr)
|
|
|
|
self.assertTrue(m,
|
|
msg='Unexpected new-style class rendering %r' % gdb_repr)
|
|
|
|
def assertSane(self, source, corruption, exprepr=None):
|
|
'''Run Python under gdb, corrupting variables in the inferior process
|
|
immediately before taking a backtrace.
|
|
|
|
Verify that the variable's representation is the expected failsafe
|
|
representation'''
|
|
if corruption:
|
|
cmds_after_breakpoint=[corruption, 'backtrace']
|
|
else:
|
|
cmds_after_breakpoint=['backtrace']
|
|
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr(source,
|
|
cmds_after_breakpoint=cmds_after_breakpoint)
|
|
if exprepr:
|
|
if gdb_repr == exprepr:
|
|
# gdb managed to print the value in spite of the corruption;
|
|
# this is good (see http://bugs.python.org/issue8330)
|
|
return
|
|
|
|
# Match anything for the type name; 0xDEADBEEF could point to
|
|
# something arbitrary (see http://bugs.python.org/issue8330)
|
|
pattern = '<.* at remote 0x-?[0-9a-f]+>'
|
|
|
|
m = re.match(pattern, gdb_repr)
|
|
if not m:
|
|
self.fail('Unexpected gdb representation: %r\n%s' % \
|
|
(gdb_repr, gdb_output))
|
|
|
|
def test_NULL_ptr(self):
|
|
'Ensure that a NULL PyObject* is handled gracefully'
|
|
gdb_repr, gdb_output = (
|
|
self.get_gdb_repr('id(42)',
|
|
cmds_after_breakpoint=['set variable v=0',
|
|
'backtrace'])
|
|
)
|
|
|
|
self.assertEqual(gdb_repr, '0x0')
|
|
|
|
def test_NULL_ob_type(self):
|
|
'Ensure that a PyObject* with NULL ob_type is handled gracefully'
|
|
self.assertSane('id(42)',
|
|
'set v->ob_type=0')
|
|
|
|
def test_corrupt_ob_type(self):
|
|
'Ensure that a PyObject* with a corrupt ob_type is handled gracefully'
|
|
self.assertSane('id(42)',
|
|
'set v->ob_type=0xDEADBEEF',
|
|
exprepr='42')
|
|
|
|
def test_corrupt_tp_flags(self):
|
|
'Ensure that a PyObject* with a type with corrupt tp_flags is handled'
|
|
self.assertSane('id(42)',
|
|
'set v->ob_type->tp_flags=0x0',
|
|
exprepr='42')
|
|
|
|
def test_corrupt_tp_name(self):
|
|
'Ensure that a PyObject* with a type with corrupt tp_name is handled'
|
|
self.assertSane('id(42)',
|
|
'set v->ob_type->tp_name=0xDEADBEEF',
|
|
exprepr='42')
|
|
|
|
def test_builtins_help(self):
|
|
'Ensure that the new-style class _Helper in site.py can be handled'
|
|
|
|
if sys.flags.no_site:
|
|
self.skipTest("need site module, but -S option was used")
|
|
|
|
# (this was the issue causing tracebacks in
|
|
# http://bugs.python.org/issue8032#msg100537 )
|
|
gdb_repr, gdb_output = self.get_gdb_repr('id(__builtins__.help)', import_site=True)
|
|
|
|
m = re.match(r'<_Helper\(\) at remote 0x-?[0-9a-f]+>', gdb_repr)
|
|
self.assertTrue(m,
|
|
msg='Unexpected rendering %r' % gdb_repr)
|
|
|
|
def test_selfreferential_list(self):
|
|
'''Ensure that a reference loop involving a list doesn't lead proxyval
|
|
into an infinite loop:'''
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr("a = [3, 4, 5] ; a.append(a) ; id(a)")
|
|
self.assertEqual(gdb_repr, '[3, 4, 5, [...]]')
|
|
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr("a = [3, 4, 5] ; b = [a] ; a.append(b) ; id(a)")
|
|
self.assertEqual(gdb_repr, '[3, 4, 5, [[...]]]')
|
|
|
|
def test_selfreferential_dict(self):
|
|
'''Ensure that a reference loop involving a dict doesn't lead proxyval
|
|
into an infinite loop:'''
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr("a = {} ; b = {'bar':a} ; a['foo'] = b ; id(a)")
|
|
|
|
self.assertEqual(gdb_repr, "{'foo': {'bar': {...}}}")
|
|
|
|
def test_selfreferential_old_style_instance(self):
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr('''
|
|
class Foo:
|
|
pass
|
|
foo = Foo()
|
|
foo.an_attr = foo
|
|
id(foo)''')
|
|
self.assertTrue(re.match(r'<Foo\(an_attr=<\.\.\.>\) at remote 0x-?[0-9a-f]+>',
|
|
gdb_repr),
|
|
'Unexpected gdb representation: %r\n%s' % \
|
|
(gdb_repr, gdb_output))
|
|
|
|
def test_selfreferential_new_style_instance(self):
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr('''
|
|
class Foo(object):
|
|
pass
|
|
foo = Foo()
|
|
foo.an_attr = foo
|
|
id(foo)''')
|
|
self.assertTrue(re.match(r'<Foo\(an_attr=<\.\.\.>\) at remote 0x-?[0-9a-f]+>',
|
|
gdb_repr),
|
|
'Unexpected gdb representation: %r\n%s' % \
|
|
(gdb_repr, gdb_output))
|
|
|
|
gdb_repr, gdb_output = \
|
|
self.get_gdb_repr('''
|
|
class Foo(object):
|
|
pass
|
|
a = Foo()
|
|
b = Foo()
|
|
a.an_attr = b
|
|
b.an_attr = a
|
|
id(a)''')
|
|
self.assertTrue(re.match(r'<Foo\(an_attr=<Foo\(an_attr=<\.\.\.>\) at remote 0x-?[0-9a-f]+>\) at remote 0x-?[0-9a-f]+>',
|
|
gdb_repr),
|
|
'Unexpected gdb representation: %r\n%s' % \
|
|
(gdb_repr, gdb_output))
|
|
|
|
def test_truncation(self):
|
|
'Verify that very long output is truncated'
|
|
gdb_repr, gdb_output = self.get_gdb_repr('id(list(range(1000)))')
|
|
self.assertEqual(gdb_repr,
|
|
"[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, "
|
|
"14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, "
|
|
"27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, "
|
|
"40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, "
|
|
"53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, "
|
|
"66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, "
|
|
"79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, "
|
|
"92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, "
|
|
"104, 105, 106, 107, 108, 109, 110, 111, 112, 113, "
|
|
"114, 115, 116, 117, 118, 119, 120, 121, 122, 123, "
|
|
"124, 125, 126, 127, 128, 129, 130, 131, 132, 133, "
|
|
"134, 135, 136, 137, 138, 139, 140, 141, 142, 143, "
|
|
"144, 145, 146, 147, 148, 149, 150, 151, 152, 153, "
|
|
"154, 155, 156, 157, 158, 159, 160, 161, 162, 163, "
|
|
"164, 165, 166, 167, 168, 169, 170, 171, 172, 173, "
|
|
"174, 175, 176, 177, 178, 179, 180, 181, 182, 183, "
|
|
"184, 185, 186, 187, 188, 189, 190, 191, 192, 193, "
|
|
"194, 195, 196, 197, 198, 199, 200, 201, 202, 203, "
|
|
"204, 205, 206, 207, 208, 209, 210, 211, 212, 213, "
|
|
"214, 215, 216, 217, 218, 219, 220, 221, 222, 223, "
|
|
"224, 225, 226...(truncated)")
|
|
self.assertEqual(len(gdb_repr),
|
|
1024 + len('...(truncated)'))
|
|
|
|
def test_builtin_method(self):
|
|
gdb_repr, gdb_output = self.get_gdb_repr('import sys; id(sys.stdout.readlines)')
|
|
self.assertTrue(re.match(r'<built-in method readlines of _io.TextIOWrapper object at remote 0x-?[0-9a-f]+>',
|
|
gdb_repr),
|
|
'Unexpected gdb representation: %r\n%s' % \
|
|
(gdb_repr, gdb_output))
|
|
|
|
def test_frames(self):
|
|
gdb_output = self.get_stack_trace('''
|
|
import sys
|
|
def foo(a, b, c):
|
|
return sys._getframe(0)
|
|
|
|
f = foo(3, 4, 5)
|
|
id(f)''',
|
|
breakpoint='builtin_id',
|
|
cmds_after_breakpoint=['print (PyFrameObject*)v']
|
|
)
|
|
self.assertTrue(re.match(r'.*\s+\$1 =\s+Frame 0x-?[0-9a-f]+, for file <string>, line 4, in foo \(a=3.*',
|
|
gdb_output,
|
|
re.DOTALL),
|
|
'Unexpected gdb representation: %r\n%s' % (gdb_output, gdb_output))
|