mirror of https://github.com/python/cpython
539 lines
15 KiB
Python
539 lines
15 KiB
Python
import io
|
|
import logging
|
|
import os
|
|
import os.path
|
|
import re
|
|
import sys
|
|
|
|
from c_common import fsutil
|
|
from c_common.logging import VERBOSITY, Printer
|
|
from c_common.scriptutil import (
|
|
add_verbosity_cli,
|
|
add_traceback_cli,
|
|
add_sepval_cli,
|
|
add_progress_cli,
|
|
add_files_cli,
|
|
add_commands_cli,
|
|
process_args_by_key,
|
|
configure_logger,
|
|
get_prog,
|
|
filter_filenames,
|
|
)
|
|
from c_parser.info import KIND
|
|
from .match import filter_forward
|
|
from . import (
|
|
analyze as _analyze,
|
|
datafiles as _datafiles,
|
|
check_all as _check_all,
|
|
)
|
|
|
|
|
|
KINDS = [
|
|
KIND.TYPEDEF,
|
|
KIND.STRUCT,
|
|
KIND.UNION,
|
|
KIND.ENUM,
|
|
KIND.FUNCTION,
|
|
KIND.VARIABLE,
|
|
KIND.STATEMENT,
|
|
]
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
#######################################
|
|
# table helpers
|
|
|
|
TABLE_SECTIONS = {
|
|
'types': (
|
|
['kind', 'name', 'data', 'file'],
|
|
KIND.is_type_decl,
|
|
(lambda v: (v.kind.value, v.filename or '', v.name)),
|
|
),
|
|
'typedefs': 'types',
|
|
'structs': 'types',
|
|
'unions': 'types',
|
|
'enums': 'types',
|
|
'functions': (
|
|
['name', 'data', 'file'],
|
|
(lambda kind: kind is KIND.FUNCTION),
|
|
(lambda v: (v.filename or '', v.name)),
|
|
),
|
|
'variables': (
|
|
['name', 'parent', 'data', 'file'],
|
|
(lambda kind: kind is KIND.VARIABLE),
|
|
(lambda v: (v.filename or '', str(v.parent) if v.parent else '', v.name)),
|
|
),
|
|
'statements': (
|
|
['file', 'parent', 'data'],
|
|
(lambda kind: kind is KIND.STATEMENT),
|
|
(lambda v: (v.filename or '', str(v.parent) if v.parent else '', v.name)),
|
|
),
|
|
KIND.TYPEDEF: 'typedefs',
|
|
KIND.STRUCT: 'structs',
|
|
KIND.UNION: 'unions',
|
|
KIND.ENUM: 'enums',
|
|
KIND.FUNCTION: 'functions',
|
|
KIND.VARIABLE: 'variables',
|
|
KIND.STATEMENT: 'statements',
|
|
}
|
|
|
|
|
|
def _render_table(items, columns, relroot=None):
|
|
# XXX improve this
|
|
header = '\t'.join(columns)
|
|
div = '--------------------'
|
|
yield header
|
|
yield div
|
|
total = 0
|
|
for item in items:
|
|
rowdata = item.render_rowdata(columns)
|
|
row = [rowdata[c] for c in columns]
|
|
if relroot and 'file' in columns:
|
|
index = columns.index('file')
|
|
row[index] = os.path.relpath(row[index], relroot)
|
|
yield '\t'.join(row)
|
|
total += 1
|
|
yield div
|
|
yield f'total: {total}'
|
|
|
|
|
|
def build_section(name, groupitems, *, relroot=None):
|
|
info = TABLE_SECTIONS[name]
|
|
while type(info) is not tuple:
|
|
if name in KINDS:
|
|
name = info
|
|
info = TABLE_SECTIONS[info]
|
|
|
|
columns, match_kind, sortkey = info
|
|
items = (v for v in groupitems if match_kind(v.kind))
|
|
items = sorted(items, key=sortkey)
|
|
def render():
|
|
yield ''
|
|
yield f'{name}:'
|
|
yield ''
|
|
for line in _render_table(items, columns, relroot):
|
|
yield line
|
|
return items, render
|
|
|
|
|
|
#######################################
|
|
# the checks
|
|
|
|
CHECKS = {
|
|
#'globals': _check_globals,
|
|
}
|
|
|
|
|
|
def add_checks_cli(parser, checks=None, *, add_flags=None):
|
|
default = False
|
|
if not checks:
|
|
checks = list(CHECKS)
|
|
default = True
|
|
elif isinstance(checks, str):
|
|
checks = [checks]
|
|
if (add_flags is None and len(checks) > 1) or default:
|
|
add_flags = True
|
|
|
|
process_checks = add_sepval_cli(parser, '--check', 'checks', checks)
|
|
if add_flags:
|
|
for check in checks:
|
|
parser.add_argument(f'--{check}', dest='checks',
|
|
action='append_const', const=check)
|
|
return [
|
|
process_checks,
|
|
]
|
|
|
|
|
|
def _get_check_handlers(fmt, printer, verbosity=VERBOSITY):
|
|
div = None
|
|
def handle_after():
|
|
pass
|
|
if not fmt:
|
|
div = ''
|
|
def handle_failure(failure, data):
|
|
data = repr(data)
|
|
if verbosity >= 3:
|
|
logger.info(f'failure: {failure}')
|
|
logger.info(f'data: {data}')
|
|
else:
|
|
logger.warn(f'failure: {failure} (data: {data})')
|
|
elif fmt == 'raw':
|
|
def handle_failure(failure, data):
|
|
print(f'{failure!r} {data!r}')
|
|
elif fmt == 'brief':
|
|
def handle_failure(failure, data):
|
|
parent = data.parent or ''
|
|
funcname = parent if isinstance(parent, str) else parent.name
|
|
name = f'({funcname}).{data.name}' if funcname else data.name
|
|
failure = failure.split('\t')[0]
|
|
print(f'{data.filename}:{name} - {failure}')
|
|
elif fmt == 'summary':
|
|
def handle_failure(failure, data):
|
|
print(_fmt_one_summary(data, failure))
|
|
elif fmt == 'full':
|
|
div = ''
|
|
def handle_failure(failure, data):
|
|
name = data.shortkey if data.kind is KIND.VARIABLE else data.name
|
|
parent = data.parent or ''
|
|
funcname = parent if isinstance(parent, str) else parent.name
|
|
known = 'yes' if data.is_known else '*** NO ***'
|
|
print(f'{data.kind.value} {name!r} failed ({failure})')
|
|
print(f' file: {data.filename}')
|
|
print(f' func: {funcname or "-"}')
|
|
print(f' name: {data.name}')
|
|
print(f' data: ...')
|
|
print(f' type unknown: {known}')
|
|
else:
|
|
if fmt in FORMATS:
|
|
raise NotImplementedError(fmt)
|
|
raise ValueError(f'unsupported fmt {fmt!r}')
|
|
return handle_failure, handle_after, div
|
|
|
|
|
|
#######################################
|
|
# the formats
|
|
|
|
def fmt_raw(analysis):
|
|
for item in analysis:
|
|
yield from item.render('raw')
|
|
|
|
|
|
def fmt_brief(analysis):
|
|
# XXX Support sorting.
|
|
items = sorted(analysis)
|
|
for kind in KINDS:
|
|
if kind is KIND.STATEMENT:
|
|
continue
|
|
for item in items:
|
|
if item.kind is not kind:
|
|
continue
|
|
yield from item.render('brief')
|
|
yield f' total: {len(items)}'
|
|
|
|
|
|
def fmt_summary(analysis):
|
|
# XXX Support sorting and grouping.
|
|
items = list(analysis)
|
|
total = len(items)
|
|
|
|
def section(name):
|
|
_, render = build_section(name, items)
|
|
yield from render()
|
|
|
|
yield from section('types')
|
|
yield from section('functions')
|
|
yield from section('variables')
|
|
yield from section('statements')
|
|
|
|
yield ''
|
|
# yield f'grand total: {len(supported) + len(unsupported)}'
|
|
yield f'grand total: {total}'
|
|
|
|
|
|
def _fmt_one_summary(item, extra=None):
|
|
parent = item.parent or ''
|
|
funcname = parent if isinstance(parent, str) else parent.name
|
|
if extra:
|
|
return f'{item.filename:35}\t{funcname or "-":35}\t{item.name:40}\t{extra}'
|
|
else:
|
|
return f'{item.filename:35}\t{funcname or "-":35}\t{item.name}'
|
|
|
|
|
|
def fmt_full(analysis):
|
|
# XXX Support sorting.
|
|
items = sorted(analysis, key=lambda v: v.key)
|
|
yield ''
|
|
for item in items:
|
|
yield from item.render('full')
|
|
yield ''
|
|
yield f'total: {len(items)}'
|
|
|
|
|
|
FORMATS = {
|
|
'raw': fmt_raw,
|
|
'brief': fmt_brief,
|
|
'summary': fmt_summary,
|
|
'full': fmt_full,
|
|
}
|
|
|
|
|
|
def add_output_cli(parser, *, default='summary'):
|
|
parser.add_argument('--format', dest='fmt', default=default, choices=tuple(FORMATS))
|
|
|
|
def process_args(args, *, argv=None):
|
|
pass
|
|
return process_args
|
|
|
|
|
|
#######################################
|
|
# the commands
|
|
|
|
def _cli_check(parser, checks=None, **kwargs):
|
|
if isinstance(checks, str):
|
|
checks = [checks]
|
|
if checks is False:
|
|
process_checks = None
|
|
elif checks is None:
|
|
process_checks = add_checks_cli(parser)
|
|
elif len(checks) == 1 and type(checks) is not dict and re.match(r'^<.*>$', checks[0]):
|
|
check = checks[0][1:-1]
|
|
def process_checks(args, *, argv=None):
|
|
args.checks = [check]
|
|
else:
|
|
process_checks = add_checks_cli(parser, checks=checks)
|
|
process_progress = add_progress_cli(parser)
|
|
process_output = add_output_cli(parser, default=None)
|
|
process_files = add_files_cli(parser, **kwargs)
|
|
return [
|
|
process_checks,
|
|
process_progress,
|
|
process_output,
|
|
process_files,
|
|
]
|
|
|
|
|
|
def cmd_check(filenames, *,
|
|
checks=None,
|
|
ignored=None,
|
|
fmt=None,
|
|
failfast=False,
|
|
iter_filenames=None,
|
|
relroot=fsutil.USE_CWD,
|
|
track_progress=None,
|
|
verbosity=VERBOSITY,
|
|
_analyze=_analyze,
|
|
_CHECKS=CHECKS,
|
|
**kwargs
|
|
):
|
|
if not checks:
|
|
checks = _CHECKS
|
|
elif isinstance(checks, str):
|
|
checks = [checks]
|
|
checks = [_CHECKS[c] if isinstance(c, str) else c
|
|
for c in checks]
|
|
printer = Printer(verbosity)
|
|
(handle_failure, handle_after, div
|
|
) = _get_check_handlers(fmt, printer, verbosity)
|
|
|
|
filenames, relroot = fsutil.fix_filenames(filenames, relroot=relroot)
|
|
filenames = filter_filenames(filenames, iter_filenames, relroot)
|
|
if track_progress:
|
|
filenames = track_progress(filenames)
|
|
|
|
logger.info('analyzing files...')
|
|
analyzed = _analyze(filenames, **kwargs)
|
|
analyzed.fix_filenames(relroot, normalize=False)
|
|
decls = filter_forward(analyzed, markpublic=True)
|
|
|
|
logger.info('checking analysis results...')
|
|
failed = []
|
|
for data, failure in _check_all(decls, checks, failfast=failfast):
|
|
if data is None:
|
|
printer.info('stopping after one failure')
|
|
break
|
|
if div is not None and len(failed) > 0:
|
|
printer.info(div)
|
|
failed.append(data)
|
|
handle_failure(failure, data)
|
|
handle_after()
|
|
|
|
printer.info('-------------------------')
|
|
logger.info(f'total failures: {len(failed)}')
|
|
logger.info('done checking')
|
|
|
|
if fmt == 'summary':
|
|
print('Categorized by storage:')
|
|
print()
|
|
from .match import group_by_storage
|
|
grouped = group_by_storage(failed, ignore_non_match=False)
|
|
for group, decls in grouped.items():
|
|
print()
|
|
print(group)
|
|
for decl in decls:
|
|
print(' ', _fmt_one_summary(decl))
|
|
print(f'subtotal: {len(decls)}')
|
|
|
|
if len(failed) > 0:
|
|
sys.exit(len(failed))
|
|
|
|
|
|
def _cli_analyze(parser, **kwargs):
|
|
process_progress = add_progress_cli(parser)
|
|
process_output = add_output_cli(parser)
|
|
process_files = add_files_cli(parser, **kwargs)
|
|
return [
|
|
process_progress,
|
|
process_output,
|
|
process_files,
|
|
]
|
|
|
|
|
|
# XXX Support filtering by kind.
|
|
def cmd_analyze(filenames, *,
|
|
fmt=None,
|
|
iter_filenames=None,
|
|
relroot=fsutil.USE_CWD,
|
|
track_progress=None,
|
|
verbosity=None,
|
|
_analyze=_analyze,
|
|
formats=FORMATS,
|
|
**kwargs
|
|
):
|
|
verbosity = verbosity if verbosity is not None else 3
|
|
|
|
try:
|
|
do_fmt = formats[fmt]
|
|
except KeyError:
|
|
raise ValueError(f'unsupported fmt {fmt!r}')
|
|
|
|
filenames, relroot = fsutil.fix_filenames(filenames, relroot=relroot)
|
|
filenames = filter_filenames(filenames, iter_filenames, relroot)
|
|
if track_progress:
|
|
filenames = track_progress(filenames)
|
|
|
|
logger.info('analyzing files...')
|
|
analyzed = _analyze(filenames, **kwargs)
|
|
analyzed.fix_filenames(relroot, normalize=False)
|
|
decls = filter_forward(analyzed, markpublic=True)
|
|
|
|
for line in do_fmt(decls):
|
|
print(line)
|
|
|
|
|
|
def _cli_data(parser, filenames=None, known=None):
|
|
ArgumentParser = type(parser)
|
|
common = ArgumentParser(add_help=False)
|
|
# These flags will get processed by the top-level parse_args().
|
|
add_verbosity_cli(common)
|
|
add_traceback_cli(common)
|
|
|
|
subs = parser.add_subparsers(dest='datacmd')
|
|
|
|
sub = subs.add_parser('show', parents=[common])
|
|
if known is None:
|
|
sub.add_argument('--known', required=True)
|
|
if filenames is None:
|
|
sub.add_argument('filenames', metavar='FILE', nargs='+')
|
|
|
|
sub = subs.add_parser('dump', parents=[common])
|
|
if known is None:
|
|
sub.add_argument('--known')
|
|
sub.add_argument('--show', action='store_true')
|
|
process_progress = add_progress_cli(sub)
|
|
|
|
sub = subs.add_parser('check', parents=[common])
|
|
if known is None:
|
|
sub.add_argument('--known', required=True)
|
|
|
|
def process_args(args, *, argv):
|
|
if args.datacmd == 'dump':
|
|
process_progress(args, argv)
|
|
return process_args
|
|
|
|
|
|
def cmd_data(datacmd, filenames, known=None, *,
|
|
_analyze=_analyze,
|
|
formats=FORMATS,
|
|
extracolumns=None,
|
|
relroot=fsutil.USE_CWD,
|
|
track_progress=None,
|
|
**kwargs
|
|
):
|
|
kwargs.pop('verbosity', None)
|
|
usestdout = kwargs.pop('show', None)
|
|
if datacmd == 'show':
|
|
do_fmt = formats['summary']
|
|
if isinstance(known, str):
|
|
known, _ = _datafiles.get_known(known, extracolumns, relroot)
|
|
for line in do_fmt(known):
|
|
print(line)
|
|
elif datacmd == 'dump':
|
|
filenames, relroot = fsutil.fix_filenames(filenames, relroot=relroot)
|
|
if track_progress:
|
|
filenames = track_progress(filenames)
|
|
analyzed = _analyze(filenames, **kwargs)
|
|
analyzed.fix_filenames(relroot, normalize=False)
|
|
if known is None or usestdout:
|
|
outfile = io.StringIO()
|
|
_datafiles.write_known(analyzed, outfile, extracolumns,
|
|
relroot=relroot)
|
|
print(outfile.getvalue())
|
|
else:
|
|
_datafiles.write_known(analyzed, known, extracolumns,
|
|
relroot=relroot)
|
|
elif datacmd == 'check':
|
|
raise NotImplementedError(datacmd)
|
|
else:
|
|
raise ValueError(f'unsupported data command {datacmd!r}')
|
|
|
|
|
|
COMMANDS = {
|
|
'check': (
|
|
'analyze and fail if the given C source/header files have any problems',
|
|
[_cli_check],
|
|
cmd_check,
|
|
),
|
|
'analyze': (
|
|
'report on the state of the given C source/header files',
|
|
[_cli_analyze],
|
|
cmd_analyze,
|
|
),
|
|
'data': (
|
|
'check/manage local data (e.g. known types, ignored vars, caches)',
|
|
[_cli_data],
|
|
cmd_data,
|
|
),
|
|
}
|
|
|
|
|
|
#######################################
|
|
# the script
|
|
|
|
def parse_args(argv=sys.argv[1:], prog=sys.argv[0], *, subset=None):
|
|
import argparse
|
|
parser = argparse.ArgumentParser(
|
|
prog=prog or get_prog(),
|
|
)
|
|
|
|
processors = add_commands_cli(
|
|
parser,
|
|
commands={k: v[1] for k, v in COMMANDS.items()},
|
|
commonspecs=[
|
|
add_verbosity_cli,
|
|
add_traceback_cli,
|
|
],
|
|
subset=subset,
|
|
)
|
|
|
|
args = parser.parse_args(argv)
|
|
ns = vars(args)
|
|
|
|
cmd = ns.pop('cmd')
|
|
|
|
verbosity, traceback_cm = process_args_by_key(
|
|
args,
|
|
argv,
|
|
processors[cmd],
|
|
['verbosity', 'traceback_cm'],
|
|
)
|
|
# "verbosity" is sent to the commands, so we put it back.
|
|
args.verbosity = verbosity
|
|
|
|
return cmd, ns, verbosity, traceback_cm
|
|
|
|
|
|
def main(cmd, cmd_kwargs):
|
|
try:
|
|
run_cmd = COMMANDS[cmd][0]
|
|
except KeyError:
|
|
raise ValueError(f'unsupported cmd {cmd!r}')
|
|
run_cmd(**cmd_kwargs)
|
|
|
|
|
|
if __name__ == '__main__':
|
|
cmd, cmd_kwargs, verbosity, traceback_cm = parse_args()
|
|
configure_logger(verbosity)
|
|
with traceback_cm:
|
|
main(cmd, cmd_kwargs)
|