| #!/usr/bin/env python3 |
| # Copyright 2023 The Chromium Authors |
| # Use of this source code is governed by a BSD-style license that can be |
| # found in the LICENSE file. |
| """Samples clang-tidy results from a JSON file. |
| |
| Provides information about number of checks triggered and a summary of some of |
| the checks with links back to code search. |
| |
| Usage: |
| tools/sample_clang_tidy_results.py out/all_findings.json |
| """ |
| |
| import argparse |
| import collections |
| import functools |
| import json |
| import logging |
| import os |
| import random |
| import subprocess |
| import sys |
| from pathlib import Path |
| from typing import Any, Dict, List |
| |
| |
| @functools.lru_cache(maxsize=None) |
| def get_src_path() -> str: |
| src_path = Path(__file__).parent.parent.resolve() |
| if not src_path: |
| raise NotFoundError( |
| 'Could not find checkout in any parent of the current path.') |
| return src_path |
| |
| |
| @functools.lru_cache(maxsize=None) |
| def git_rev_parse_head(path: Path): |
| if (path / '.git').exists(): |
| return subprocess.check_output(['git', 'rev-parse', 'HEAD'], |
| encoding='utf-8', |
| cwd=path).strip() |
| return git_rev_parse_head(path.parent) |
| |
| |
| def convert_diag_to_cs(diag: Dict[str, Any]) -> str: |
| path = diag['file_path'] |
| line = diag['line_number'] |
| name = diag['diag_name'] |
| replacement = '\n'.join(x['new_text'] for x in diag['replacements']) |
| |
| sha = git_rev_parse_head(get_src_path() / path) |
| |
| # https://source.chromium.org/chromium/chromium/src/+/main:apps/app_restore_service.cc |
| sha_and_path = f'{sha}:{path}' |
| return { |
| 'name': |
| name, |
| 'path': ('https://source.chromium.org/chromium/chromium/src/+/' |
| f'{sha}:{path};l={line}'), |
| 'replacement': |
| replacement |
| } |
| |
| |
| @functools.lru_cache(maxsize=None) |
| def is_first_party_path(path: Path) -> bool: |
| if path == get_src_path(): |
| return True |
| |
| if path == '/': |
| return False |
| |
| if (path / '.git').exists() or (path / '.gclient').exists(): |
| return False |
| |
| return is_first_party_path(path.parent) |
| |
| |
| def is_first_party_diag(diag: Dict[str, Any]) -> bool: |
| path = diag['file_path'] |
| if path.startswith('out/') or path.startswith('/'): |
| return False |
| return is_first_party_path(get_src_path() / path) |
| |
| |
| def select_random_diags(diags: List[Dict[str, Any]], number: int) -> List[Any]: |
| first_party = [x for x in diags if is_first_party_diag(x)] |
| if len(first_party) <= number: |
| return first_party |
| return random.sample(first_party, number) |
| |
| |
| def is_diag_in_test_file(diag: Dict[str, Any]) -> bool: |
| file_stem = os.path.splitext(diag['file_path'])[0] |
| return (file_stem.endswith('test') or file_stem.endswith('tests') |
| or '_test_' in file_stem or '_unittest_' in file_stem) |
| |
| |
| def is_diag_in_third_party(diag: Dict[str, Any]) -> bool: |
| return 'third_party' in diag['file_path'] |
| |
| |
| def main(argv: List[str]): |
| logging.basicConfig( |
| format='>> %(asctime)s: %(levelname)s: %(filename)s:%(lineno)d: ' |
| '%(message)s', |
| level=logging.INFO, |
| ) |
| |
| parser = argparse.ArgumentParser( |
| description=__doc__, |
| formatter_class=argparse.RawDescriptionHelpFormatter, |
| ) |
| parser.add_argument('-n', |
| '--number', |
| type=int, |
| default=30, |
| help='How many checks to sample') |
| parser.add_argument('--ignore-tests', |
| action='store_true', |
| help='Filters lints in test/unittest files if specified.') |
| parser.add_argument('--include-third-party', |
| action='store_true', |
| help='Includes lints in third_party if specified.') |
| parser.add_argument('file', help='JSON file to parse') |
| opts = parser.parse_args(argv) |
| |
| with open(opts.file) as f: |
| data = json.load(f) |
| |
| print(f'Files with tidy errors: {len(data["failed_tidy_files"])}') |
| print(f'Timed out files: {len(data["timed_out_src_files"])}') |
| diags = data['diagnostics'] |
| |
| if not opts.include_third_party: |
| new_diags = [x for x in diags if not is_diag_in_third_party(x)] |
| print(f'Dropped {len(diags) - len(new_diags)} diags from third_party') |
| diags = new_diags |
| |
| if opts.ignore_tests: |
| new_diags = [x for x in diags if not is_diag_in_test_file(x)] |
| print(f'Dropped {len(diags) - len(new_diags)} diags from test files') |
| diags = new_diags |
| |
| counts = collections.defaultdict(int) |
| for x in diags: |
| name = x['diag_name'] |
| counts[name] += 1 |
| |
| print(f'Total number of diagnostics: {len(diags)}') |
| for x in sorted(counts.keys()): |
| print(f'\t{x}: {counts[x]}') |
| print() |
| |
| diags = select_random_diags(diags, opts.number) |
| data = [convert_diag_to_cs(x) for x in diags] |
| print(f'** Sample of first-party lints: **') |
| for x in data: |
| print(x['path']) |
| print(f'\tDiagnostic: {x["name"]}') |
| print(f'\tReplacement: {x["replacement"]}') |
| print() |
| |
| print('** Link summary **') |
| for x in data: |
| print(x['path']) |
| |
| |
| if __name__ == '__main__': |
| main(sys.argv[1:]) |