#!/usr/bin/env python3 # -*- coding: utf-8 -*- # ------------------------------------------------------------------------------ # Copyright (c) 2022 Michael Richters # This is free and unencumbered software released into the public domain. # Anyone is free to copy, modify, publish, use, compile, sell, or # distribute this software, either in source code form or as a compiled # binary, for any purpose, commercial or non-commercial, and by any # means. # In jurisdictions that recognize copyright laws, the author or authors # of this software dedicate any and all copyright interest in the # software to the public domain. We make this dedication for the benefit # of the public at large and to the detriment of our heirs and # successors. We intend this dedication to be an overt act of # relinquishment in perpetuity of all present and future rights to this # software under copyright law. # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, # EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF # MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. # IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR ANY CLAIM, DAMAGES OR # OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, # ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR # OTHER DEALINGS IN THE SOFTWARE. # For more information, please refer to # ------------------------------------------------------------------------------ """This is a script for maintenance of the headers included in Kaleidoscope source files. It is not currently possible to run this automatically on all Kaleidoscope source files, because of the peculiarities therein. It uses llvm/clang to determine which headers should be included in a given file, but there's no avr-clang, so we're limited to using the virtual hardware device. It takes any number of source files as its input, examines them and updates the list of header `#include` directives. It is safe to run on most Kaleidoscope source files, and a good idea to run it on new ones (after staging them, so you can easily see what changes have been made). """ # Example invocation: # $ git ls-files -m | grep '\.\(h\|cpp\)' | bin/iwyu.py import argparse import glob import logging import os import re import shlex import shutil import subprocess import sys # ============================================================================== def parse_args(args): parser = argparse.ArgumentParser( description= """Run `include-what-you-use` on source files given as command-line arguments and/or read from standard input. When reading target filenames from standard input, they should be either absolute or relative to the current directory, and each line of input (minus the line-ending character(s) is treated as a filename.""") parser.add_argument( '-q', '--quiet', dest='loglevel', help="Suppress output except warnings and errors.", action='store_const', const=logging.ERROR, default=logging.WARNING, ) parser.add_argument( '-v', '--verbose', dest='loglevel', help="Output verbose debugging information.", action='store_const', const=logging.INFO, ) parser.add_argument( '-d', '--debug', dest='loglevel', help="""Save output from `include-what-you-use` for processed files beside the originals, with a '.iwyu' suffix, for debugging purposes.""", action='store_const', const=logging.DEBUG, ) parser.add_argument( '-r', '--regex', dest='regex', help="""A regular expression for matching filenames Only the basename of the file is matched, and the regex is only used when searching a directory for files to process, not on target filenames specified in arguments or read from standard input.""", action='store', default=r'\.(h|cpp)$', ) parser.add_argument( '-i', '--ignores_file', dest='ignores_file', metavar='', help= """The name of a file (relative to KALEIDOSCOPE_DIR) that contains a list of glob patterns that will be ignored when a target directory is searched for filenames that match .""", action='store', default='.iwyu_ignore', ) parser.add_argument( 'targets', metavar="", nargs='+', help= """A list of target files and/or directories to search for source files to format. Any target file will be processed, regardless of the filename. Any target directory will be recursively searched for files matching the regular expression given by --regex. Filenames and directories beginning with a '.' will always be excluded from the search, but can still be processed if specified as a command-line target.""", ) return parser.parse_args(args) # ============================================================================== def setup_logging(loglevel): """Set up basic logging Args: :int:loglevel: minimum loglevel for emitting messages """ logformat = "%(message)s" logging.basicConfig( level=loglevel, stream=sys.stdout, format=logformat, datefmt="", ) # ============================================================================== def main(): """Main entry point function.""" # Parse command-line arguments: opts = parse_args(sys.argv[1:]) # Set up logging system: setup_logging(opts.loglevel) # ---------------------------------------------------------------------- # Find include-what-you-use: iwyu = shutil.which('include-what-you-use') logging.info("Found `include-what-you-use` executable: %s", iwyu) iwyu_opts = [ '--no_fwd_decls', # No forward declarations '--max_line_length=100', '--update_comments', ] # Prepend '-Xiwyu' to each `include-what-you-use` option: iwyu_opts = [_ for opt in iwyu_opts for _ in ('-Xiwyu', opt)] # ---------------------------------------------------------------------- # Find fix_includes: fix_includes = shutil.which('fix_includes.py') logging.debug("Found `fix_includes` executable: %s", fix_includes) # ---------------------------------------------------------------------- # Find clang (first checking environment variable): clang = os.getenv('CLANG_COMPILER') if clang is None: clang = shutil.which('clang') logging.debug("Found `clang` executable: %s", clang) # Get system include dir from `clang`: clang_cmd = [clang, '-print-resource-dir'] logging.debug("Running command: `%s`", shlex.join(clang_cmd)) result = subprocess.run(clang_cmd, capture_output=True, check=True) clang_resource_dir = result.stdout.decode('utf-8').rstrip() system_include_dir = os.path.join(clang_resource_dir, 'include') logging.debug("Using system include dir: %s", system_include_dir) # ---------------------------------------------------------------------- # Get $KALEIDOSCOPE_DIR from enironment, falling back on `pwd`: kaleidoscope_dir = os.getenv('KALEIDOSCOPE_DIR') if kaleidoscope_dir is None: kaleidoscope_dir = os.getcwd() logging.debug("Using Kaleidoscope dir: %s", kaleidoscope_dir) kaleidoscope_src_dir = os.path.join(kaleidoscope_dir, 'src') # Define locations of other dirs to find Arduino libraries: virtual_hardware_dir = os.path.join( kaleidoscope_dir, '.arduino', 'user', 'hardware', 'keyboardio', 'virtual') logging.debug("Using virtual hardware dir: %s", virtual_hardware_dir) virtual_arduino_core_dir = os.path.join(virtual_hardware_dir, 'cores', 'arduino') logging.debug("Using virtual arduino core: %s", virtual_arduino_core_dir) virtual_model01_dir = os.path.join(virtual_hardware_dir, 'variants', 'model01') logging.debug("Using virtual Model01 dir: %s", virtual_model01_dir) virtual_keyboardiohid_dir = os.path.join( virtual_hardware_dir, 'libraries', 'KeyboardioHID', 'src') logging.debug("Using virtual KeyboardioHID dir: %s", virtual_keyboardiohid_dir) # ---------------------------------------------------------------------- # Create the long list of options passed to `clang` via `include-what-you-use`. # First, we tell it we're using C++: clang_opts = ['-x', 'c++'] # General compiler options: clang_opts += [ '-c', '-g', '-Wall', '-Wextra', '-std=gnu++14', # Not `c++14`, because we're using clang, not gcc '-ffunction-sections', '-fdata-sections', '-fno-threadsafe-statics', '-MMD', '-Woverloaded-virtual', '-Wno-unused-parameter', '-Wno-unused-variable', '-Wno-ignored-qualifiers', '-Wno-type-limits', '-Wno-pragma-once-outside-header', ] # Variables we define to do a Kaleidoscope build: defines = [ 'KALEIDOSCOPE_VIRTUAL_BUILD=1', 'KEYBOARDIOHID_BUILD_WITHOUT_HID=1', 'USBCON=dummy', 'ARDUINO_ARCH_AVR=1', 'ARDUINO=10607', 'ARDUINO_AVR_MODEL01', 'ARDUINO_ARCH_VIRTUAL', 'USB_VID=0x1209', 'USB_PID=0x2301', 'USB_MANUFACTURER="Keyboardio"', 'USB_PRODUCT="Model 01"', 'KALEIDOSCOPE_HARDWARE_H="Kaleidoscope-Hardware-Keyboardio-Model01.h"', 'TWI_BUFFER_LENGTH=32', ] clang_opts += ['-D' + _ for _ in defines] # Directories to search for libraries to include: includes = [ system_include_dir, kaleidoscope_src_dir, virtual_arduino_core_dir, virtual_model01_dir, virtual_keyboardiohid_dir, ] # Include plugin source dirs for plugins that depend on other plugins: includes += glob.glob(os.path.join(kaleidoscope_dir, 'plugins', '*', 'src')) clang_opts += ['-I' + _ for _ in includes] # ---------------------------------------------------------------------- # Define the `include-what-you-use` command (sans target files) iwyu_cmd = [iwyu] + iwyu_opts + clang_opts logging.debug("Using IWYU command: %s", ' \\\n\t'.join(iwyu_cmd)) fix_includes_cmd = [ fix_includes, '--update_comments', '--nosafe_headers', '--reorder', '--separate_project_includes=' + kaleidoscope_src_dir, # Does this help? ] logging.debug("Using `fix_includes` command: %s", ' \\\n\t'.join(fix_includes_cmd)) # ---------------------------------------------------------------------- targets = opts.targets # If stdin is a pipe, read pathname targets, one per line. This allows us to # connect the output of `find` to our input conveniently: if not sys.stdin.isatty(): targets += sys.stdin.read().splitlines() # ---------------------------------------------------------------------- iwyu_ignores_file = os.path.join(kaleidoscope_dir, opts.ignores_file) ignores = build_ignores_list(iwyu_ignores_file) # ---------------------------------------------------------------------- regex = re.compile(opts.regex) exit_code = 0 for src in (_ for t in targets for _ in build_target_list(t, regex)): if src in ignores: logging.info("Skipping ignored file: %s", os.path.relpath(src)) continue if not run_iwyu(os.path.relpath(src), iwyu_cmd, fix_includes_cmd): exit_code = 1 return exit_code # ============================================================================== def build_target_list(path, src_regex): """Docstring""" logging.debug("Searching target: %s", path) # If the specified path is a filename, return it (as a list), regardless of # whether or not it matches the regex. if os.path.isfile(path): return [path] # If the specified path is not valid, just return an empty list. if not os.path.isdir(path): logging.error("Error: File not found: %s", path) return [] # The specified path is a directory, so we search recursively for files # contained therein that match the specified regular expression. targets = [] for root, dirs, files in os.walk(os.path.abspath(path)): logging.debug("Searching dir: %s", root) # First, ignore all dotfiles (and directories). dotfiles = set(glob.glob('.*')) dirs = set(dirs) - dotfiles files = set(files) - dotfiles logging.debug("Files found: %s", ', '.join(files)) # Add all matching files to the list of source files to be formatted. for f in filter(src_regex.search, files): logging.debug("Source file found: %s", f) targets.append(os.path.join(root, f)) return [os.path.abspath(_) for _ in targets] # ============================================================================== def build_ignores_list(ignores_file_path): logging.debug("Searching for ignores file: %s", ignores_file_path) # If the ignores file doesn't exist, return an empty list: if not os.path.isfile(ignores_file_path): logging.debug("Ignores file not found") return [] ignores_list = [] with open(ignores_file_path) as f: for line in f.read().splitlines(): logging.debug("Ignoring files like: %s", line) if line.startswith('#'): continue ignores_list += glob.glob(line, recursive=True) ignores_file_dir = os.path.dirname(ignores_file_path) with cwd(ignores_file_dir): ignores_list[:] = [os.path.abspath(_) for _ in ignores_list] logging.debug("Ignores list:\n\t%s", "\n\t".join(ignores_list)) return ignores_list # ------------------------------------------------------------------------------ from contextlib import contextmanager @contextmanager def cwd(path): """A simple function change directory, an automatically restore the previous working directory when done, using `with cwd(temp_dir):`""" old_wd = os.getcwd() os.chdir(path) try: yield finally: os.chdir(old_wd) # ============================================================================== def run_iwyu(source_file, iwyu_cmd, fix_includes_cmd): """Run `include-what-you-use` on , an update that file's header includes by sending the output to `fix_includes.py`. If either command returns an error code, return `False`, otherwise return `True`.""" logging.info("Processing file: %s", source_file) # Run IWYU on iwyu_proc = subprocess.run(iwyu_cmd + [source_file], capture_output=True, check=False) # If IWYU returns an error, report on it: if iwyu_proc.returncode != 0: logging.error("Error: failed to parse file: %s", source_file) logging.debug("IWYU returned: %s", iwyu_proc.returncode) logging.debug("STDOUT:\n%s", iwyu_proc.stdout.decode('utf-8')) logging.debug("STDERR:\n%s", iwyu_proc.stderr.decode('utf-8')) # In addition to reporting the error, save the output for analysis: with open(source_file + '.iwyu', 'wb') as f: f.write(iwyu_proc.stderr) # Don't run fix_includes if there was an error (or if we've got an old version of IWYU # that returns bogus exit codes): return False # IWYU reports on the associated header of *.cpp files, but if we want to skip processing # that header, we need to use only the part of the output for the *.cpp file. Fortunately, # the header is listed first, so we only need to search for the start of the target file's # section of the output. n = iwyu_proc.stderr.find(f"\n{source_file} should".encode('utf-8')) iwyu_stderr = iwyu_proc.stderr[n:] # Run fix_includes.py, using the output (stderr) of IWYU: fix_includes_proc = subprocess.run( fix_includes_cmd, input=iwyu_stderr, capture_output=True, check=False) # Report any errors returned by fix_includes.py: if fix_includes_proc.returncode != 0: logging.error("Error: failed to fix includes for file: %s", source_file) logging.debug("fix_includes.py returned: %s", fix_includes_proc.returncode) logging.debug("STDOUT:\n%s", fix_includes_proc.stdout.decode('utf-8')) logging.debug("STDERR:\n%s", fix_includes_proc.stderr.decode('utf-8')) return False # Return true on success, false otherwise: return True # ============================================================================== if __name__ == "__main__": try: sys.exit(main()) except KeyboardInterrupt: logging.info("Aborting") sys.exit(1)