#!/usr/bin/env python3 # vim: set syntax=python ts=4 : # Copyright (c) 2020 Intel Corporation # SPDX-License-Identifier: Apache-2.0 """Zephyr Test Runner (twister) Also check the "User and Developer Guides" at https://docs.zephyrproject.org/ This script scans for the set of unit test applications in the git repository and attempts to execute them. By default, it tries to build each test case on one platform per architecture, using a precedence list defined in an architecture configuration file, and if possible run the tests in any available emulators or simulators on the system. Test cases are detected by the presence of a 'testcase.yaml' or a 'sample.yaml' file in the application's project directory. This file may contain one or more blocks, each identifying a test scenario. The title of the block is a name for the test case, which only needs to be unique for the test cases specified in that testcase meta-data. The full canonical name for each test case is <path to test case>/<block>. Each test block in the testcase meta data can define the following key/value pairs: tags: (required) A set of string tags for the testcase. Usually pertains to functional domains but can be anything. Command line invocations of this script can filter the set of tests to run based on tag. skip: (default False) skip testcase unconditionally. This can be used for broken tests. slow: (default False) Don't build or run this test case unless --enable-slow was passed in on the command line. Intended for time-consuming test cases that are only run under certain circumstances, like daily builds. extra_args: Extra cache entries to pass to CMake when building or running the test case. extra_configs: Extra configuration options to be merged with a master prj.conf when building or running the test case. build_only: (default False) If true, don't try to run the test even if the selected platform supports it. build_on_all: (default False) If true, attempt to build test on all available platforms. 
depends_on: A board or platform can announce what features it supports, this option will enable the test only on those platforms that provide this feature. min_ram: minimum amount of RAM needed for this test to build and run. This is compared with information provided by the board metadata. min_flash: minimum amount of ROM needed for this test to build and run. This is compared with information provided by the board metadata. timeout: Length of time to run test in emulator before automatically killing it. Defaults to 60 seconds. arch_allow: Set of architectures that this test case should only be run for. arch_exclude: Set of architectures that this test case should not run on. platform_allow: Set of platforms that this test case should only be run for. platform_exclude: Set of platforms that this test case should not run on. extra_sections: When computing sizes, twister will report errors if it finds extra, unexpected sections in the Zephyr binary unless they are named here. They will not be included in the size calculation. filter: Filter whether the testcase should be run by evaluating an expression against an environment containing the following values: { ARCH : <architecture>, PLATFORM : <platform>, <all CONFIG_* key/value pairs in the test's generated defconfig>, <all DT_* key/value pairs in the test's generated device tree file>, <all CMake key/value pairs in the test's generated CMakeCache.txt file>, *<env>: any environment variable available } The grammar for the expression language is as follows: expression ::= expression "and" expression | expression "or" expression | "not" expression | "(" expression ")" | symbol "==" constant | symbol "!=" constant | symbol "<" number | symbol ">" number | symbol ">=" number | symbol "<=" number | symbol "in" list | symbol ":" string | symbol list ::= "[" list_contents "]" list_contents ::= constant | list_contents "," constant constant ::= number | string For the case where expression ::= symbol, it evaluates to true if the symbol is defined to a non-empty string. 
Operator precedence, starting from lowest to highest: or (left associative) and (left associative) not (right associative) all comparison operators (non-associative) arch_allow, arch_exclude, platform_allow, platform_exclude are all syntactic sugar for these expressions. For instance arch_exclude = x86 arc Is the same as: filter = not ARCH in ["x86", "arc"] The ':' operator compiles the string argument as a regular expression, and then returns a true value only if the symbol's value in the environment matches. For example, if CONFIG_SOC="stm32f107xc" then filter = CONFIG_SOC : "stm.*" Would match it. The set of test cases that actually run depends on directives in the testcase file and options passed in on the command line. If there is any confusion, running with -v or examining the discard report (twister_discard.csv) can help show why particular test cases were skipped. Metrics (such as pass/fail state and binary size) for the last code release are stored in scripts/release/twister_last_release.csv. To update this, pass the --all --release options. To load arguments from a file, write '+' before the file name, e.g., +file_name. File content must be one or more valid arguments separated by line breaks instead of white space. Most everyday users will run with no arguments. """ import os import argparse import sys import logging import time import itertools import shutil from collections import OrderedDict import multiprocessing from itertools import islice import csv from colorama import Fore from pathlib import Path from multiprocessing.managers import BaseManager import queue ZEPHYR_BASE = os.getenv("ZEPHYR_BASE") if not ZEPHYR_BASE: # This file has been zephyr/scripts/twister for years, # and that is not going to change anytime soon. Let the user # run this script as ./scripts/twister without making them # set ZEPHYR_BASE. ZEPHYR_BASE = str(Path(__file__).resolve().parents[1]) # Propagate this decision to child processes. 
def size_report(sc):
    """Log a per-section size table for one binary.

    Args:
        sc: Size information for the binary. Must expose ``filename``,
            ``sections`` (an iterable of mappings with the keys ``name``,
            ``virt_addr``, ``load_addr``, ``size`` and ``type``),
            ``rom_size`` and ``ram_size``.
    """
    logger.info(sc.filename)
    # Build the header from the same column widths as the rows below so the
    # titles always line up with the values.
    logger.info("%-17s %10s %10s %8s %7s %s",
                "SECTION NAME", "VMA", "LMA", "SIZE", "HEX SZ", "TYPE")
    for section in sc.sections:
        # The size is printed twice on purpose: once decimal, once hex.
        logger.info("%-17s 0x%08x 0x%08x %8d 0x%05x %-7s",
                    section["name"], section["virt_addr"],
                    section["load_addr"], section["size"],
                    section["size"], section["type"])

    logger.info("Totals: %d bytes (ROM), %d bytes (RAM)",
                sc.rom_size, sc.ram_size)
    logger.info("")


def export_tests(filename, tests):
    """Write test identifiers to a CSV file, one row per test.

    Each identifier is split on ``.``: the first component becomes the
    capitalized ``section`` and the second, with underscores turned into
    spaces and title-cased, becomes the ``subsection``. The full identifier
    is stored in both ``title`` and ``reference``. No header row is written.

    Args:
        filename: Path of the CSV file to create (overwritten if present).
        tests: Iterable of dotted test identifier strings.

    Identifiers without a ``.`` cannot be mapped to a section/subsection;
    they are reported through the logger and skipped.
    """
    fieldnames = ['section', 'subsection', 'title', 'reference']
    # newline="" leaves line endings entirely to the csv writer. Without it
    # the text layer translates the "\n" contained in os.linesep a second
    # time, which produces "\r\r\n" row endings on Windows.
    with open(filename, "wt", newline="") as csvfile:
        cw = csv.DictWriter(csvfile, fieldnames, lineterminator=os.linesep)
        for test in tests:
            data = test.split(".")
            if len(data) < 2:
                logger.error("%s can't be exported: identifier has no '.' "
                             "separating section and subsection", test)
                continue

            cw.writerow({
                "section": data[0].capitalize(),
                "subsection": " ".join(data[1].split("_")).title(),
                "title": test,
                "reference": test,
            })
__/fifo_api/testcase.yaml """) parser.add_argument("--force-toolchain", action="store_true", help="Do not filter based on toolchain, use the set " " toolchain unconditionally") parser.add_argument( "-p", "--platform", action="append", help="Platform filter for testing. This option may be used multiple " "times. Testcases will only be built/run on the platforms " "specified. If this option is not used, then platforms marked " "as default in the platform metadata file will be chosen " "to build and test. ") parser.add_argument("-P", "--exclude-platform", action="append", default=[], help="""Exclude platforms and do not build or run any tests on those platforms. This option can be called multiple times. """ ) parser.add_argument( "-a", "--arch", action="append", help="Arch filter for testing. Takes precedence over --platform. " "If unspecified, test all arches. Multiple invocations " "are treated as a logical 'or' relationship") parser.add_argument( "-t", "--tag", action="append", help="Specify tags to restrict which tests to run by tag value. " "Default is to not do any tag filtering. Multiple invocations " "are treated as a logical 'or' relationship") parser.add_argument("-e", "--exclude-tag", action="append", help="Specify tags of tests that should not run. " "Default is to run all tests with all tags.") case_select.add_argument( "-f", "--only-failed", action="store_true", help="Run only those tests that failed the previous twister run " "invocation.") parser.add_argument( "--retry-failed", type=int, default=0, help="Retry failing tests again, up to the number of times specified.") parser.add_argument( "--retry-interval", type=int, default=60, help="Retry failing tests after specified period of time.") test_xor_subtest = case_select.add_mutually_exclusive_group() test_xor_subtest.add_argument( "-s", "--test", action="append", help="Run only the specified test cases. 
These are named by " "") test_xor_subtest.add_argument( "--sub-test", action="append", help="""Recursively find sub-test functions and run the entire test section where they were found, including all sibling test functions. Sub-tests are named by: section.name.in.testcase.yaml.function_name_without_test_prefix Example: kernel.fifo.poll.fifo_loop """) parser.add_argument( "-l", "--all", action="store_true", help="Build/test on all platforms. Any --platform arguments " "ignored.") parser.add_argument( "-o", "--report-dir", help="""Output reports containing results of the test run into the specified directory. The output will be both in CSV and JUNIT format (twister.csv and twister.xml). """) parser.add_argument( "--json-report", action="store_true", help="""Generate a JSON file with all test results. [Experimental] """) parser.add_argument( "--platform-reports", action="store_true", help="""Create individual reports for each platform. """) parser.add_argument( "--report-name", help="""Create a report with a custom name. """) parser.add_argument( "--report-suffix", help="""Add a suffix to all generated file names, for example to add a version or a commit ID. """) parser.add_argument("--report-excluded", action="store_true", help="""List all tests that are never run based on current scope and coverage. If you are looking for accurate results, run this with --all, but this will take a while...""") parser.add_argument("--compare-report", help="Use this report file for size comparison") parser.add_argument( "-B", "--subset", help="Only run a subset of the tests, 1/4 for running the first 25%%, " "3/5 means run the 3rd fifth of the total. 
" "This option is useful when running a large number of tests on " "different hosts to speed up execution time.") parser.add_argument( "-N", "--ninja", action="store_true", help="Use the Ninja generator with CMake") parser.add_argument( "-y", "--dry-run", action="store_true", help="""Create the filtered list of test cases, but don't actually run them. Useful if you're just interested in the discard report generated for every run and saved in the specified output directory (twister_discard.csv). """) parser.add_argument("--list-tags", action="store_true", help="list all tags in selected tests") case_select.add_argument("--list-tests", action="store_true", help="""List of all sub-test functions recursively found in all --testcase-root arguments. Note different sub-tests can share the same section name and come from different directories. The output is flattened and reports --sub-test names only, not their directories. For instance net.socket.getaddrinfo_ok and net.socket.fd_set belong to different directories. """) case_select.add_argument("--test-tree", action="store_true", help="""Output the testsuite in a tree form""") case_select.add_argument("--list-test-duplicates", action="store_true", help="""List tests with duplicate identifiers. """) parser.add_argument("--export-tests", action="store", metavar="FILENAME", help="Export tests case meta-data to a file in CSV format." "Test instances can be exported per target by supplying " "the platform name using --platform option. (tests for only " " one platform can be exported at a time)") parser.add_argument("--timestamps", action="store_true", help="Print all messages with time stamps") parser.add_argument( "-r", "--release", action="store_true", help="Update the benchmark database with the results of this test " "run. Intended to be run by CI when tagging an official " "release. 
This database is used as a basis for comparison " "when looking for deltas in metrics such as footprint") parser.add_argument("-W", "--disable-warnings-as-errors", action="store_true", help="Treat warning conditions as errors") parser.add_argument("--overflow-as-errors", action="store_true", help="Treat RAM/SRAM overflows as errors") parser.add_argument( "-v", "--verbose", action="count", default=0, help="Emit debugging information, call multiple times to increase " "verbosity") parser.add_argument( "-i", "--inline-logs", action="store_true", help="Upon test failure, print relevant log data to stdout " "instead of just a path to it") parser.add_argument("--log-file", metavar="FILENAME", action="store", help="log also to file") parser.add_argument( "-m", "--last-metrics", action="store_true", help="Instead of comparing metrics from the last --release, " "compare with the results of the previous twister " "invocation") parser.add_argument( "-u", "--no-update", action="store_true", help="do not update the results of the last run of the twister run") parser.add_argument( "-G", "--integration", action="store_true", help="Run integration tests") case_select.add_argument( "-F", "--load-tests", metavar="FILENAME", action="store", help="Load list of tests and platforms to be run from file.") parser.add_argument( "--quarantine-list", metavar="FILENAME", help="Load list of test scenarios under quarantine. The entries in " "the file need to correspond to the test scenarios names as in" "corresponding tests .yaml files. 
These scenarios" "will be skipped with quarantine as the reason") parser.add_argument( "--quarantine-verify", action="store_true", help="Use the list of test scenarios under quarantine and run them" "to verify their current status") case_select.add_argument( "-E", "--save-tests", metavar="FILENAME", action="store", help="Append list of tests and platforms to be run to file.") test_or_build = parser.add_mutually_exclusive_group() test_or_build.add_argument( "-b", "--build-only", action="store_true", help="Only build the code, do not execute any of it in QEMU") test_or_build.add_argument( "--test-only", action="store_true", help="""Only run device tests with current artifacts, do not build the code""") parser.add_argument( "--cmake-only", action="store_true", help="Only run cmake, do not build or run.") parser.add_argument( "--filter", choices=['buildable', 'runnable'], default='buildable', help="""Filter tests to be built and executed. By default everything is built and if a test is runnable (emulation or a connected device), it is run. This option allows for example to only build tests that can actually be run. Runnable is a subset of buildable.""") parser.add_argument( "-M", "--runtime-artifact-cleanup", action="store_true", help="Delete artifacts of passing tests.") parser.add_argument( "-j", "--jobs", type=int, help="Number of jobs for building, defaults to number of CPU threads, " "overcommited by factor 2 when --build-only") parser.add_argument( "--show-footprint", action="store_true", help="Show footprint statistics and deltas since last release." ) parser.add_argument( "-H", "--footprint-threshold", type=float, default=5, help="When checking test case footprint sizes, warn the user if " "the new app size is greater then the specified percentage " "from the last release. Default is 5. 0 to warn on any " "increase on app size") parser.add_argument( "-D", "--all-deltas", action="store_true", help="Show all footprint deltas, positive or negative. 
Implies " "--footprint-threshold=0") parser.add_argument( "-O", "--outdir", default=os.path.join(os.getcwd(), "twister-out"), help="Output directory for logs and binaries. " "Default is 'twister-out' in the current directory. " "This directory will be cleaned unless '--no-clean' is set. " "The '--clobber-output' option controls what cleaning does.") parser.add_argument( "-c", "--clobber-output", action="store_true", help="Cleaning the output directory will simply delete it instead " "of the default policy of renaming.") parser.add_argument( "-n", "--no-clean", action="store_true", help="Re-use the outdir before building. Will result in " "faster compilation since builds will be incremental.") case_select.add_argument( "-T", "--testcase-root", action="append", default=[], help="Base directory to recursively search for test cases. All " "testcase.yaml files under here will be processed. May be " "called multiple times. Defaults to the 'samples/' and " "'tests/' directories at the base of the Zephyr tree.") board_root_list = ["%s/boards" % ZEPHYR_BASE, "%s/scripts/pylib/twister/boards" % ZEPHYR_BASE] parser.add_argument( "-A", "--board-root", action="append", default=board_root_list, help="""Directory to search for board configuration files. All .yaml files in the directory will be processed. The directory should have the same structure in the main Zephyr tree: boards///""") parser.add_argument( "-z", "--size", action="append", help="Don't run twister. Instead, produce a report to " "stdout detailing RAM/ROM sizes on the specified filenames. " "All other command line arguments ignored.") parser.add_argument( "-S", "--enable-slow", action="store_true", help="Execute time-consuming test cases that have been marked " "as 'slow' in testcase.yaml. 
Normally these are only built.") parser.add_argument( "-K", "--force-platform", action="store_true", help="""Force testing on selected platforms, even if they are excluded in the test configuration (testcase.yaml)""" ) parser.add_argument( "--disable-unrecognized-section-test", action="store_true", default=False, help="Skip the 'unrecognized section' test.") parser.add_argument("-R", "--enable-asserts", action="store_true", default=True, help="deprecated, left for compatibility") parser.add_argument("--disable-asserts", action="store_false", dest="enable_asserts", help="deprecated, left for compatibility") parser.add_argument("-Q", "--error-on-deprecations", action="store_false", help="Error on deprecation warnings.") parser.add_argument("--enable-size-report", action="store_true", help="Enable expensive computation of RAM/ROM segment sizes.") parser.add_argument( "-x", "--extra-args", action="append", default=[], help="""Extra CMake cache entries to define when building test cases. May be called multiple times. The key-value entries will be prefixed with -D before being passed to CMake. E.g "twister -x=USE_CCACHE=0" will translate to "cmake -DUSE_CCACHE=0" which will ultimately disable ccache. """ ) parser.add_argument( "--emulation-only", action="store_true", help="Only build and run emulation platforms") parser.add_argument( "--device-testing", action="store_true", help="Test on device directly. Specify the serial device to " "use with the --device-serial option.") parser.add_argument( "-X", "--fixture", action="append", default=[], help="Specify a fixture that a board might support") serial = parser.add_mutually_exclusive_group() serial.add_argument("--device-serial", help="""Serial device for accessing the board (e.g., /dev/ttyACM0) """) serial.add_argument("--device-serial-pty", help="""Script for controlling pseudoterminal. Twister believes that it interacts with a terminal when it actually interacts with the script. 
E.g "twister --device-testing --device-serial-pty