| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 1 | #!/usr/bin/env python3 | 
|  | 2 |  | 
|  | 3 | """Sanity checks for test data. | 
| Gilles Peskine | bbb3664 | 2020-07-03 00:30:12 +0200 | [diff] [blame] | 4 |  | 
|  | 5 | This program contains a class for traversing test cases that can be used | 
|  | 6 | independently of the checks. | 
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 7 | """ | 
|  | 8 |  | 
| Bence Szépkúti | 1e14827 | 2020-08-07 13:07:28 +0200 | [diff] [blame] | 9 | # Copyright The Mbed TLS Contributors | 
| Dave Rodgman | 16799db | 2023-11-02 19:47:20 +0000 | [diff] [blame] | 10 | # SPDX-License-Identifier: Apache-2.0 OR GPL-2.0-or-later | 
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 11 |  | 
| Gilles Peskine | 1fb7aea | 2019-12-02 14:26:04 +0100 | [diff] [blame] | 12 | import argparse | 
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 13 | import glob | 
|  | 14 | import os | 
|  | 15 | import re | 
| Yanray Wang | 2354693 | 2023-02-24 14:53:29 +0800 | [diff] [blame] | 16 | import subprocess | 
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 17 | import sys | 
| Tomás González | 754f8cd | 2023-08-17 15:11:10 +0100 | [diff] [blame] | 18 |  | 
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 19 |  | 
class Results:
    """Tally the errors and warnings reported while checking test suites.

    Every report is written to standard error, prefixed with the file name
    and line number it refers to.
    """

    def __init__(self, options):
        """Start with empty counters.

        options: an object whose ``quiet`` attribute tells whether warnings
        must be suppressed.
        """
        self.ignore_warnings = options.quiet
        self.errors = 0
        self.warnings = 0

    @staticmethod
    def _emit(prefix, file_name, line_number, fmt, args):
        """Format one report line and write it to standard error."""
        template = prefix + fmt + '\n'
        sys.stderr.write(template.format(file_name, line_number, *args))

    def error(self, file_name, line_number, fmt, *args):
        """Report an error at the given location and count it."""
        self._emit('{}:{}:ERROR:', file_name, line_number, fmt, args)
        self.errors += 1

    def warning(self, file_name, line_number, fmt, *args):
        """Report a warning at the given location and count it.

        When warnings are ignored, nothing is printed and nothing is counted.
        """
        if self.ignore_warnings:
            return
        self._emit('{}:{}:Warning:', file_name, line_number, fmt, args)
        self.warnings += 1
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 38 |  | 
class TestDescriptionExplorer:
    """An iterator over test cases with descriptions.

    The test cases that have descriptions are:
    * Individual unit tests (entries in a .data file) in test suites.
    * Individual test cases in ssl-opt.sh and compat.sh, as printed by
      the script when invoked with --list-test-cases.

    This is an abstract class. To use it, derive a class that implements
    the process_test_case method, and call walk_all().
    """

    def process_test_case(self, per_file_state,
                          file_name, line_number, description):
        """Process a test case.

        per_file_state: an object created by new_per_file_state() at the beginning
                        of each file.
        file_name: a relative path to the file containing the test case.
        line_number: the line number in the given file. For test cases
                     collected from a script, this is instead the 0-based
                     position of the test case in the script's listing.
        description: the test case description as a byte string.
        """
        raise NotImplementedError

    def new_per_file_state(self):
        """Return a new per-file state object.

        The default per-file state object is None. Child classes that require per-file
        state may override this method.
        """
        #pylint: disable=no-self-use
        return None

    def walk_test_suite(self, data_file_name):
        """Iterate over the test cases in the given unit test data file.

        The file is read in binary mode. Test cases are paragraphs separated
        by empty lines; the first non-comment line of each paragraph is the
        description and is passed to process_test_case().
        """
        in_paragraph = False
        descriptions = self.new_per_file_state() # pylint: disable=assignment-from-none
        with open(data_file_name, 'rb') as data_file:
            for line_number, line in enumerate(data_file, 1):
                line = line.rstrip(b'\r\n')
                if not line:
                    # An empty line ends the current test case.
                    in_paragraph = False
                    continue
                if line.startswith(b'#'):
                    # Comment lines neither start nor end a paragraph.
                    continue
                if not in_paragraph:
                    # This is a test case description line.
                    self.process_test_case(descriptions,
                                           data_file_name, line_number, line)
                in_paragraph = True

    def collect_from_script(self, file_name):
        """Collect the test cases in a script by calling its listing test cases
        option.

        The script is run as ``sh <file_name> --list-test-cases``; each line
        of its output is treated as one test case description.
        subprocess.CalledProcessError propagates if the script fails.
        """
        descriptions = self.new_per_file_state() # pylint: disable=assignment-from-none
        listed = subprocess.check_output(['sh', file_name, '--list-test-cases'])
        # Assume test file is responsible for printing identical format of
        # test case description between --list-test-cases and its OUTCOME.CSV
        #
        # idx indicates the number of test case since there is no line number
        # in the script for each test case.
        for idx, description in enumerate(listed.splitlines()):
            self.process_test_case(descriptions,
                                   file_name,
                                   idx,
                                   description.rstrip())

    @staticmethod
    def collect_test_directories():
        """Get the relative path for the TLS and Crypto test directories.

        The current directory may be the root of the source tree, its
        ``tests`` directory, or a direct subdirectory of ``tests``.

        Return a list of directories that contain ``suites``.
        Raise FileNotFoundError if no test directory can be located from
        the current directory.
        """
        if os.path.isdir('tests'):
            tests_dir = 'tests'
        elif os.path.isdir('suites'):
            tests_dir = '.'
        elif os.path.isdir('../suites'):
            tests_dir = '..'
        else:
            # Fail with an explicit message rather than an UnboundLocalError
            # on tests_dir when run from an unexpected directory.
            raise FileNotFoundError(
                'Test directory not found: expected "tests", "suites" or '
                '"../suites" relative to ' + os.getcwd())
        directories = [tests_dir]
        return directories

    def walk_all(self):
        """Iterate over all named test cases.

        For each test directory, visit every ``suites/*.data`` file, then
        the ssl-opt.sh and compat.sh scripts if they exist.
        """
        test_directories = self.collect_test_directories()
        for directory in test_directories:
            for data_file_name in glob.glob(os.path.join(directory, 'suites',
                                                         '*.data')):
                self.walk_test_suite(data_file_name)

            for sh_file in ['ssl-opt.sh', 'compat.sh']:
                sh_file = os.path.join(directory, sh_file)
                if os.path.exists(sh_file):
                    self.collect_from_script(sh_file)
| Gilles Peskine | 78c45db | 2020-06-25 16:34:11 +0200 | [diff] [blame] | 129 |  | 
class TestDescriptions(TestDescriptionExplorer):
    """Gather the identifier of every test case that gets visited."""

    def __init__(self):
        super().__init__()
        # Set of "<file base name>;<description>" strings.
        self.descriptions = set()

    def process_test_case(self, _per_file_state,
                          file_name, _line_number, description):
        """Remember one test case.

        The recorded key is the file name without its directory part and
        without its last extension, then a semicolon, then the description
        decoded as UTF-8.
        """
        without_directory = re.sub(r'.*/', '', file_name)
        base_name = re.sub(r'\.[^.]*$', '', without_directory)
        text = description.decode('utf-8')
        self.descriptions.add('{};{}'.format(base_name, text))
|  | 143 |  | 
def collect_available_test_cases():
    """Return the sorted list of keys of all available test cases.

    The keys are those recorded by TestDescriptions while walking every
    test suite and test script.
    """
    collector = TestDescriptions()
    collector.walk_all()
    available = list(collector.descriptions)
    available.sort()
    return available
|  | 149 |  | 
class DescriptionChecker(TestDescriptionExplorer):
    """Validate every test case description.

    * Each description must be well-formed (length, allowed characters, etc.).
    * A description must not appear twice in the same file.
    """

    def __init__(self, results):
        # Sink for the errors and warnings found by the checks.
        self.results = results

    def new_per_file_state(self):
        """Return an empty dictionary that will map each description seen
        in the file to its line number."""
        return {}

    def process_test_case(self, per_file_state,
                          file_name, line_number, description):
        """Report any problem with one test case description.

        A duplicate is reported on its own: no other check runs on it and
        the line recorded for the first occurrence is kept.
        """
        report = self.results
        if description in per_file_state:
            report.error(file_name, line_number,
                         'Duplicate description (also line {})',
                         per_file_state[description])
            return
        forbidden = re.search(br'[\t;]', description)
        if forbidden is not None:
            report.error(file_name, line_number,
                         'Forbidden character \'{}\' in description',
                         forbidden.group(0).decode('ascii'))
        # Anything outside the printable range from space to tilde.
        if re.search(br'[^ -~]', description) is not None:
            report.error(file_name, line_number,
                         'Non-ASCII character in description')
        length = len(description)
        if length > 66:
            report.warning(file_name, line_number,
                           'Test description too long ({} > 66)',
                           length)
        per_file_state[description] = line_number
| Gilles Peskine | ba94b58 | 2019-09-16 19:18:40 +0200 | [diff] [blame] | 186 |  | 
def main():
    """Command line entry point.

    With --list-all, print every available test case and return without
    checking anything. Otherwise check all test case descriptions and exit
    with status 1 if any error was found, 0 otherwise.
    """
    parser = argparse.ArgumentParser(description=__doc__)
    parser.add_argument('--list-all', action='store_true',
                        help='List all test cases, without doing checks')
    parser.add_argument('--quiet', '-q', action='store_true',
                        help='Hide warnings')
    parser.add_argument('--verbose', '-v', action='store_false', dest='quiet',
                        help='Show warnings (default: on; undoes --quiet)')
    options = parser.parse_args()

    if options.list_all:
        # One test case per line, each terminated by a newline.
        listing = ''.join(name + '\n'
                          for name in collect_available_test_cases())
        sys.stdout.write(listing)
        return

    results = Results(options)
    DescriptionChecker(results).walk_all()

    found_problems = results.warnings or results.errors
    if found_problems and not options.quiet:
        summary = '{}: {} errors, {} warnings\n'.format(
            sys.argv[0], results.errors, results.warnings)
        sys.stderr.write(summary)

    if results.errors:
        sys.exit(1)
    sys.exit(0)
|  | 210 |  | 
# Run the checks only when this file is executed as a script, so that the
# classes above can be imported and reused without side effects.
if __name__ == '__main__':
    main()