Brad Bishop | c04b3f4 | 2020-05-01 08:17:59 -0400 | [diff] [blame] | 1 | #!/usr/bin/env python3 |
| 2 | # SPDX-License-Identifier: Apache-2.0 |
| 3 | """ |
| 4 | A tool for validating entity manager configurations. |
| 5 | """ |
| 6 | import argparse |
| 7 | import json |
Brad Bishop | c04b3f4 | 2020-05-01 08:17:59 -0400 | [diff] [blame] | 8 | import os |
Potin Lai | 0f3a4d9 | 2023-12-05 00:13:55 +0800 | [diff] [blame] | 9 | import re |
Brad Bishop | c04b3f4 | 2020-05-01 08:17:59 -0400 | [diff] [blame] | 10 | import sys |
Patrick Williams | f8f6027 | 2025-05-03 01:36:31 -0400 | [diff] [blame^] | 11 | from concurrent.futures import ProcessPoolExecutor |
Brad Bishop | c04b3f4 | 2020-05-01 08:17:59 -0400 | [diff] [blame] | 12 | |
Patrick Williams | fa8ee87 | 2022-12-07 07:00:42 -0600 | [diff] [blame] | 13 | import jsonschema.validators |
| 14 | |
# File name of the top-level schema used when no --schema option is given;
# it is looked up inside the "schemas" directory next to this script's parent.
DEFAULT_SCHEMA_FILENAME = "global.json"
| 16 | |
| 17 | |
def get_default_thread_count() -> int:
    """
    Pick the default worker count for parallel validation.

    Uses the size of the calling process's CPU affinity set when the
    platform exposes ``os.sched_getaffinity``; otherwise falls back to
    ``os.cpu_count()``, or 1 when even that is unknown.
    """
    if not hasattr(os, "sched_getaffinity"):
        # Platforms without affinity support: use the machine-wide count.
        return os.cpu_count() or 1

    # PID 0 means "the calling process"; the result honours affinity masks.
    usable_cpus = os.sched_getaffinity(0)
    return len(usable_cpus)
| 28 | |
| 29 | |
def remove_c_comments(string):
    """
    Strip C-style comments from ``string`` while leaving quoted text intact.

    Both ``// single-line`` and ``/* multi-line */`` comments are removed.
    Comment markers that appear inside double- or single-quoted strings are
    preserved, because quoted strings are matched (and re-emitted) first.

    Parameters:
        string: the text to process (e.g. JSON with comments).

    Returns:
        A copy of ``string`` with every comment replaced by the empty string.
    """
    # Group 1 captures quoted strings (double or single). Inside a string,
    # a backslash always consumes the following character, so a string that
    # ends in an escaped backslash ("C:\\") terminates at the right quote.
    # Group 2 captures comments. The single-line form simply runs up to the
    # next CR or LF, so it works for LF, CRLF and end-of-input alike.
    pattern = (
        r"(\"(?:\\.|[^\"\\])*\"|'(?:\\.|[^'\\])*')"
        r"|(/\*.*?\*/|//[^\r\n]*)"
    )
    # DOTALL lets /* ... */ comments (and escaped newlines) span lines.
    regex = re.compile(pattern, re.DOTALL)

    def _replacer(match):
        # A comment matched: drop it. Otherwise re-emit the quoted string.
        if match.group(2) is not None:
            return ""
        return match.group(1)

    return regex.sub(_replacer, string)
| 43 | |
| 44 | |
def main():
    """
    Command-line entry point: validate entity manager configurations.

    Parses the command line, locates the schema and the configuration files
    (defaulting to the ``schemas`` and ``configurations`` directories two
    levels above this file), loads every configuration (C-style comments are
    stripped before JSON parsing) and validates them in parallel worker
    processes.

    Always terminates via ``sys.exit``:
        0 - every configuration validated as expected
        1 - at least one configuration failed, or one listed in the
            expected-fails file unexpectedly passed
        2 - a setup error (bad arguments, unreadable or unparsable input)
    """
    parser = argparse.ArgumentParser(
        description="Entity manager configuration validator",
    )
    parser.add_argument(
        "-s",
        "--schema",
        help=(
            "Use the specified schema file instead of the default "
            "(__file__/../../schemas/global.json)"
        ),
    )
    parser.add_argument(
        "-c",
        "--config",
        action="append",
        help=(
            "Validate the specified configuration files (can be "
            "specified more than once) instead of the default "
            "(__file__/../../configurations/**.json)"
        ),
    )
    parser.add_argument(
        "-e",
        "--expected-fails",
        help=(
            "A file with a list of configurations to ignore should "
            "they fail to validate"
        ),
    )
    parser.add_argument(
        "-k",
        "--continue",
        action="store_true",
        help="keep validating after a failure",
    )
    parser.add_argument(
        "-v", "--verbose", action="store_true", help="be noisy"
    )
    parser.add_argument(
        "-t",
        "--threads",
        type=int,
        default=get_default_thread_count(),
        help="Number of threads to use for parallel validation (default: number of CPUs)",
    )
    args = parser.parse_args()

    # The executor rejects a worker count below 1 with a ValueError; report
    # it as an ordinary usage error instead (exits with status 2).
    if args.threads < 1:
        parser.error("--threads must be at least 1")

    schema_file = args.schema
    if schema_file is None:
        try:
            source_dir = os.path.realpath(__file__).split(os.sep)[:-2]
            schema_file = os.sep + os.path.join(
                *source_dir, "schemas", DEFAULT_SCHEMA_FILENAME
            )
        except Exception:
            print(
                f"Could not guess location of {DEFAULT_SCHEMA_FILENAME}",
                file=sys.stderr,
            )
            sys.exit(2)

    config_files = args.config or []
    if not config_files:
        try:
            source_dir = os.path.realpath(__file__).split(os.sep)[:-2]
            configs_dir = os.sep + os.path.join(*source_dir, "configurations")
            for root, _, files in os.walk(configs_dir):
                for f in files:
                    if f.endswith(".json"):
                        config_files.append(os.path.join(root, f))
        except Exception:
            print(
                "Could not guess location of configurations", file=sys.stderr
            )
            sys.exit(2)

    configs = []
    for config_file in config_files:
        try:
            # JSON is UTF-8 by specification; do not depend on the locale.
            with open(config_file, encoding="utf-8") as fd:
                configs.append(json.loads(remove_c_comments(fd.read())))
        except (OSError, ValueError) as err:
            # OSError: missing/unreadable file. ValueError: malformed JSON
            # (json.JSONDecodeError) or undecodable bytes (UnicodeDecodeError).
            print(
                f"Could not parse config file: {config_file}", file=sys.stderr
            )
            if args.verbose:
                print(err, file=sys.stderr)
            sys.exit(2)

    expected_fails = []
    if args.expected_fails:
        try:
            with open(args.expected_fails) as fd:
                expected_fails = [line.strip() for line in fd]
        except (OSError, UnicodeDecodeError):
            print(
                f"Could not read expected fails file: {args.expected_fails}",
                file=sys.stderr,
            )
            sys.exit(2)

    # Outcomes are recorded by full path so the report below can match each
    # configuration exactly rather than by file-name substring.
    results = {
        "invalid": [],
        "unexpected_pass": [],
    }

    # "continue" is a keyword, so the option cannot be read as an attribute.
    should_continue = getattr(args, "continue")

    with ProcessPoolExecutor(max_workers=args.threads) as executor:
        # Submit all validation tasks. A list of pairs (not a dict keyed by
        # path) keeps every submission even if a path was given twice.
        submitted = [
            (
                config_file,
                executor.submit(
                    validate_single_config,
                    args,
                    os.path.basename(config_file),
                    config,
                    expected_fails,
                    schema_file,
                ),
            )
            for config_file, config in zip(config_files, configs)
        ]

        # Collect results in submission order.
        for config_file, future in submitted:
            is_invalid, is_unexpected_pass = future.result()
            if is_invalid:
                results["invalid"].append(config_file)
            if is_unexpected_pass:
                results["unexpected_pass"].append(config_file)

            # Stop at the first unexpected outcome unless --continue is set.
            if (is_invalid or is_unexpected_pass) and not should_continue:
                executor.shutdown(wait=False, cancel_futures=True)
                break

    exit_status = 0
    if results["invalid"] or results["unexpected_pass"]:
        exit_status = 1
        unexpected_pass_suffix = " **"
        invalid_paths = set(results["invalid"])
        unexpected_paths = set(results["unexpected_pass"])
        print("results:")
        for f in config_files:
            if f in unexpected_paths:
                print(f" '{f}' passed!{unexpected_pass_suffix}")
            if f in invalid_paths:
                print(f" '{f}' failed!")

        if unexpected_paths:
            print("\n** configuration expected to fail")

    sys.exit(exit_status)
| 203 | |
| 204 | |
def validator_from_file(schema_file):
    """
    Build a JSON Schema (draft 2020-12) validator from ``schema_file``.

    The file is parsed as JSON and checked against the draft 2020-12
    meta-schema. Relative ``$ref`` entries are resolved against the
    directory that contains the (symlink-resolved) schema file.

    Parameters:
        schema_file: path of the schema file to load.

    Returns:
        A ``jsonschema.Draft202012Validator`` bound to the loaded schema.
    """
    with open(schema_file) as schema_fd:
        loaded_schema = json.load(schema_fd)

    validator_cls = jsonschema.Draft202012Validator
    validator_cls.check_schema(loaded_schema)

    # Base URI is the schema's own directory; the trailing slash makes
    # sibling schema files resolve relative to that directory.
    schema_dir = os.path.dirname(os.path.realpath(schema_file))
    ref_resolver = jsonschema.RefResolver(
        f"file://{schema_dir}/", loaded_schema
    )

    return validator_cls(loaded_schema, resolver=ref_resolver)
| 219 | |
| 220 | |
def validate_single_config(
    args, filename, config, expected_fails, schema_file
):
    """
    Validate one parsed configuration against the schema in ``schema_file``.

    Parameters:
        args: parsed command-line options; only ``args.verbose`` is read.
        filename: name used to look the configuration up in
            ``expected_fails``.
        config: the parsed configuration to validate.
        expected_fails: collection of file names that are expected to fail.
        schema_file: path of the schema file to validate against.

    Returns:
        A tuple ``(is_invalid, is_unexpected_pass)``:
        ``is_invalid`` is True when validation failed although the file was
        not expected to fail, or when the schema file could not be found;
        ``is_unexpected_pass`` is True when a file listed in
        ``expected_fails`` validated successfully.
    """
    failure_expected = filename in expected_fails

    try:
        schema_validator = validator_from_file(schema_file)
        schema_validator.validate(config)
    except jsonschema.exceptions.ValidationError as validation_error:
        if failure_expected:
            # A known-bad configuration failed: nothing to report.
            return (False, False)
        # NOTE(review): the reviewed copy of this file had lost its
        # indentation; the verbose print is assumed to apply only to
        # unexpected failures - confirm against the repository.
        if args.verbose:
            print(validation_error)
        return (True, False)
    except FileNotFoundError:
        if args.verbose:
            print(f"Could not read schema file: {schema_file}")
        return (True, False)

    # Validation succeeded; that is only a problem for expected failures.
    return (False, failure_expected)
| 246 | |
# Run the validator only when this file is executed as a script, so that
# importing the module (e.g. from worker processes) has no side effects.
if __name__ == "__main__":
    main()