Add --examine-coverage to fix_error_ids.py

2023-10-03 13:03:40 +00:00 · 2020-06-28 01:46:42 +02:00 · 2020-06-28 01:46:42 +02:00 · 919572d6ec
commit 919572d6ec
parent 8fde9fd1c3
3 changed files with 97 additions and 21 deletions
--- a/.circleci/config.yml
+++ b/.circleci/config.yml
@ -323,7 +323,7 @@ jobs:
      - checkout
      - run:
          name: Check for error codes
-          command: ./scripts/fix_error_ids.py --check-only
+          command: ./scripts/error_codes.py --check
  chk_pylint:
    docker:
--- a/liblangutil/Exceptions.h
+++ b/liblangutil/Exceptions.h
@ -61,7 +61,7 @@ struct InvalidAstError: virtual util::Exception {};
 * They are passed as the first parameter of error reporting functions.
 * Suffix _error helps to find them in the sources.
 * The struct ErrorId prevents incidental calls like typeError(3141) instead of typeError(3141_error).
- * To create a new ID, one can add 0000_error and then run "python ./scripts/fix_error_ids.py"
+ * To create a new ID, one can add 0000_error and then run "python ./scripts/error_codes.py --fix"
 * from the root of the repo.
 */
 struct ErrorId
--- a/scripts/fix_error_ids.py
+++ b/scripts/fix_error_ids.py
@ -7,7 +7,7 @@ import sys
 from os import path
 ENCODING = "utf-8"
-PATTERN = r"\b\d+_error\b"
+SOURCE_FILE_PATTERN = r"\b\d+_error\b"
 def read_file(file_name):
@ -36,9 +36,9 @@ def in_comment(source, pos):
    return slash_star_pos > star_slash_pos
-def find_ids_in_file(file_name, ids):
+def find_ids_in_source_file(file_name, ids):
    source = read_file(file_name)
-    for m in re.finditer(PATTERN, source):
+    for m in re.finditer(SOURCE_FILE_PATTERN, source):
        if in_comment(source, m.start()):
            continue
        underscore_pos = m.group(0).index("_")
@ -52,7 +52,7 @@ def find_ids_in_file(file_name, ids):
 def get_used_ids(file_names):
    used_ids = {}
    for file_name in file_names:
-        find_ids_in_file(file_name, used_ids)
+        find_ids_in_source_file(file_name, used_ids)
    return used_ids
@ -71,7 +71,7 @@ def fix_ids_in_file(file_name, available_ids, used_ids):
    k = 0
    destination = []
-    for m in re.finditer(PATTERN, source):
+    for m in re.finditer(SOURCE_FILE_PATTERN, source):
        destination.extend(source[k:m.start()])
        underscore_pos = m.group(0).index("_")
@ -102,38 +102,105 @@ def fix_ids(used_ids, file_names):
        fix_ids_in_file(file_name, available_ids, used_ids)
-def find_source_files(top_dir):
+def find_files(top_dir, sub_dirs, extensions):
-    """Builds the list of .h and .cpp files in top_dir directory"""
+    """Builds a list of files with given extensions in specified subdirectories"""
    source_file_names = []
-    dirs = ['libevmasm', 'liblangutil', 'libsolc', 'libsolidity', 'libsolutil', 'libyul', 'solc']
+    for dir in sub_dirs:
    for dir in dirs:
        for root, _, file_names in os.walk(os.path.join(top_dir, dir), onerror=lambda e: exit(f"Walk error: {e}")):
            for file_name in file_names:
                _, ext = path.splitext(file_name)
-                if ext in [".h", ".cpp"]:
+                if ext in extensions:
                    source_file_names.append(path.join(root, file_name))
    return source_file_names
 def find_ids_in_test_file(file_name):
    source = read_file(file_name)
    pattern = r"^// (.*Error|Warning) \d\d\d\d:"
    return {m.group(0)[-5:-1] for m in re.finditer(pattern, source, flags=re.MULTILINE)}
 def find_ids_in_test_files(file_names):
    used_ids = set()
    for file_name in file_names:
        used_ids |= find_ids_in_test_file(file_name)
    return used_ids
 def print_ids(ids):
    for k, id in enumerate(sorted(ids)):
        if k % 10 > 0:
            print(" ", end="")
        elif k > 0:
            print()
        print(id, end="")
 def examine_id_coverage(top_dir, used_ids):
    test_sub_dirs = [
        path.join("test", "libsolidity", "errorRecoveryTests"),
        path.join("test", "libsolidity", "smtCheckerTests"),
        path.join("test", "libsolidity", "syntaxTests")
    ]
    test_file_names = find_files(
        top_dir,
        test_sub_dirs,
        [".sol"]
    )
    covered_ids = find_ids_in_test_files(test_file_names)
    print(f"IDs in source files: {len(used_ids)}")
    print(f"IDs in test files  : {len(covered_ids)} ({len(covered_ids) - len(used_ids)})")
    print()
    unused_covered_ids = covered_ids - used_ids
    if len(unused_covered_ids) != 0:
        print("Error. The following error codes found in tests, but not in sources:")
        print_ids(unused_covered_ids)
        return 1
    used_uncovered_ids = used_ids - covered_ids
    if len(used_uncovered_ids) != 0:
        print("The following error codes found in sources, but not in tests:")
        print_ids(used_uncovered_ids)
        print("\n\nPlease make sure to add appropriate tests.")
        return 1
    return 0
 def main(argv):
-    check_only = False
+    # pylint: disable=too-many-branches, too-many-locals
    check = False
    fix = False
    noconfirm = False
-    opts, args = getopt.getopt(argv, "", ["check-only", "noconfirm"])
+    examine_coverage = False
    opts, args = getopt.getopt(argv, "", ["check", "fix", "noconfirm", "examine-coverage"])
    for opt, arg in opts:
-        if opt == '--check-only':
+        if opt == '--check':
-            check_only = True
+            check = True
        elif opt == "--fix":
            fix = True
        elif opt == '--noconfirm':
            noconfirm = True
        elif opt == '--examine-coverage':
            examine_coverage = True
    if not check and not fix and not examine_coverage:
        print("usage: python error_codes.py --check | --fix [--noconfirm] | --examine-coverage")
        exit(1)
    random.seed()
    cwd = os.getcwd()
-    source_file_names = find_source_files(cwd)
+    source_file_names = find_files(
-
+        cwd,
        ["libevmasm", "liblangutil", "libsolc", "libsolidity", "libsolutil", "libyul", "solc"],
        [".h", ".cpp"]
    )
    used_ids = get_used_ids(source_file_names)
    ok = True
@ -148,13 +215,21 @@ def main(argv):
            print(f"ID {id} appears {used_ids[id]} times")
            ok = False
    if examine_coverage:
        if not ok:
            print("Incorrect IDs has to be fixed before applying --examine-coverage")
        res = examine_id_coverage(cwd, used_ids.keys())
        exit(res)
    if ok:
        print("No incorrect IDs found")
        exit(0)
-    if check_only:
+    if check:
        exit(1)
    assert fix, "Unexpected state, should not come here without --fix"
    if not noconfirm:
        answer = input(
            "\nDo you want to fix incorrect IDs?\n"
@ -166,6 +241,7 @@ def main(argv):
        if answer not in "yY":
            exit(1)
    random.seed()
    fix_ids(used_ids, source_file_names)
    print("Fixing completed")
    exit(2)