================
@@ -0,0 +1,534 @@
+#!/usr/bin/env python3
+
+"""generate_unsupported_in_drivermode.py
+
+This script generates Lit regression test files that validate that options are 
only exposed to intended driver modes.
+
+The options and driver modes are parsed from Options.td, whose path should be 
provided on the command line.
+See clang/include/clang/Driver/Options.td
+
+The LLVM TableGen executable can optionally be provided along with the path to 
the LLVM build tree bin directory.
+Otherwise, the script will search for it.
+
+The primary maintenance task for this script would be updating the expected 
return message for a driver mode if
+there are changes over time. See the instantiations of DriverData, 
specifically the check_str.
+
+Logic:
+1) For each option, (records of class "Option"), and for each driver, (records 
of class "OptionVisibility")
+    a. if the option's "Visibility" field includes the driver flavour, skip 
processing this option for this driver
+    b. if the option is part of an option group, (the record has the "Group" 
property),
+       and the group's "Visibility" field includes the driver flavour, skip 
processing this option for this driver
+    c. otherwise this option is not supported by this driver flavour, and this 
pairing is saved for testing
+2) For each unsupported pairing, generate a Lit RUN line, and a CHECK line to 
parse for expected output. Ex: "error: unknown argument"
+"""
+
+import os
+import json
+import subprocess
+from bisect import bisect_left
+from dataclasses import dataclass
+import argparse
+import dataclasses
+import itertools
+
+# Strings defined in Options.td for the various driver flavours. See 
"OptionVisibility"
+VISIBILITY_CC1AS = "CC1AsOption"
+VISIBILITY_CC1 = "CC1Option"
+VISIBILITY_CL = "CLOption"
+VISIBILITY_DXC = "DXCOption"
+VISIBILITY_DEFAULT = "DefaultVis"
+VISIBILITY_FC1 = "FC1Option"
+VISIBILITY_FLANG = "FlangOption"
+
+# Lit test prefix strings
+SLASH_SLASH = "// "
+EXCLAMATION = "! "
+
+exceptions_sequence = [
+    # Invalid usage of the driver options below causes unique output, so skip 
testing
+    "cc1",
+    "cc1as",
+    # There is currently a bug with "_no_warnings", i.e. --no-warnings. 
Diagnostic related options
+    # are parsed first, and always with CC1 visibility. They're used to set up 
the diagnostic
+    # engine, which parses "_no_warnings" (and its alias "w", i.e. -w) and 
sets an internal flag
+    # that suppresses all warnings.
+    "_no_warnings",
+    "w",
+]
+
+
+@dataclass
+class DriverOption:
+    """Defines an unsupported driver-option combination
+    driver: The driver string as defined by OptionVisibility in Options.td
+    option: The option object from Options.td
+    option_name: Corresponding string for an option. See "Name" for a given 
option in Options.td
+    prefix: String that precedes the option. Ex. "-"
+    """
+
+    driver: str
+    option: str
+    option_name: str
+    prefix: str
+
+
+@dataclass
+class DriverData:
+    """Dataclass for data specific to each driver
+    lit_cmd_prefix: The beginning string of the Lit command
+    lit_cmd_options: Strings containing additional options for this driver
+    visibility_str: The corresponding visibility string from OptionVisibility 
in Options.td
+    lit_cmd_end: String at the end of the Lit command
+    check_str: The string or regex to be sent to FileCheck
+    supported_joined_option_sequence: List of DriverOption objects for 
supported options
+                                      that are Kind *JOINED*, as defined in 
Options.td
+    supported_non_joined_option_sequence: List of DriverOption objects for 
supported options
+                                          that are not Kind *JOINED*, as 
defined in Options.td
+    test_option_sequence: A list of all the prefix-option pairs that will be 
tested for this driver
+    """
+
+    lit_cmd_prefix: str
+    lit_cmd_options: str
+    visibility_str: str
+    lit_cmd_end: str
+    check_str: str
+    supported_joined_option_sequence: list[DriverOption] = dataclasses.field(
+        default_factory=list
+    )
+    supported_non_joined_option_sequence: list[DriverOption] = 
dataclasses.field(
+        default_factory=list
+    )
+    test_option_sequence: list[str] = dataclasses.field(default_factory=list)
+
+
+def collect_transitive_groups(member, options_dictionary):
+    """Find the groups for a given member, where a member can be an option or 
a group.
+    Note that groups can themselves be part of groups, hence the recursion
+
+    For example, considering option 'C', it has the following 'Group' field as 
defined by Options.td:
+      "C": {
+        "Group": {
+          "def": "Preprocessor_Group",
+          // ...
+        },
+        // ...
+      },
+    'Preprocessor_Group' is itself part of 'CompileOnly_Group', so option 'C' 
would be part of both groups
+      "Preprocessor_Group": {
+        // ...
+        "Group": {
+          "def": "CompileOnly_Group",
+          // ...
+        },
+        // ...
+      },
+
+    member: An option object or group object from Options.td.
+    options_dictionary: The converted Python dictionary from the Options.td 
json string
+
+    Return: A set including the group(s) found for the member. If no groups 
found, returns an empty set
+    """
+    parent_field = options_dictionary[member]["Group"]
+    if parent_field is None:
+        return set()
+
+    parent_name = parent_field["def"]
+    return {parent_name} | collect_transitive_groups(parent_name, 
options_dictionary)
+
+
+def get_visibility(option):
+    """Get a list of drivers that a given option is exposed to
+    option: The option object from Options.td
+    Return: Set that contains the visibilities of the given option
+    """
+    visibility_set = set()
+    # Check for the option's explicit visibility
+    for visibility in options_dictionary[option]["Visibility"]:
+        if visibility is not None:
+            visibility_set.add(visibility["def"])
+
+    # Check for the option's group's visibility
+    group_set = collect_transitive_groups(option, options_dictionary)
+    if group_set:
+        for group_name in group_set:
+            for visibility in options_dictionary[group_name]["Visibility"]:
+                visibility_set.add(visibility["def"])
+
+    return visibility_set
+
+
+def get_lit_test_note(test_visibility):
+    """Return the note to be included at the start of the Lit test file
+    test_visibility: Any VISIBILITY_* variable. VISIBILITY_DEFAULT will return 
the .c formatted test note.
+    All other will return the .f90 formatted test note
+    """
+    test_prefix = SLASH_SLASH if test_visibility == VISIBILITY_DEFAULT else 
EXCLAMATION
+
+    return (
+        f"{test_prefix}NOTE: This lit test was automatically generated to 
validate "
+        "unintentionally exposed arguments to various driver flavours.\n"
+        f"{test_prefix}NOTE: To make changes, see 
llvm-project/clang/utils/generate_unsupported_in_drivermode.py"
+        + " from which it was generated.\n"
+        f"{test_prefix}NOTE: Regenerate this Lit test with the following:\n"
+        f"{test_prefix}NOTE: python generate_unsupported_in_drivermode.py "
+        "--options-td-dir llvm-project/clang/include/clang/Driver 
--llvm-include-dir llvm-project/llvm/include --llvm-tblgen 
llvm-project/build/bin/llvm-tblgen\n\n"
+    )
+
+
+def write_lit_test(test_path, test_visibility):
+    """Write the Lit tests to file
+    test_path: File write path
+    test_visibility: VISIBILITY_DEFAULT, VISIBILITY_FLANG, or VISIBILITY_FC1 
which indicates whether to write
+    to the main Lit test file, the flang test file, or the flang -fc1 test file
+    """
+    lit_file = open(test_path, "w")
+
+    lit_file.write(get_lit_test_note(test_visibility))
+    batch_size = 100
+
+    for visibility, driver_data in driver_data_dict.items():
+        is_flang_pair = visibility == VISIBILITY_FLANG or visibility == 
VISIBILITY_FC1
+
+        if (
+            (test_visibility == VISIBILITY_FLANG and visibility != 
VISIBILITY_FLANG)
+            or (test_visibility == VISIBILITY_FC1 and visibility != 
VISIBILITY_FC1)
+            or (test_visibility == VISIBILITY_DEFAULT and is_flang_pair)
+        ):
+            continue
+
+        comment_str = EXCLAMATION if is_flang_pair else SLASH_SLASH
+
+        unflattened_option_data = list(
+            itertools.batched(driver_data.test_option_sequence, batch_size)
+        )
+
+        for i, batch in enumerate(unflattened_option_data):
+            # Example run line: "// RUN: not %clang -cc1 -A ... -x c++ - < 
/dev/null 2>&1 | FileCheck -check-prefix=CC1OptionCHECK0 %s"
+            run_cmd = (
+                f"\n{comment_str}RUN: not " + driver_data.lit_cmd_prefix
+            )  # "// RUN: not %clang -cc1 "
+
+            # // RUN: <command up to this point> \
+            # // RUN:   --one-option \
+            # // RUN:   -a-different-option \
+            # ...
+            run_cmd += f" \\\n{comment_str}RUN:   
".join(itertools.chain(("",), batch))
+
+            run_cmd += (
+                driver_data.lit_cmd_options  # "-x c++"
+                + driver_data.lit_cmd_end  # " - < /dev/null 2>&1 | FileCheck 
-check-prefix=CC1OptionCHECK"
+                + str(i)  # "0"
+                + " %s\n\n"  # " %s"
+            )
+
+            lit_file.write(run_cmd)
+
+            for option_str in batch:
+                # Example check line: "// CC1OptionCHECK0: {{(unknown 
argument).*-A}}"
+                check_cmd = (
+                    comment_str  # "//
+                    + visibility  # "CC1Option"
+                    + "CHECK"
+                    + str(i)  # "0"
+                    + ": {{("
+                    + driver_data.check_str  # "unknown argument"
+                    + ").*"
+                    + option_str.replace("+", "\\+")  # "-A"
----------------
Maetveis wrote:

```suggestion
                    + re.escape(option_str)  # "-A"
```
This really should be minimally 
[re.escape](https://docs.python.org/3/library/re.html#re.escape), but it could 
be taken out of the regex too i.e.
`unknown argument{{.*}}-A`

https://github.com/llvm/llvm-project/pull/120900
_______________________________________________
cfe-commits mailing list
cfe-commits@lists.llvm.org
https://lists.llvm.org/cgi-bin/mailman/listinfo/cfe-commits

Reply via email to