cdisc-org · alexfurmenkov · May 18, 2026 · May 19, 2026 · May 20, 2026 · May 20, 2026
diff --git a/cdisc_rules_engine/models/rule.py b/cdisc_rules_engine/models/rule.py
@@ -32,14 +32,24 @@ def __init__(self, record_params: dict):
         self.operations: List[dict] = record_params.get("operations")
         self.conditions: dict = record_params["conditions"]
         self.actions: dict = record_params["actions"]
-        self.output_variables: dict = record_params.get("output_variables")
+        self.output_variables: dict = record_params.get("output variables")
         self.grouping_variables: List[str] = record_params.get("grouping_variables", [])
 
+    @classmethod
+    def _get_key(cls, obj: dict, space_key: str, default=None):
+        """Get a value by key, supporting both space-format ('Rule Type') and
+        underscore-format ('Rule_Type') for backward compatibility with the
+        CDISC Library API which returns underscore keys."""
+        if space_key in obj:
+            return obj[space_key]
+        return obj.get(space_key.replace(" ", "_"), default)
+
     @classmethod
     def from_cdisc_metadata(cls, rule_metadata: dict) -> dict:
         if cls.is_cdisc_rule_metadata(rule_metadata):
-            rule_metadata = cls.spaces_to_underscores(rule_metadata)
             authorities = rule_metadata.get("Authorities", [])
+            scope = rule_metadata.get("Scope", {})
+            outcome = rule_metadata.get("Outcome", {})
             executable_rule = {
                 "core_id": rule_metadata.get("Core", {}).get("Id"),
                 "author": "CDISC",
@@ -49,49 +59,36 @@ def from_cdisc_metadata(cls, rule_metadata: dict) -> dict:
                 "description": rule_metadata.get("Description"),
                 "authorities": authorities,
                 "standards": cls.parse_standards(authorities),
-                "classes": rule_metadata.get("Scope", {}).get("Classes"),
-                "domains": rule_metadata.get("Scope", {}).get("Domains"),
-                "entities": rule_metadata.get("Scope", {}).get("Entities"),
-                "rule_type": rule_metadata.get("Rule_Type"),
+                "classes": scope.get("Classes"),
+                "domains": scope.get("Domains"),
+                "entities": scope.get("Entities"),
+                "rule_type": cls._get_key(rule_metadata, "Rule Type"),
                 "conditions": cls.parse_conditions(rule_metadata.get("Check")),
-                "actions": cls.parse_actions(rule_metadata.get("Outcome")),
-                "use_case": rule_metadata.get("Scope", {}).get("Use_Case"),
-                "data_structures": rule_metadata.get("Scope", {}).get(
-                    "Data_Structures"
-                ),
+                "actions": cls.parse_actions(outcome),
+                "use_case": cls._get_key(scope, "Use Case"),
+                "data_structures": cls._get_key(scope, "Data Structures"),
                 "status": rule_metadata.get("Core", {}).get("Status", {}),
             }
 
             if "Operations" in rule_metadata:
                 executable_rule["operations"] = rule_metadata.get("Operations")
 
-            if "Match_Datasets" in rule_metadata:
-                executable_rule["datasets"] = cls.parse_datasets(
-                    rule_metadata.get("Match_Datasets")
-                )
-            if "Output_Variables" in rule_metadata.get("Outcome", {}):
-                executable_rule["output_variables"] = rule_metadata.get("Outcome", {})[
-                    "Output_Variables"
-                ]
-            if "Grouping_Variables" in rule_metadata:
-                executable_rule["grouping_variables"] = rule_metadata.get(
-                    "Grouping_Variables"
-                )
+            match_datasets = cls._get_key(rule_metadata, "Match Datasets")
+            if match_datasets is not None:
+                executable_rule["datasets"] = cls.parse_datasets(match_datasets)
+
+            output_variables = cls._get_key(outcome, "Output Variables")
+            if output_variables is not None:
+                executable_rule["output_variables"] = output_variables
+
+            grouping_variables = cls._get_key(rule_metadata, "Grouping Variables")
+            if grouping_variables is not None:
+                executable_rule["grouping_variables"] = grouping_variables
+
             return executable_rule
         else:
             return rule_metadata
 
-    @classmethod
-    def spaces_to_underscores(cls, obj):
-        if isinstance(obj, dict):
-            return {
-                key.replace(" ", "_"): cls.spaces_to_underscores(value)
-                for key, value in obj.items()
-            }
-        if isinstance(obj, list):
-            return [cls.spaces_to_underscores(item) for item in obj]
-        return obj
-
     @classmethod
     def parse_standards(cls, authorities: List[dict]) -> List[dict]:
         standards = []
@@ -200,8 +197,8 @@ def parse_datasets(cls, match_key_data: List[dict]) -> List[dict]:
                 ],
                 "wildcard": data.get("Wildcard", "**"),
             }
-            if "Join_Type" in data:
-                join_data["join_type"] = data.get("Join_Type")
+            if "Join Type" in data:
+                join_data["join_type"] = data.get("Join Type")
             if "Child" in data:
                 join_data["child"] = data.get("Child")
             datasets.append(join_data)

diff --git a/cdisc_rules_engine/models/rule_validation_result.py b/cdisc_rules_engine/models/rule_validation_result.py
@@ -48,12 +48,17 @@ def _get_rule_ids(self, rule: Rule, org: str) -> str:
         return ", ".join(
             sorted(
                 {
-                    reference.get("Rule_Identifier", {}).get("Id")
+                    (
+                        reference.get("Rule Identifier")
+                        or reference.get("Rule_Identifier")
+                        or {}
+                    ).get("Id")
                     for authority in rule.get("authorities", [])
                     for standard in authority.get("Standards", [])
                     for reference in standard.get("References", [])
                     if authority.get("Organization") == org
                 }
+                - {None}
             )
         )
 

diff --git a/scripts/script_utils.py b/scripts/script_utils.py
@@ -526,7 +526,7 @@ def load_and_parse_rule(rule_file):
         with open(rule_file, "r", encoding="utf-8") as file:
             if file_extension in [".yml", ".yaml"]:
                 loaded_data = yaml.safe_load(file)
-                return Rule.from_cdisc_metadata(replace_yml_spaces(loaded_data))
+                return Rule.from_cdisc_metadata(loaded_data)
             elif file_extension == ".json":
                 return Rule.from_cdisc_metadata(json.load(file))
             else:
@@ -604,18 +604,6 @@ def get_max_dataset_size(dataset_paths: Iterable[str]):
     return max_dataset_size
 
 
-def replace_yml_spaces(data):
-    if isinstance(data, dict):
-        return {
-            key.replace(" ", "_"): replace_yml_spaces(value)
-            for key, value in data.items()
-        }
-    elif isinstance(data, list):
-        return [replace_yml_spaces(item) for item in data]
-    else:
-        return data
-
-
 def library_metadata_not_found_message(standard, version, substandard=None):
     version_display = (version or "").replace("-", ".")
     sub_part = f" substandard {substandard}" if substandard else ""

diff --git a/tests/conftest.py b/tests/conftest.py
@@ -938,14 +938,14 @@ def mock_validation_results() -> list[RuleValidationResult]:
                         "Standards": [
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID4"}},
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID3"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID4"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID3"}},
                                 ]
                             },
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID2"}},
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID1"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID2"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID1"}},
                                 ]
                             },
                         ],
@@ -955,8 +955,8 @@ def mock_validation_results() -> list[RuleValidationResult]:
                         "Standards": [
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "FDARuleID1"}},
-                                    {"Rule_Identifier": {"Id": "FDARuleID2"}},
+                                    {"Rule Identifier": {"Id": "FDARuleID1"}},
+                                    {"Rule Identifier": {"Id": "FDARuleID2"}},
                                 ]
                             }
                         ],
@@ -998,14 +998,14 @@ def mock_validation_results() -> list[RuleValidationResult]:
                         "Standards": [
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID4"}},
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID3"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID4"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID3"}},
                                 ]
                             },
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID2"}},
-                                    {"Rule_Identifier": {"Id": "CDISCRuleID1"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID2"}},
+                                    {"Rule Identifier": {"Id": "CDISCRuleID1"}},
                                 ]
                             },
                         ],
@@ -1015,8 +1015,8 @@ def mock_validation_results() -> list[RuleValidationResult]:
                         "Standards": [
                             {
                                 "References": [
-                                    {"Rule_Identifier": {"Id": "FDARuleID1"}},
-                                    {"Rule_Identifier": {"Id": "FDARuleID2"}},
+                                    {"Rule Identifier": {"Id": "FDARuleID1"}},
+                                    {"Rule Identifier": {"Id": "FDARuleID2"}},
                                 ]
                             }
                         ],

diff --git a/tests/resources/COREIssue329/rule-286.json b/tests/resources/COREIssue329/rule-286.json
@@ -15,10 +15,10 @@
                   "Document": "IG v3.2",
                   "Item": "Assumption 3",
                   "Section": "7.4",
-                  "Cited_Guidance": "Further information about the parameters is included below in Table 1. TSVAL may have controlled terminology depending on the value of TSPARMCD"
+                  "Cited Guidance": "Further information about the parameters is included below in Table 1. TSVAL may have controlled terminology depending on the value of TSPARMCD"
                 }
               ],
-              "Rule_Identifier": {
+              "Rule Identifier": {
                 "Id": "CG0286",
                 "Version": "1"
               }
@@ -37,10 +37,10 @@
                   "Document": "IG v3.3",
                   "Item": "Assumption 3",
                   "Section": "7.4",
-                  "Cited_Guidance": "Further information about the parameters is included Appendix C1, Trial Summary Codes. TSVAL may have controlled terminology depending on the value of TSPARMCD. Conditions for including parameters are included in Appendix C1, Trial Summary Codes."
+                  "Cited Guidance": "Further information about the parameters is included Appendix C1, Trial Summary Codes. TSVAL may have controlled terminology depending on the value of TSPARMCD. Conditions for including parameters are included in Appendix C1, Trial Summary Codes."
                 }
               ],
-              "Rule_Identifier": {
+              "Rule Identifier": {
                 "Id": "CG0286",
                 "Version": "1"
               }