DefectDojo
diff --git a/‎docs/content/en/connecting_your_tools/parsers/file/snyk_issue_api.md‎
Lines changed: 5 additions & 1 deletion b/‎docs/content/en/connecting_your_tools/parsers/file/snyk_issue_api.md‎
Lines changed: 5 additions & 1 deletion
diff --git a/‎dojo/settings/settings.dist.py‎
Lines changed: 2 additions & 0 deletions b/‎dojo/settings/settings.dist.py‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎dojo/tools/snyk_issue_api/parser.py‎
Lines changed: 184 additions & 65 deletions b/‎dojo/tools/snyk_issue_api/parser.py‎
Lines changed: 184 additions & 65 deletions
@@ -2,7 +2,11 @@
 title: "Snyk Issue API"
 toc_hide: true
 ---
-The Snyk Issue API parser supports importing vulnerability data from the Snyk Issue API in JSON format. Currently only parsing issues of type `code` is supported. Samples of ther issue types are welcome.
+The Snyk Issue API parser supports importing vulnerability data from the Snyk Issue API in JSON format.
+
+Currently, only issues of type `code` (SAST) and `package_vulnerability` (SCA) are supported.
+
+Samples of other issue types are welcome.
 
 For more information about the Snyk Issue API, refer to the [official Snyk API documentation](https://docs.snyk.io/snyk-api/reference/issues#get-orgs-org_id-issues).
 
 
@@ -1366,6 +1366,7 @@ def saml2_attrib_map_format(din):
     "Cyberwatch scan (Galeax)": ["title", "description", "severity"],
     "Cycognito Scan": ["title", "severity"],
     "OpenVAS Parser v2": ["title", "severity", "vuln_id_from_tool", "endpoints"],
+    "Snyk Issue API Scan": ["vuln_id_from_tool", "file_path"],
 }
 
 # Override the hardcoded settings here via the env var
@@ -1625,6 +1626,7 @@ def saml2_attrib_map_format(din):
     "Qualys Hacker Guardian Scan": DEDUPE_ALGO_HASH_CODE,
     "Cyberwatch scan (Galeax)": DEDUPE_ALGO_HASH_CODE,
     "OpenVAS Parser v2": DEDUPE_ALGO_HASH_CODE,
+    "Snyk Issue API Scan": DEDUPE_ALGO_HASH_CODE,
 }
 
 # Override the hardcoded settings here via the env var
 
@@ -1,5 +1,4 @@
 import json
-from contextlib import suppress
 from datetime import datetime
 
 from dojo.models import Finding
@@ -43,42 +42,59 @@ def process_tree(self, tree, test):
                 findings.append(finding)
         return findings
 
-    def get_finding(self, issue, test):
-        # Check top-level type must be "issue" as "packages" have their own API it seems.
-        if not issue or issue.get("type") != "issue":
-            return None
-
-        attributes = issue.get("attributes", {})
-
-        # Check attributes-level type must be "code"
-        # Other items are not supported yet due to a lack of samples and lack of documentation
-        # package_vulnerability,license,cloud,code,customconfig
-        if attributes.get("type") != "code":
-            return None
-
-        # Extract CWE classes
+    def extract_cwe_classes(self, attributes):
+        """
+        Collect the numeric CWE ids listed under ``attributes["classes"]``.
+
+        Only entries whose ``source`` is ``"CWE"`` are considered. The
+        ``CWE-`` text is removed from the id and anything that is not purely
+        digits afterwards is skipped. Returns a list of ints, possibly empty.
+        """
         cwes = []
         for class_info in attributes.get("classes", []):
             if class_info.get("source") == "CWE":
                 cwe_id = class_info.get("id", "").replace("CWE-", "")
                 if cwe_id.isdigit():
                     cwes.append(int(cwe_id))
 
-        # Extract location information, fixability and collect all source locations for impact
+        return cwes
+
+    def extract_if_fix_is_available(self, finding_type, coordinates):
+        """
+        Report whether any coordinate carries a truthy fix flag for ``finding_type``.
+
+        ``code`` issues consult the three ``is_fixable_*`` flags;
+        ``package_vulnerability`` issues additionally consult ``is_patchable``,
+        ``is_pinnable`` and ``is_upgradeable``. Any other type, or
+        ``coordinates`` being ``None``, yields ``False``.
+        """
+        if coordinates is None:
+            return False
+
+        fixable_flags = ("is_fixable_snyk", "is_fixable_upstream", "is_fixable_manually")
+        flags_by_type = {
+            "code": fixable_flags,
+            "package_vulnerability": (*fixable_flags, "is_patchable", "is_pinnable", "is_upgradeable"),
+        }
+        # Unknown types map to no flags, so nothing can match below
+        flags_to_check = flags_by_type.get(finding_type, ())
+
+        return any(
+            coordinate.get(flag)
+            for coordinate in coordinates
+            for flag in flags_to_check
+        )
+
+    def extract_coordinate_data(self, is_type_code, coordinates):
         file_path = None
-        line = None
-        fix_available = False
+        line = None  # Always None for SCA
+        component_name = None
+        component_version = None
+        reachable = False   # SCA only
         impact_locations = []
 
-        for coordinate in attributes.get("coordinates", []):
-            # Check if any fix is available
-            if coordinate.get("is_fixable_snyk") or \
-               coordinate.get("is_fixable_upstream") or \
-               coordinate.get("is_fixable_manually"):
-                fix_available = True
+        for coordinate in coordinates:
+            if not is_type_code:
+                if coordinate.get("reachability") != "not-applicable":
+                    reachable = True
 
             for representation in coordinate.get("representations", []):
-                if "sourceLocation" in representation:
+                if not is_type_code:
+                    if "dependency" in representation:
+                        dependency = representation["dependency"]
+                        component_name = dependency.get("package_name")
+                        component_version = dependency.get("package_version")
+                        file_path = component_name
+                elif "sourceLocation" in representation:
                     location = representation["sourceLocation"]
                     region = location.get("region", {})
                     start = region.get("start", {})
@@ -100,6 +116,94 @@ def get_finding(self, issue, test):
                         if region:
                             line = start.get("line")
 
+        return file_path, line, component_name, component_version, reachable, impact_locations
+
+    def get_exploit_details(self, exploit_details):
+        """
+        Build the impact lines describing known exploit sources.
+
+        Returns a two-item list (the joined sources followed by an empty
+        spacer line) or ``None`` when there are no exploit details or no
+        sources to report.
+        """
+        if not exploit_details:
+            return None
+
+        exploit_sources = exploit_details.get("sources", [])
+        if not exploit_sources:
+            return None
+
+        joined_sources = ", ".join(exploit_sources)
+        return [f"Exploit Sources: {joined_sources}", ""]
+
+    def extract_problems(self, problems):
+        """
+        Describe the first entry of ``problems`` as a list of impact lines.
+
+        Missing fields are rendered as ``Unknown``; a missing or empty URL is
+        rendered as an empty string in the URL position. The list ends with
+        an empty spacer line. Returns ``None`` when ``problems`` is empty.
+        """
+        if not problems:
+            return None
+
+        # Only the first problem is described
+        first = problems[0]
+        url = first.get("url")
+        url_line = f"URL: {url}" if url else ""
+
+        lines = [
+            f"id: {first.get('id', 'Unknown')}",
+            f"Source: {first.get('source', 'Unknown')}",
+            f"Type: {first.get('type', 'Unknown')}",
+            url_line,
+            f"Last Updated: {first.get('updated_at', 'Unknown')}",
+        ]
+        lines.append("")  # Empty line before locations
+        return lines
+
+    def extract_problem_ids(self, problems):
+        """
+        Return the ``id`` of every problem that has one, in input order.
+
+        An empty or missing ``problems`` value gives an empty list.
+        """
+        if not problems:
+            return []
+
+        # Each id is kept as a whole string; entries without an "id" key are skipped
+        return [entry["id"] for entry in problems if "id" in entry]
+
+    def extract_risk_score(self, risk):
+        """
+        Format the risk score found under ``risk["score"]`` as one line of text.
+
+        Returns ``None`` when ``risk`` is empty, has no ``score`` key, or the
+        score is not a dict. Missing ``value``/``model`` entries render as
+        ``N/A``.
+        """
+        if not risk or "score" not in risk:
+            return None
+
+        score_info = risk["score"]
+        if not isinstance(score_info, dict):
+            return None
+
+        value = score_info.get("value", "N/A")
+        model = score_info.get("model", "N/A")
+        return f"Risk Score: {value} (Model: {model})"
+
+    def extract_cvss_severities(self, severities, version):
+        """
+        Return ``(vector, score)`` of the first severity matching ``version``.
+
+        A severity matches when ``version`` occurs in its ``version`` value
+        (so ``"3"`` matches ``"3.1"``). Entries without a ``version`` are
+        skipped instead of raising, and a missing ``severities`` value is
+        treated as empty. Returns ``(None, None)`` when nothing matches.
+        """
+        for severity in severities or []:
+            reported_version = severity.get("version")
+            if reported_version is None:
+                # `x in None` would raise TypeError; an unversioned entry cannot match
+                continue
+            if version in str(reported_version):
+                # returning first matching severity
+                return severity.get("vector"), severity.get("score")
+
+        return None, None
+
+    def extract_convert_created_date(self, created_at):
+        """
+        Convert an ISO 8601 timestamp string to ``yyyy-mm-dd``.
+
+        Returns ``None`` when ``created_at`` is empty, is not a string, or
+        cannot be parsed.
+        """
+        if not created_at:
+            return None
+
+        try:
+            # datetime.fromisoformat only accepts a trailing "Z" from Python 3.11 on;
+            # spell it as an explicit UTC offset so older interpreters parse it too
+            iso_text = created_at[:-1] + "+00:00" if created_at.endswith("Z") else created_at
+            return datetime.fromisoformat(iso_text).strftime("%Y-%m-%d")
+        except (ValueError, AttributeError, TypeError):
+            # Unparseable or non-string input: leave the date unset rather than fail the import
+            return None
+
+    def get_finding(self, issue, test):
+        # Check top-level type must be "issue" as "packages" have their own API it seems.
+        if not issue or issue.get("type") != "issue":
+            return None
+
+        attributes = issue.get("attributes", {})
+
+        # Check attributes-level type - support both code and package_vulnerability
+        issue_type = attributes.get("type")
+
+        if issue_type not in {"code", "package_vulnerability"}:
+            return None
+
+        cwes = self.extract_cwe_classes(attributes)
+
+        impact_details = []
+
+        problem = self.extract_problems(attributes.get("problems", []))
+        if problem:
+            impact_details.extend(problem)
+
+        # Add exploit details if available, SCA only
+        exploit_details = self.get_exploit_details(attributes.get("exploit_details", {}))
+        if exploit_details:
+            impact_details.extend(exploit_details)
+
         # Map severity levels
         severity_map = {
             "critical": "Critical",
@@ -108,16 +212,30 @@ def get_finding(self, issue, test):
             "low": "Low",
             "info": "Info",
         }
+
         severity = severity_map.get(attributes.get("effective_severity_level", "").lower(), "Info")
 
-        # Parse created_at date
-        created = None
-        if attributes.get("created_at"):
-            with suppress(ValueError):
-                created = datetime.strptime(attributes["created_at"], "%Y-%m-%dT%H:%M:%S.%fZ")
-            if not created:
-                with suppress(ValueError):
-                    created = datetime.strptime(attributes["created_at"], "%Y-%m-%dT%H:%M:%SZ")
+        created = self.extract_convert_created_date(attributes.get("created_at"))
+
+        is_out_of_scope = False  # attributes.get("is_out_of_scope", False)
+
+        file_path, line, component_name, component_version, reachable, impact_locations = self.extract_coordinate_data(issue_type == "code", attributes.get("coordinates", []))
+
+        # Locations (Code only)
+        if impact_locations:
+            for location in impact_locations:
+                impact_details.extend(location)
+
+        # Add package details (SCA only)
+        if component_name:
+            impact_details.extend([
+                "Package Details:",
+                f"Package: {component_name}",
+                f"Version: {component_version or 'Unknown'}",
+                "",
+            ])
+
+        impact_details.append(f"Reachable: {'Yes' if reachable else 'No'}")
 
         # Create finding
         finding = Finding(
@@ -130,50 +248,51 @@ def get_finding(self, issue, test):
             unique_id_from_tool=issue.get("id"),
             file_path=file_path,
             line=line,
-            out_of_scope=attributes.get("ignored", False),
+            out_of_scope=is_out_of_scope,
             active=attributes.get("status") == "open" and not attributes.get("ignored", False),
-            verified=True,
+            # not all open issues are verified, only fixed and ignored
+            verified=attributes.get("ignored", True) or attributes.get("status") == "resolved",
+            false_p=attributes.get("ignored"),
+            # mitigated is type "date", not "boolean"
+            is_mitigated=attributes.get("status") == "resolved",
             cwe=cwes[0] if cwes else None,
             date=created,
+            component_name=component_name,
+            component_version=component_version,
+            risk_accepted=False,
         )
 
-        # Set fix_available if the field exists in the model
-        if hasattr(finding, "fix_available"):
-            finding.fix_available = fix_available
+        # sca only
+        if attributes.get("key"):
+            finding.vuln_id_from_tool = attributes.get("key")
+
+        if attributes.get("severities"):
+            v3vector, v3score = self.extract_cvss_severities(attributes.get("severities", {}), "3")
+            v4vector, v4score = self.extract_cvss_severities(attributes.get("severities", {}), "4")
+
+            if v3vector and v3score:
+                finding.cvssv3 = v3vector
+                finding.cvssv3_score = v3score
+
+            if v4vector and v4score:
+                finding.cvssv4 = v4vector
+                finding.cvssv4_score = v4score
+
+        finding.unsaved_vulnerability_ids = self.extract_problem_ids(attributes.get("problems", []))
+
+        finding.fix_available = self.extract_if_fix_is_available(issue_type, attributes.get("coordinates", []))
 
         # Add risk score if available
-        risk = attributes.get("risk", {})
-        if risk and "score" in risk:
-            score = risk["score"]
-            if isinstance(score, dict):
-                finding.severity_justification = (
-                    f"Risk Score: {score.get('value', 'N/A')} "
-                    f"(Model: {score.get('model', 'N/A')})"
-                )
+        risk = self.extract_risk_score(attributes.get("risk", {}))
+
+        if risk:
+            finding.severity_justification = risk
 
         # Add additional CWEs as references
         if len(cwes) > 1:
             finding.references = "Additional CWEs: " + ", ".join(f"CWE-{cwe}" for cwe in cwes[1:])
 
-        # Add problem details and all source locations to impact
-        impact_details = []
-
-        # Add problem information
-        problems = attributes.get("problems", [])
-        if problems:
-            problem = problems[0]  # Take the first problem
-            impact_details.extend([
-                f"Source: {problem.get('source', 'Unknown')}",
-                f"Type: {problem.get('type', 'Unknown')}",
-                f"Last Updated: {problem.get('updated_at', 'Unknown')}",
-                f"Severity: {severity}",
-                "",  # Empty line before locations
-            ])
-
-        # Add all source locations
-        for location in impact_locations:
-            impact_details.extend(location)
-
+        # Set impact with details
         if impact_details:
             finding.impact = "\n".join(impact_details).rstrip()
Original file line number	Diff line number	Diff line change
`@@ -1366,6 +1366,7 @@ def saml2_attrib_map_format(din):`
`1366`	`1366`	`"Cyberwatch scan (Galeax)": ["title", "description", "severity"],`
`1367`	`1367`	`"Cycognito Scan": ["title", "severity"],`
`1368`	`1368`	`"OpenVAS Parser v2": ["title", "severity", "vuln_id_from_tool", "endpoints"],`
	`1369`	`+ "Snyk Issue API Scan": ["vuln_id_from_tool", "file_path"],`
`1369`	`1370`	`}`
`1370`	`1371`
`1371`	`1372`	`# Override the hardcoded settings here via the env var`
`@@ -1625,6 +1626,7 @@ def saml2_attrib_map_format(din):`
`1625`	`1626`	`"Qualys Hacker Guardian Scan": DEDUPE_ALGO_HASH_CODE,`
`1626`	`1627`	`"Cyberwatch scan (Galeax)": DEDUPE_ALGO_HASH_CODE,`
`1627`	`1628`	`"OpenVAS Parser v2": DEDUPE_ALGO_HASH_CODE,`
	`1629`	`+ "Snyk Issue API Scan": DEDUPE_ALGO_HASH_CODE,`
`1628`	`1630`	`}`
`1629`	`1631`
`1630`	`1632`	`# Override the hardcoded settings here via the env var`