PyPI - owasp-depscan - Versions diffs - 5.5.0__py3-none-any.whl → 6.0.0a3__py3-none-any.whl - Mend

owasp-depscan 5.5.0__py3-none-any.whl → 6.0.0a3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34)

depscan/__init__.py +8 -0
depscan/cli.py +719 -827
depscan/cli_options.py +302 -0
depscan/lib/audit.py +3 -1
depscan/lib/bom.py +387 -289
depscan/lib/config.py +86 -337
depscan/lib/explainer.py +389 -101
depscan/lib/license.py +11 -10
depscan/lib/logger.py +65 -17
depscan/lib/package_query/__init__.py +0 -0
depscan/lib/package_query/cargo_pkg.py +124 -0
depscan/lib/package_query/metadata.py +170 -0
depscan/lib/package_query/npm_pkg.py +345 -0
depscan/lib/package_query/pkg_query.py +195 -0
depscan/lib/package_query/pypi_pkg.py +113 -0
depscan/lib/tomlparse.py +116 -0
depscan/lib/utils.py +34 -188
owasp_depscan-6.0.0a3.dist-info/METADATA +388 -0
{owasp_depscan-5.5.0.dist-info → owasp_depscan-6.0.0a3.dist-info}/RECORD +28 -25
{owasp_depscan-5.5.0.dist-info → owasp_depscan-6.0.0a3.dist-info}/WHEEL +1 -1
vendor/choosealicense.com/_licenses/cern-ohl-p-2.0.txt +1 -1
vendor/choosealicense.com/_licenses/cern-ohl-s-2.0.txt +1 -1
vendor/choosealicense.com/_licenses/cern-ohl-w-2.0.txt +2 -2
vendor/choosealicense.com/_licenses/mit-0.txt +1 -1
vendor/spdx/json/licenses.json +904 -677
depscan/lib/analysis.py +0 -1554
depscan/lib/csaf.py +0 -1860
depscan/lib/normalize.py +0 -312
depscan/lib/orasclient.py +0 -142
depscan/lib/pkg_query.py +0 -532
owasp_depscan-5.5.0.dist-info/METADATA +0 -580
{owasp_depscan-5.5.0.dist-info → owasp_depscan-6.0.0a3.dist-info}/entry_points.txt +0 -0
{owasp_depscan-5.5.0.dist-info → owasp_depscan-6.0.0a3.dist-info/licenses}/LICENSE +0 -0
{owasp_depscan-5.5.0.dist-info → owasp_depscan-6.0.0a3.dist-info}/top_level.txt +0 -0

depscan/lib/explainer.py CHANGED Viewed

@@ -1,69 +1,197 @@
-import json
 import os
 import re
+import glob
+from collections import defaultdict
+from custom_json_diff.lib.utils import json_load
 from rich import box
 from rich.markdown import Markdown
 from rich.table import Table
 from rich.tree import Tree
-from depscan.lib.config import max_purl_per_flow, max_reachable_explanations
-from depscan.lib.logger import console
+from depscan.lib.config import (
+    COMMON_CHECK_TAGS,
+    max_purl_per_flow,
+    max_reachable_explanations,
+    max_purls_reachable_explanations,
+    max_source_reachable_explanations,
+    max_sink_reachable_explanations,
+)
+from depscan.lib.logger import console, LOG
-def explain(
-    project_type,
-    src_dir,
-    reachables_slices_file,
-    vdr_file,
-    pkg_vulnerabilities,
-    pkg_group_rows,
-    direct_purls,
-    reached_purls,
-):
+def explain(project_type, src_dir, bom_dir, vdr_file, vdr_result, explanation_mode):
     """
-    Explain the analysis and findings
+    Explain the analysis and findings based on the explanation mode.
     :param project_type: Project type
     :param src_dir: Source directory
-    :param reachables_slices_file: Reachables slices file
-    :param vdr_file: VDR file from the summariser
-    :param pkg_vulnerabilities: Vulnerabilities from the analysis
-    :param pkg_group_rows: Prioritized list of purls
-    :param direct_purls: Dict containing packages used directly
-    :param reached_purls: Dict containing packages identified via reachables slicing
+    :param bom_dir: BOM directory
+    :param vdr_file: VDR file
+    :param vdr_result: VDR Result
+    :param explanation_mode: Explanation mode
     """
-    if (
-        not reachables_slices_file
-        and src_dir
-        and os.path.exists(os.path.join(src_dir, "reachables.slices.json"))
+    pattern_methods = {}
+    has_any_explanation = False
+    has_any_crypto_flows = False
+    slices_files = glob.glob(f"{bom_dir}/**/*reachables.slices.json", recursive=True)
+    openapi_spec_files = None
+    # Should we explain the endpoints and Code Hotspots
+    if explanation_mode in (
+        "Endpoints",
+        "EndpointsAndReachables",
     ):
-        reachables_slices_file = os.path.join(src_dir, "reachables.slices.json")
-    if reachables_slices_file:
-        with open(reachables_slices_file, "r", encoding="utf-8") as f:
-            reachables_data = json.load(f)
-            if reachables_data and reachables_data.get("reachables"):
+        openapi_spec_files = glob.glob(f"{bom_dir}/*openapi*.json", recursive=False)
+        if not openapi_spec_files:
+            openapi_spec_files = glob.glob(f"{src_dir}/*openapi*.json", recursive=False)
+    if openapi_spec_files:
+        rsection = Markdown("""## Service Endpoints
+The following endpoints and code hotspots were identified by depscan. Verify that proper authentication and authorization mechanisms are in place to secure them.""")
+        console.print(rsection)
+        for ospec in openapi_spec_files:
+            pattern_methods = print_endpoints(ospec)
+    # Return early for endpoints only explanations
+    if explanation_mode in ("Endpoints",):
+        return
+    section_title = (
+        "Non-Reachable Flows"
+        if explanation_mode in ("NonReachables",)
+        else "Reachable Flows"
+    )
+    for sf in slices_files:
+        if len(slices_files) > 1:
+            fn = os.path.basename(sf)
+            section_label = f"# Explanations for {sf}"
+            if "-" in fn:
+                section_label = f"# Explanations for {fn.split('-')[0].upper()}"
+            console.print(Markdown(section_label))
+        if (reachables_data := json_load(sf, log=LOG)) and reachables_data.get(
+            "reachables"
+        ):
+            if explanation_mode in ("NonReachables",):
                 rsection = Markdown(
-                    """## Reachable Flows
+                    f"""## {section_title}
-Below are some reachable flows identified by depscan. Use the provided tips to improve the securability of your application.
+Below are several data flows deemed safe and non-reachable. Use the provided tips to confirm this assessment.
                 """
                 )
-                console.print(rsection)
-                explain_reachables(
-                    reachables_data, pkg_group_rows, project_type
+            elif pattern_methods:
+                rsection = Markdown(
+                    f"""## {section_title}
+Below are some reachable flows, including those accessible via endpoints, identified by depscan. Use the generated OpenAPI specification to evaluate these endpoints for vulnerabilities and risk.
+                """
+                )
+            else:
+                rsection = Markdown(
+                    f"""## {section_title}
+Below are several data flows identified by depscan, including reachable ones. Use the tips provided to strengthen your application’s security posture.
+                """
                 )
+            has_explanation, has_crypto_flows, tips = explain_reachables(
+                explanation_mode,
+                reachables_data,
+                project_type,
+                vdr_result,
+                rsection if not has_any_explanation else None,
+            )
+            if not has_any_explanation and has_explanation:
+                has_any_explanation = True
+            if not has_any_crypto_flows and has_crypto_flows:
+                has_any_crypto_flows = True
+def _track_usage_targets(usage_targets, usages_object):
+    for k, v in usages_object.items():
+        for file, lines in v.items():
+            for l in lines:
+                usage_targets.add(f"{file}#{l}")
-def explain_reachables(reachables, pkg_group_rows, project_type):
+def print_endpoints(ospec):
+    if not ospec:
+        return
+    paths = json_load(ospec).get("paths") or {}
+    pattern_methods = defaultdict(list)
+    pattern_usage_targets = defaultdict(set)
+    for pattern, path_obj in paths.items():
+        usage_targets = set()
+        http_method_added = False
+        for k, v in path_obj.items():
+            if k == "parameters":
+                continue
+            # Java, JavaScript, Python etc
+            if k == "x-atom-usages":
+                _track_usage_targets(usage_targets, v)
+                continue
+            if isinstance(v, dict) and v.get("x-atom-usages"):
+                _track_usage_targets(usage_targets, v.get("x-atom-usages"))
+            pattern_methods[pattern].append(k)
+            http_method_added = True
+        pattern_usage_targets[pattern] = usage_targets
+        # We see an endpoint, but do not know the HTTP methods.
+        # Let's track them as empty
+        if not http_method_added and usage_targets:
+            pattern_methods[pattern].append("")
+    caption = ""
+    if pattern_methods:
+        caption = f"Identified Endpoints: {len(pattern_methods.keys())}"
+    rtable = Table(
+        box=box.DOUBLE_EDGE,
+        show_lines=True,
+        title="Endpoints",
+        caption=caption,
+    )
+    for c in ("URL Pattern", "HTTP Methods", "Code Hotspots"):
+        rtable.add_column(header=c, vertical="top")
+    for k, v in pattern_methods.items():
+        v.sort()
+        sorted_areas = list(pattern_usage_targets[k])
+        sorted_areas.sort()
+        rtable.add_row(k, ("\n".join(v)).upper(), "\n".join(sorted_areas))
+    if pattern_methods:
+        console.print()
+        console.print(rtable)
+    return pattern_methods
+def is_cpp_flow(flows):
+    if not flows:
+        return False
+    attempts = 0
+    for idx, aflow in enumerate(flows):
+        if aflow.get("parentFileName", "").endswith(".c") or aflow.get(
+            "parentFileName", ""
+        ).endswith(".cpp"):
+            return True
+        attempts += 1
+        if attempts > 3:
+            return False
+    return False
+def explain_reachables(
+    explanation_mode, reachables, project_type, vdr_result, header_section=None
+):
     """"""
     reachable_explanations = 0
     checked_flows = 0
+    has_crypto_flows = False
+    purls_reachable_explanations = defaultdict(int)
+    source_reachable_explanations = defaultdict(int)
+    sink_reachable_explanations = defaultdict(int)
+    has_explanation = False
+    header_shown = False
+    has_cpp_flow = False
     for areach in reachables.get("reachables", []):
+        cpp_flow = is_cpp_flow(areach.get("flows"))
+        if not has_cpp_flow and cpp_flow:
+            has_cpp_flow = True
         if (
             not areach.get("flows")
             or len(areach.get("flows")) < 2
-            or not areach.get("purls")
+            or (not areach.get("purls") and not cpp_flow)
         ):
             continue
         # Focus only on the prioritized list if available
@@ -74,11 +202,55 @@ def explain_reachables(reachables, pkg_group_rows, project_type):
         #             is_prioritized = True
         #     if not is_prioritized:
         #         continue
-        flow_tree, comment, source_sink_desc, has_check_tag = explain_flows(
-            areach.get("flows"), areach.get("purls"), project_type
+        (
+            flow_tree,
+            comment,
+            source_sink_desc,
+            source_code_str,
+            sink_code_str,
+            has_check_tag,
+            is_endpoint_reachable,
+            is_crypto_flow,
+        ) = explain_flows(
+            explanation_mode,
+            areach.get("flows"),
+            areach.get("purls"),
+            project_type,
+            vdr_result,
         )
-        if not source_sink_desc or not flow_tree:
+        if not source_sink_desc or not flow_tree or len(flow_tree.children) < 5:
             continue
+        # In non-reachables mode, we are not interested in reachable flows.
+        if (
+            explanation_mode
+            and explanation_mode in ("NonReachables",)
+            and not has_check_tag
+        ):
+            continue
+        if (
+            source_code_str
+            and source_reachable_explanations[source_code_str] + 1
+            > max_source_reachable_explanations
+        ):
+            continue
+        if (
+            sink_code_str
+            and sink_reachable_explanations[sink_code_str] + 1
+            > max_sink_reachable_explanations
+        ):
+            continue
+        purls_str = ",".join(sorted(areach.get("purls", [])))
+        if (
+            purls_str
+            and purls_reachable_explanations[purls_str] + 1
+            > max_purls_reachable_explanations
+        ):
+            continue
+        if not has_explanation:
+            has_explanation = True
+        # Did we find any crypto flows
+        if is_crypto_flow and not has_crypto_flows:
+            has_crypto_flows = True
         rtable = Table(
             box=box.DOUBLE_EDGE,
             show_lines=True,
@@ -90,31 +262,80 @@ def explain_reachables(reachables, pkg_group_rows, project_type):
         )
         rtable.add_column(header="Flow", vertical="top")
         rtable.add_row(flow_tree)
+        # Print the header first in case we haven't
+        if not header_shown and header_section:
+            console.print()
+            console.print(header_section)
+            header_shown = True
         console.print()
         console.print(rtable)
         reachable_explanations += 1
+        if purls_str:
+            purls_reachable_explanations[purls_str] += 1
+        if source_code_str:
+            source_reachable_explanations[source_code_str] += 1
+        if sink_code_str:
+            sink_reachable_explanations[sink_code_str] += 1
         if has_check_tag:
             checked_flows += 1
         if reachable_explanations + 1 > max_reachable_explanations:
             break
-    if reachable_explanations:
-        tips = """## Secure Design Tips"""
-        if checked_flows:
+    tips = """## Secure Design Tips"""
+    if explanation_mode in ("NonReachables",):
+        tips += """
+- Automate tests (including fuzzing) to verify validation, sanitization, encoding, and encryption.
+- Align the implementation with the original architecture and threat models to ensure security compliance.
+- Extract reusable methods into a shared library for organization-wide use.
+"""
+    elif has_explanation:
+        if has_crypto_flows:
             tips += """
-- Review the detected validation/sanitization methods in the application.
-- To improve the security posture, implement a common validation middleware.
+- Generate a Cryptographic BOM with cdxgen and monitor it in Dependency-Track.
+"""
+        elif checked_flows:
+            if not has_cpp_flow:
+                tips += """
+- Review the validation and sanitization methods used in the application.
+- To enhance the security posture, implement a common validation middleware.
+"""
+            else:
+                tips += """
+- Continuously fuzz the parser and validation functions with diverse payloads.
+- Generate post-build SBOMs with OWASP blint by building this project for various architecture combinations. Re-run depscan with the `--bom-dir` argument to enhance the analysis.
+"""
+        elif purls_reachable_explanations:
+            tips += """
+- Consider implementing a common validation and sanitization library to reduce the risk of exploitability.
 """
         else:
             tips += """
-- Consider implementing a common validation/sanitization library to reduce the exploitability risk.
+- Enhance your unit and integration tests to cover the flows listed above.
+- Continuously fuzz the parser and validation functions with diverse payloads.
 """
+    if tips:
         rsection = Markdown(tips)
         console.print(rsection)
+    return has_explanation, has_crypto_flows, tips
-def flow_to_source_sink(idx, flow, purls, project_type):
+def flow_to_source_sink(idx, flow, purls, project_type, vdr_result):
     """ """
+    endpoint_reached_purls = {}
+    reached_services = {}
+    if vdr_result:
+        endpoint_reached_purls = vdr_result.endpoint_reached_purls
+        reached_services = vdr_result.reached_services
+    is_endpoint_reachable = False
+    possible_reachable_service = False
+    tags = flow.get("tags", [])
+    is_crypto_flow = "crypto" in tags or "crypto-generate" in tags
+    method_in_emoji = ":right_arrow_curving_left:"
+    for p in purls:
+        if endpoint_reached_purls and endpoint_reached_purls.get(p):
+            is_endpoint_reachable = True
+            method_in_emoji = ":heavy_large_circle: "
+        if reached_services and reached_services.get(p):
+            possible_reachable_service = True
     source_sink_desc = ""
     param_name = flow.get("name")
     method_str = "method"
@@ -130,25 +351,27 @@ def flow_to_source_sink(idx, flow, purls, project_type):
         if parent_method in ("handleRequest",):
             method_str = f"handler {method_str}"
         elif parent_method in ("__construct", "__init"):
-            method_str = f"constructor"
+            method_str = "constructor"
         elif project_type in ("php",) and parent_method.startswith("__"):
             method_str = f"magic {method_str}"
     if flow.get("label") == "METHOD_PARAMETER_IN":
         if param_name:
-            source_sink_desc = f"""{param_str} [red]{param_name}[/red] :right_arrow_curving_left: to the {method_str} [bold]{parent_method}[/bold]"""
+            source_sink_desc = f"""{param_str} [red]{param_name}[/red] {method_in_emoji} to the {method_str} [bold]{parent_method}[/bold]"""
         else:
-            source_sink_desc = f"""{method_str.capitalize()} [red]{parent_method}[/red] :right_arrow_curving_left:"""
+            source_sink_desc = f"""{method_str.capitalize()} [red]{parent_method}[/red] {method_in_emoji}"""
     elif flow.get("label") == "CALL" and flow.get("isExternal"):
         method_full_name = flow.get("fullName", "")
         if not method_full_name.startswith("<"):
             source_sink_desc = f"Invocation: {method_full_name}"
     elif flow.get("label") == "RETURN" and flow.get("code"):
         source_sink_desc = flow.get("code").split("\n")[0]
-    elif project_type not in ("java") and flow.get("label") == "IDENTIFIER":
+    elif project_type not in ("java",) and flow.get("label") == "IDENTIFIER":
         source_sink_desc = flow.get("code").split("\n")[0]
+        if source_sink_desc.endswith("("):
+            source_sink_desc = f":diamond_suit: {source_sink_desc})"
     # Try to understand the source a bit more
     if source_sink_desc.startswith("require("):
-        source_sink_desc = "Flow starts from a module import"
+        source_sink_desc = "The flow originates from a module import."
     elif (
         ".use(" in source_sink_desc
         or ".subscribe(" in source_sink_desc
@@ -156,21 +379,41 @@ def flow_to_source_sink(idx, flow, purls, project_type):
         or ".emit(" in source_sink_desc
         or " => {" in source_sink_desc
     ):
-        source_sink_desc = "Flow starts from a callback function"
+        source_sink_desc = "The flow originates from a callback function."
     elif (
-        "middleware" in source_sink_desc.lower()
-        or "route" in source_sink_desc.lower()
+        "middleware" in source_sink_desc.lower() or "route" in source_sink_desc.lower()
     ):
-        source_sink_desc = "Flow starts from a middlware"
+        source_sink_desc = "The flow originates from middleware."
+    elif len(purls) == 0:
+        if tags:
+            source_sink_desc = (
+                f"{source_sink_desc} can be used to reach packages with tags `{tags}`"
+            )
     elif len(purls) == 1:
-        source_sink_desc = (
-            f"{source_sink_desc} can be used to reach this package."
-        )
+        if is_endpoint_reachable:
+            source_sink_desc = f"{source_sink_desc} can be used to reach this package from certain endpoints."
+        elif source_sink_desc:
+            if is_crypto_flow:
+                source_sink_desc = "Reachable crypto-flow."
+            else:
+                source_sink_desc = "Reachable data-flow."
     else:
-        source_sink_desc = (
-            f"{source_sink_desc} can be used to reach {len(purls)} packages."
-        )
-    return source_sink_desc
+        if is_endpoint_reachable:
+            source_sink_desc = f"{source_sink_desc} can be used to reach {len(purls)} packages from certain endpoints."
+        else:
+            if source_sink_desc:
+                source_sink_desc = (
+                    f"{source_sink_desc} can be used to reach {len(purls)} packages."
+                )
+            elif is_crypto_flow:
+                source_sink_desc = (
+                    f"{len(purls)} packages reachable from this crypto-flow."
+                )
+            else:
+                source_sink_desc = (
+                    f"{len(purls)} packages reachable from this data-flow."
+                )
+    return source_sink_desc, is_endpoint_reachable, is_crypto_flow
 def filter_tags(tags):
@@ -178,14 +421,32 @@ def filter_tags(tags):
         tags = [
             atag
             for atag in tags.split(", ")
-            if atag
-            not in ("RESOLVED_MEMBER", "UNKNOWN_METHOD", "UNKNOWN_TYPE_DECL")
+            if atag not in ("RESOLVED_MEMBER", "UNKNOWN_METHOD", "UNKNOWN_TYPE_DECL")
         ]
         return ", ".join(tags)
     return tags
-def flow_to_str(flow, project_type):
+def is_filterable_code(project_type, code):
+    if len(code) < 5:
+        return True
+    for c in (
+        "console.log",
+        "thoughtLog(",
+        "_tmp_",
+        "LOG.debug(",
+        "options.get(",
+        "RET",
+        "this.",
+        "NULL",
+        "!",
+    ):
+        if code and code.startswith(c):
+            return True
+    return False
+def flow_to_str(explanation_mode, flow, project_type):
     """"""
     has_check_tag = False
     file_loc = ""
@@ -194,60 +455,69 @@ def flow_to_str(flow, project_type):
         and flow.get("lineNumber")
         and not flow.get("parentFileName").startswith("unknown")
     ):
-        file_loc = f'{flow.get("parentFileName").replace("src/main/java/", "").replace("src/main/scala/", "")}#{flow.get("lineNumber")}    '
+        file_loc = f"{flow.get('parentFileName').replace('src/main/java/', '').replace('src/main/scala/', '')}#{flow.get('lineNumber')}    "
     node_desc = flow.get("code").split("\n")[0]
+    if node_desc.endswith("("):
+        node_desc = f":diamond_suit: {node_desc})"
+    elif node_desc.startswith("return "):
+        node_desc = f":arrow_backward: [italic]{node_desc}[/italic]"
     tags = filter_tags(flow.get("tags"))
-    if flow.get("label") == "METHOD_PARAMETER_IN":
+    if flow.get("label") in ("METHOD_PARAMETER_IN",):
         param_name = flow.get("name")
         if param_name == "this":
             param_name = ""
-        node_desc = f'{flow.get("parentMethodName")}([red]{param_name}[/red]) :right_arrow_curving_left:'
+        node_desc = f"{flow.get('parentMethodName')}([red]{param_name}[/red]) :right_arrow_curving_left:"
         if tags:
-            node_desc = (
-                f"{node_desc}\n[bold]Tags:[/bold] [italic]{tags}[/italic]\n"
-            )
-    elif flow.get("label") == "IDENTIFIER":
+            node_desc = f"{node_desc}\n[bold]Tags:[/bold] [italic]{tags}[/italic]\n"
+    elif flow.get("label") in ("IDENTIFIER", "CALL"):
         if node_desc.startswith("<"):
             node_desc = flow.get("name")
+        if flow.get("isExternal"):
+            node_desc = f"{node_desc} :right_arrow_curving_up:"
         if tags:
-            node_desc = (
-                f"{node_desc}\n[bold]Tags:[/bold] [italic]{tags}[/italic]\n"
-            )
-    if tags:
-        for ctag in (
-            "validation",
-            "encode",
-            "encrypt",
-            "sanitize",
-            "authentication",
-            "authorization",
-        ):
+            node_desc = f"{node_desc}\n[bold]Tags:[/bold] [italic]{tags}[/italic]\n"
+    if tags and not is_filterable_code(project_type, node_desc):
+        for ctag in COMMON_CHECK_TAGS:
             if ctag in tags:
                 has_check_tag = True
                 break
     if has_check_tag:
-        node_desc = f"[green]{node_desc}[/green]"
+        if explanation_mode in ("NonReachables",):
+            node_desc = f"[bold][green]{node_desc}[/green][/bold]"
+        else:
+            node_desc = f"[green]{node_desc}[/green]"
+    flow_str = (
+        f"""[gray37]{file_loc}[/gray37]{node_desc}"""
+        if not is_filterable_code(project_type, node_desc)
+        else ""
+    )
     return (
         file_loc,
-        f"""[gray37]{file_loc}[/gray37]{node_desc}""",
+        flow_str,
+        node_desc,
         has_check_tag,
     )
-def explain_flows(flows, purls, project_type):
+def explain_flows(explanation_mode, flows, purls, project_type, vdr_result):
     """"""
     tree = None
     comments = []
     if len(purls) > max_purl_per_flow:
         comments.append(
-            ":exclamation_mark: Refactor this flow to reduce the number of external libraries used."
+            ":exclamation_mark: Refactor this flow to minimize the use of external libraries."
         )
-    purls_str = "\n".join(purls)
-    comments.append(f"[info]Reachable Packages:[/info]\n{purls_str}")
+    if purls:
+        purls_str = "\n".join(purls)
+        comments.append(f"[info]Reachable Packages:[/info]\n{purls_str}")
     added_flows = []
+    added_node_desc = []
     has_check_tag = False
     last_file_loc = None
     source_sink_desc = ""
+    last_code = ""
+    source_code_str = ""
+    sink_code_str = ""
     for idx, aflow in enumerate(flows):
         # For java, we are only interested in identifiers with tags to keep the flows simple to understand
         if (
@@ -256,28 +526,46 @@ def explain_flows(flows, purls, project_type):
             and not aflow.get("tags")
         ):
             continue
+        curr_code = aflow.get("code", "").split("\n")[0]
+        if idx == 0:
+            source_code_str = curr_code
+        if idx == len(flows):
+            sink_code_str = curr_code
+        if last_code and last_code == curr_code:
+            continue
+        last_code = curr_code
         if not source_sink_desc:
-            source_sink_desc = flow_to_source_sink(
-                idx, aflow, purls, project_type
+            source_sink_desc, is_endpoint_reachable, is_crypto_flow = (
+                flow_to_source_sink(idx, aflow, purls, project_type, vdr_result)
             )
-        file_loc, flow_str, has_check_tag_flow = flow_to_str(
-            aflow, project_type
+        file_loc, flow_str, node_desc, has_check_tag_flow = flow_to_str(
+            explanation_mode, aflow, project_type
         )
-        if last_file_loc == file_loc:
+        if not flow_str or (last_file_loc and last_file_loc == file_loc):
             continue
         last_file_loc = file_loc
-        if flow_str in added_flows:
+        if flow_str in added_flows or node_desc in added_node_desc:
             continue
         added_flows.append(flow_str)
+        added_node_desc.append(node_desc)
         if not tree:
             tree = Tree(flow_str)
         else:
             tree.add(flow_str)
         if has_check_tag_flow:
             has_check_tag = True
-    if has_check_tag:
+    if has_check_tag and explanation_mode not in ("NonReachables",):
         comments.insert(
             0,
-            ":white_medium_small_square: Check if the mitigation(s) used in this flow is valid and appropriate for your security requirements.",
+            ":white_medium_small_square: Verify that the mitigation(s) used in this flow are valid and appropriate for your security requirements.",
         )
-    return tree, "\n".join(comments), source_sink_desc, has_check_tag
+    return (
+        tree,
+        "\n".join(comments),
+        source_sink_desc,
+        source_code_str,
+        sink_code_str,
+        has_check_tag,
+        is_endpoint_reachable,
+        is_crypto_flow,
+    )

owasp-depscan 5.5.0__py3-none-any.whl → 6.0.0a3__py3-none-any.whl

owasp-depscan 5.5.0__py3-none-any.whl → 6.0.0a3__py3-none-any.whl