angr 9.2.92__py3-none-manylinux2014_x86_64.whl → 9.2.94__py3-none-manylinux2014_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of angr has been flagged as potentially problematic by the registry.
Files changed (45)
  1. angr/__init__.py +1 -1
  2. angr/analyses/cfg/cfg_base.py +20 -10
  3. angr/analyses/cfg/indirect_jump_resolvers/amd64_elf_got.py +1 -1
  4. angr/analyses/cfg/indirect_jump_resolvers/arm_elf_fast.py +89 -32
  5. angr/analyses/cfg/indirect_jump_resolvers/jumptable.py +276 -133
  6. angr/analyses/complete_calling_conventions.py +1 -1
  7. angr/analyses/decompiler/ail_simplifier.py +20 -0
  8. angr/analyses/decompiler/block_io_finder.py +293 -0
  9. angr/analyses/decompiler/block_similarity.py +190 -0
  10. angr/analyses/decompiler/callsite_maker.py +5 -0
  11. angr/analyses/decompiler/clinic.py +103 -1
  12. angr/analyses/decompiler/decompilation_cache.py +2 -0
  13. angr/analyses/decompiler/decompiler.py +21 -4
  14. angr/analyses/decompiler/optimization_passes/__init__.py +6 -0
  15. angr/analyses/decompiler/optimization_passes/code_motion.py +361 -0
  16. angr/analyses/decompiler/optimization_passes/optimization_pass.py +1 -0
  17. angr/analyses/decompiler/optimization_passes/stack_canary_simplifier.py +30 -18
  18. angr/analyses/decompiler/optimization_passes/switch_default_case_duplicator.py +110 -0
  19. angr/analyses/decompiler/peephole_optimizations/bswap.py +53 -2
  20. angr/analyses/decompiler/peephole_optimizations/eager_eval.py +20 -1
  21. angr/analyses/decompiler/structured_codegen/c.py +76 -41
  22. angr/analyses/decompiler/structuring/phoenix.py +41 -9
  23. angr/analyses/decompiler/utils.py +13 -4
  24. angr/analyses/propagator/engine_ail.py +3 -0
  25. angr/analyses/reaching_definitions/engine_ail.py +3 -0
  26. angr/analyses/reaching_definitions/reaching_definitions.py +7 -0
  27. angr/analyses/stack_pointer_tracker.py +60 -10
  28. angr/analyses/typehoon/simple_solver.py +95 -24
  29. angr/analyses/typehoon/typeconsts.py +1 -1
  30. angr/calling_conventions.py +0 -3
  31. angr/engines/pcode/cc.py +1 -1
  32. angr/engines/successors.py +6 -0
  33. angr/knowledge_plugins/propagations/states.py +2 -1
  34. angr/procedures/definitions/glibc.py +3 -1
  35. angr/procedures/definitions/parse_win32json.py +2135 -383
  36. angr/procedures/definitions/wdk_ntoskrnl.py +956 -0
  37. angr/sim_type.py +53 -13
  38. angr/utils/library.py +2 -2
  39. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/METADATA +6 -6
  40. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/RECORD +44 -41
  41. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/WHEEL +1 -1
  42. angr/procedures/definitions/wdk_ntdll.py +0 -994
  43. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/LICENSE +0 -0
  44. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/entry_points.txt +0 -0
  45. {angr-9.2.92.dist-info → angr-9.2.94.dist-info}/top_level.txt +0 -0
angr/analyses/decompiler/decompiler.py
@@ -10,7 +10,7 @@ import ailment
 from angr.analyses.cfg import CFGFast
 from ...knowledge_plugins.functions.function import Function
 from ...knowledge_base import KnowledgeBase
-from ...sim_variable import SimMemoryVariable
+from ...sim_variable import SimMemoryVariable, SimRegisterVariable, SimStackVariable
 from ...utils import timethis
 from .. import Analysis, AnalysesHub
 from .structuring import RecursiveStructurer, PhoenixStructurer
@@ -403,7 +403,7 @@ class Decompiler(Analysis):
             SimMemoryVariable(symbol.rebased_addr, 1, name=symbol.name, ident=ident),
         )

-    def reflow_variable_types(self, type_constraints: Set, var_to_typevar: Dict, codegen):
+    def reflow_variable_types(self, type_constraints: Set, func_typevar, var_to_typevar: Dict, codegen):
        """
        Re-run type inference on an existing variable recovery result, then rerun codegen to generate new results.

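In the next hunk, Typehoon receives the function's own type variable, only register and stack variables have their inferred types written back, and the recovered argument types are propagated into the function prototype. For illustration only, a minimal sketch of the filtering idea, using hypothetical stand-in classes (RegVar, StackVar, and MemVar are not angr names):

    class RegVar: pass      # stand-in for SimRegisterVariable
    class StackVar: pass    # stand-in for SimStackVariable
    class MemVar: pass      # stand-in for SimMemoryVariable

    var_to_typevar = {RegVar(): "tv0", StackVar(): "tv1", MemVar(): "tv2"}

    # Keep only local (register/stack) variables, mirroring the isinstance
    # filter in the hunk below; memory/global variables are excluded.
    local_only = {v: t for v, t in var_to_typevar.items() if isinstance(v, (RegVar, StackVar))}
    assert sorted(local_only.values()) == ["tv0", "tv1"]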
@@ -439,13 +439,30 @@
         try:
             tp = self.project.analyses.Typehoon(
                 type_constraints,
+                func_typevar,
                 kb=var_kb,
                 var_mapping=var_to_typevar,
                 must_struct=must_struct,
                 ground_truth=groundtruth,
             )
-            tp.update_variable_types(self.func.addr, var_to_typevar)
-            tp.update_variable_types("global", var_to_typevar)
+            tp.update_variable_types(
+                self.func.addr,
+                {v: t for v, t in var_to_typevar.items() if isinstance(v, (SimRegisterVariable, SimStackVariable))},
+            )
+            tp.update_variable_types(
+                "global",
+                {v: t for v, t in var_to_typevar.items() if isinstance(v, (SimRegisterVariable, SimStackVariable))},
+            )
+            # update the function prototype if needed
+            if self.func.prototype is not None and self.func.prototype.args:
+                var_manager = var_kb.variables[self.func.addr]
+                for i, arg in enumerate(codegen.cfunc.arg_list):
+                    if i >= len(self.func.prototype.args):
+                        break
+                    var = arg.variable
+                    new_type = var_manager.get_variable_type(var)
+                    if new_type is not None:
+                        self.func.prototype.args[i] = new_type
         except Exception:  # pylint:disable=broad-except
             l.warning(
                 "Typehoon analysis failed. Variables will not have types. Please report to GitHub.", exc_info=True
angr/analyses/decompiler/optimization_passes/__init__.py
@@ -22,6 +22,8 @@ from .flip_boolean_cmp import FlipBooleanCmp
 from .ret_deduplicator import ReturnDeduplicator
 from .win_stack_canary_simplifier import WinStackCanarySimplifier
 from .cross_jump_reverter import CrossJumpReverter
+from .code_motion import CodeMotionOptimization
+from .switch_default_case_duplicator import SwitchDefaultCaseDuplicator

 # order matters!
 _all_optimization_passes = [
@@ -38,15 +40,19 @@ _all_optimization_passes = [
     (ITERegionConverter, True),
     (ITEExprConverter, True),
     (ExprOpSwapper, True),
+    (SwitchDefaultCaseDuplicator, True),
     (ReturnDuplicator, True),
     (LoweredSwitchSimplifier, False),
     (ReturnDeduplicator, True),
+    (CodeMotionOptimization, True),
     (CrossJumpReverter, True),
     (FlipBooleanCmp, True),
 ]

 # these passes may duplicate code to remove gotos or improve the structure of the graph
 DUPLICATING_OPTS = [ReturnDuplicator, CrossJumpReverter]
+# these passes may destroy blocks by merging them into semantically equivalent blocks
+CONDENSING_OPTS = [CodeMotionOptimization, ReturnDeduplicator]


 def get_optimization_passes(arch, platform):
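Both new passes are registered in the default pass list above. A usage sketch, assuming a Linux binary that exports main; get_optimization_passes comes from this module, while the CFGFast/Decompiler keyword arguments reflect the angr API as commonly used and may vary across versions:

    import angr
    from angr.analyses.decompiler.optimization_passes import get_optimization_passes

    proj = angr.Project("/bin/true", auto_load_libs=False)
    cfg = proj.analyses.CFGFast(normalize=True)
    func = proj.kb.functions["main"]

    # Default pass list for this arch/platform; both new passes declare
    # ARCHES = None and PLATFORMS = None, so they should apply to any target.
    passes = get_optimization_passes(proj.arch, "linux")
    dec = proj.analyses.Decompiler(func, cfg=cfg.model, optimization_passes=passes)
    print(dec.codegen.text)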
angr/analyses/decompiler/optimization_passes/code_motion.py (new file)
@@ -0,0 +1,361 @@
+import itertools
+from typing import Tuple, List, Optional, Dict
+import logging
+
+from ailment import Block
+from ailment.statement import Jump, ConditionalJump, Statement, DirtyStatement
+import networkx as nx
+
+from angr.analyses.decompiler.optimization_passes.optimization_pass import OptimizationPass, OptimizationPassStage
+from angr.analyses.decompiler.block_similarity import is_similar, index_of_similar_stmts
+from angr.analyses.decompiler.block_io_finder import BlockIOFinder
+from angr.analyses.decompiler.utils import to_ail_supergraph, remove_labels, add_labels
+
+_l = logging.getLogger(name=__name__)
+
+
+class CodeMotionOptimization(OptimizationPass):
+    """
+    Moves common statements out of blocks that share the same predecessors or the same
+    successors. This is done to reduce the number of statements in a block and to make the
+    blocks more similar to each other.
+
+    As an example:
+    if (x) {
+        b = 2;
+        a = 1;
+        c = 3;
+    } else {
+        b = 2;
+        c = 3;
+    }
+
+    Will be turned into:
+    if (x) {
+        a = 1;
+    }
+    b = 2;
+    c = 3;
+
+    Current limitations (for very conservative operation):
+    - moving statements above conditional jumps is not supported
+    - only immediate children and parents are considered for moving statements
+    - when moving statements down, a block is only considered if it already has a matching statement at the end
+    """
+
+    ARCHES = None
+    PLATFORMS = None
+    NAME = "Merge common statements in sub-scopes"
+    STAGE = OptimizationPassStage.AFTER_GLOBAL_SIMPLIFICATION
+    DESCRIPTION = __doc__
+
+    def __init__(self, func, *args, max_iters=10, node_idx_start: int = 0, **kwargs):
+        super().__init__(func, *args, **kwargs)
+        self._node_idx_start = node_idx_start
+        self._max_optimization_runs = max_iters
+        self.analyze()
+
+    def _check(self):
+        return True, None
+
+    def _analyze(self, cache=None):
+        optimization_runs = 0
+        graph_copy = remove_labels(nx.DiGraph(self._graph))
+        updates = True
+        graph_changed = False
+        while optimization_runs < self._max_optimization_runs and updates:
+            optimization_runs += 1
+            super_graph = to_ail_supergraph(graph_copy)
+            updates, updated_blocks = self._move_common_code(super_graph)
+            if updates:
+                critical_fail = self.update_graph_with_super_edits(graph_copy, super_graph, updated_blocks)
+                if critical_fail:
+                    _l.error("Critical failure in updating graph with super edits, aborting")
+                    break
+                graph_changed = True
+
+        if graph_changed:
+            self.out_graph = add_labels(graph_copy)
+
+    @staticmethod
+    def update_graph_with_super_edits(
+        original_graph: nx.DiGraph, super_graph: nx.DiGraph, updated_blocks: Dict[Block, Block]
+    ) -> bool:
+        """
+        This function updates a graph when doing block edits on a supergraph version of that same graph.
+        The updated blocks must be provided as a dictionary where the keys are the original blocks in the
+        supergraph and the values are the new blocks that should replace them.
+
+        The supergraph MUST be generated using the to_ail_supergraph function, since it stores the original nodes
+        each super node represents. This is necessary to update the original graph with the new super nodes.
+        """
+        og_to_super = {}
+        for old_super, new_super in updated_blocks.items():
+            original_blocks = super_graph.nodes[old_super]["original_nodes"]
+            for original_block in original_blocks:
+                og_to_super[original_block] = new_super
+
+        for old_super, new_super in updated_blocks.items():
+            original_blocks = super_graph.nodes[old_super]["original_nodes"]
+            first_node_preds = []
+            last_node_preds = []
+            for original_block in original_blocks:
+                if original_block not in original_graph.nodes:
+                    return True
+
+                external_preds = [
+                    pred for pred in original_graph.predecessors(original_block) if pred not in original_blocks
+                ]
+                external_succs = [
+                    succ for succ in original_graph.successors(original_block) if succ not in original_blocks
+                ]
+                if external_preds:
+                    first_node_preds = external_preds
+                if external_succs:
+                    last_node_preds = external_succs
+
+            original_graph.remove_nodes_from(original_blocks)
+            original_graph.add_node(new_super)
+            for pred in first_node_preds:
+                original_graph.add_edge(og_to_super[pred] if pred in og_to_super else pred, new_super)
+            for succ in last_node_preds:
+                original_graph.add_edge(new_super, og_to_super[succ] if succ in og_to_super else succ)
+
+        return False
+
+    def _move_common_code(self, graph) -> Tuple[bool, Optional[Dict[Block, Block]]]:
+        """
+        Does two things at a high level:
+        1. rearranges code in blocks to maximize the number of similar statements at the end of the block
+        2. moves common code out of blocks
+
+        To understand the limitations of this approach, see the TODOs.
+        """
+        # TODO: how can you handle an odd-numbered switch case? or many blocks with the same child?
+        for b0, b1 in itertools.combinations(graph.nodes, 2):
+            if (
+                b0 is b1
+                or not b0.statements
+                or not b1.statements
+                or any(isinstance(stmt, DirtyStatement) for stmt in b0.statements + b1.statements)
+                or is_similar(b0, b1)
+            ):
+                continue
+
+            # TODO: add support for moving code to a shared parent block, which requires that we figure out how to
+            #   move code above conditional jumps. Hard since you need to know if the condition executes code.
+            # TODO: also, how do you deal with short-circuiting, which is a region parent, not just a block?
+
+            # target any blocks that have a shared child and move common code to the child
+            b0_succs = list(graph.successors(b0))
+            b1_succs = list(graph.successors(b1))
+            if (len(b0_succs) == len(b1_succs) == 1) and b0_succs[0] == b1_succs[0]:
+                common_succ = b0_succs[0]
+                common_succ_preds = list(graph.predecessors(common_succ))
+                # you can only safely move code to a child if all the common_succ's preds are the ones
+                # we are moving code from (2 nodes).
+                if all(csp in (b0, b1) for csp in common_succ_preds):
+                    success, updated_blocks = self._move_common_code_to_child(b0, b1, common_succ)
+                    if success:
+                        return True, updated_blocks
+
+        return False, None
+
+    def _move_common_code_to_parent(self, b0: Block, b1: Block, parent: Block):
+        # TODO: this function does not work yet because you need to figure out if you can move a stmt above
+        #   a conditional jump, which requires cross-block analysis
+        changed, new_b0, new_b1 = self._make_stmts_end_similar(b0, b1, up=True)
+        if not changed:
+            return False, None
+
+        # move the longest common prefix to the parent
+        new_b0_stmts = new_b0.statements
+        new_b1_stmts = new_b1.statements
+        common_len = 0
+        for idx, new_b0_stmt in enumerate(new_b0_stmts):
+            if not new_b0_stmt.likes(new_b1_stmts[idx]):
+                break
+            common_len += 1
+
+        if not common_len:
+            raise ValueError("No common statements found, this is unexpected")
+
+        common_stmts = [new_b0_stmts.pop(0) for _ in range(common_len)]
+        for _ in range(common_len):
+            new_b1_stmts.pop(0)
+
+        parent_stmts = parent.statements.copy() or []
+        if isinstance(parent_stmts[-1], (ConditionalJump, Jump)):
+            parent_stmts = parent_stmts[:-1] + common_stmts + [parent_stmts[-1]]
+        new_parent = parent.copy(statements=parent_stmts)
+
+        return True, {b0: new_b0, b1: new_b1, parent: new_parent}
+
+    def _move_common_code_to_child(self, b0: Block, b1: Block, child: Block):
+        changed, new_b0, new_b1 = self._make_stmts_end_similar(b0, b1, down=True)
+        if not changed:
+            return False, None
+
+        # move the longest common suffix to the child
+        new_b0_stmts = new_b0.statements
+        new_b1_stmts = new_b1.statements
+        common_len = 0
+        # start from the -1 index and go backwards
+        for idx in range(-1, -(min(len(new_b0_stmts), len(new_b1_stmts))) - 1, -1):
+            if not new_b0_stmts[idx].likes(new_b1_stmts[idx]):
+                break
+            common_len += 1
+
+        if not common_len:
+            raise ValueError("No common statements found, this is unexpected")
+
+        common_stmts = [new_b0_stmts.pop() for _ in range(common_len)]
+        for _ in range(common_len):
+            new_b1_stmts.pop()
+
+        child_stmts = child.statements.copy() or []
+        new_child = child.copy(statements=common_stmts[::-1] + child_stmts)
+
+        return True, {b0: new_b0, b1: new_b1, child: new_child}
+
+    def _make_stmts_end_similar(
+        self, b0: Block, b1: Block, up=False, down=False
+    ) -> Tuple[bool, Optional[Block], Optional[Block]]:
+        """
+        This algorithm attempts to rearrange two blocks to have the longest common sequence of statements
+        at either end of the blocks. It is flawed in that it currently only attempts this rearrangement
+        if the blocks have at least one matching statement at the end.
+
+        This algorithm iteratively removes statements from the ends of the blocks and then attempts to match
+        the ends of the blocks. It will only do this if one of the two ends has a matching statement in the other.
+        """
+        self._assert_up_or_down(up, down)
+        # copy the statements while filtering out statements that are not needed in the specific
+        # movement case (up or down)
+        curr_stmts = {}
+        for blk in (b0, b1):
+            new_stmts = blk.statements.copy()
+            if down:
+                last_stmt = new_stmts[-1]
+                if isinstance(last_stmt, Jump):
+                    new_stmts.pop()
+                elif isinstance(last_stmt, ConditionalJump):
+                    _l.warning("ConditionalJump at the end of block %s, this should never happen!", blk)
+                    return False, None, None
+
+            curr_stmts[blk] = new_stmts
+        if not curr_stmts[b0] or not curr_stmts[b1]:
+            return False, None, None
+
+        # attempt a swapping algorithm to maximize the number of similar statements at the end
+        changed = True
+        stmts_updated = False
+        matched_stmts = {b0: [], b1: []}
+        max_iters = len(curr_stmts[b0]) * len(curr_stmts[b1])
+        curr_iters = 0
+        while changed and curr_iters < max_iters:
+            changed = False
+            try_next_swap = False
+            for tgt0, tgt1 in ((b0, b1), (b1, b0)):
+                t0_stmts = curr_stmts[tgt0]
+                t1_stmts = curr_stmts[tgt1]
+                if not t0_stmts or not t1_stmts:
+                    break
+
+                if up:
+                    # maximize up
+                    while t0_stmts and t1_stmts:
+                        if t0_stmts[0].likes(t1_stmts[0]):
+                            matched_stmts[b0].append((t0_stmts.pop(0), 0))
+                            matched_stmts[b1].append((t1_stmts.pop(0), 0))
+                            try_next_swap = True
+                        else:
+                            break
+                    if not t0_stmts or not t1_stmts:
+                        break
+                elif down:
+                    # maximize down
+                    while t0_stmts and t1_stmts:
+                        if t0_stmts[-1].likes(t1_stmts[-1]):
+                            matched_stmts[b0].append((t0_stmts.pop(), -1))
+                            matched_stmts[b1].append((t1_stmts.pop(), -1))
+                            try_next_swap = True
+                        else:
+                            break
+                    if not t0_stmts or not t1_stmts:
+                        break
+
+                if not try_next_swap:
+                    continue
+
+                stmts_updated = True
+                swap_occurred, new_stmts = self._maximize_ends(t0_stmts, t1_stmts, up=up, down=down)
+                if swap_occurred:
+                    changed = True
+                    curr_stmts[b0], curr_stmts[b1] = new_stmts
+                    break
+
+                try_next_swap = True
+
+            curr_iters += 1
+            if curr_iters > max_iters:
+                raise ValueError("Exceeded max iterations, likely stuck in infinite loop")
+
+        # did any changes occur?
+        if not stmts_updated:
+            return False, None, None
+
+        # reconstruct the blocks and return them
+        new_blks = {}
+        for blk in (b0, b1):
+            new_stmts = curr_stmts[blk]
+            for stmt, idx in matched_stmts[blk][::-1]:
+                if idx == -1:
+                    new_stmts.append(stmt)
+                else:
+                    new_stmts.insert(idx, stmt)
+
+            new_blks[blk] = blk.copy(statements=new_stmts)
+
+        return True, new_blks[b0], new_blks[b1]
+
+    def _maximize_ends(
+        self, b0_stmts, b1_stmts, up=False, down=False
+    ) -> Tuple[bool, Tuple[List[Statement], List[Statement]]]:
+        self._assert_up_or_down(up, down)
+
+        similar_stmt = b0_stmts[0] if up else b0_stmts[-1]
+        idx_similar = index_of_similar_stmts([similar_stmt], b1_stmts)
+        if idx_similar is None or len(b1_stmts) == 1:
+            return False, (b0_stmts, b1_stmts)
+
+        target_stmt = b1_stmts[idx_similar]
+        success, new_b1_stmts = self._move_to_end(target_stmt, b1_stmts, up=up, down=down)
+        return (success and (b1_stmts != new_b1_stmts)), (b0_stmts, new_b1_stmts)
+
+    def _move_to_end(self, stmt, stmts, up=False, down=False) -> Tuple[bool, List[Statement]]:
+        """
+        Attempts to move a stmt to either the top or the bottom of stmts.
+        It does this by attempting to swap, 1 by 1, in either direction it is targeting.
+        """
+        new_stmts = stmts.copy()
+        stmt_idx = new_stmts.index(stmt)
+        swap_offset = -1 if up else 1
+        swap_order = range(stmt_idx + 1, len(new_stmts)) if down else range(stmt_idx - 1, -1, -1)
+        io_finder = BlockIOFinder(new_stmts, self.project)
+        for swap_pos in swap_order:
+            src_stmt = new_stmts[stmt_idx]
+            if io_finder.can_swap(src_stmt, new_stmts, 1 if down else -1):
+                new_stmts[stmt_idx], new_stmts[swap_pos] = new_stmts[swap_pos], new_stmts[stmt_idx]
+                stmt_idx += swap_offset
+            else:
+                return False, stmts
+
+        return True, new_stmts
+
+    @staticmethod
+    def _assert_up_or_down(up, down):
+        if up and down:
+            raise ValueError("Cannot maximize both up and down")
+        if not up and not down:
+            raise ValueError("Must maximize either up or down")
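For illustration, a minimal self-contained sketch of the suffix-sinking step that _move_common_code_to_child performs, with plain strings standing in for AIL statements; the real pass additionally reorders statements via _make_stmts_end_similar and validates every move with BlockIOFinder:

    def sink_common_suffix(b0, b1, child):
        # Length of the longest common suffix of the two sibling blocks.
        n = 0
        while n < min(len(b0), len(b1)) and b0[-1 - n] == b1[-1 - n]:
            n += 1
        if n == 0:
            return b0, b1, child
        # Strip the suffix from both siblings and prepend it to the shared child.
        return b0[:-n], b1[:-n], b0[len(b0) - n:] + child

    b0 = ["a = 1", "b = 2", "c = 3"]
    b1 = ["b = 2", "c = 3"]
    print(sink_common_suffix(b0, b1, ["return x"]))
    # (['a = 1'], [], ['b = 2', 'c = 3', 'return x'])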
angr/analyses/decompiler/optimization_passes/optimization_pass.py
@@ -335,6 +335,7 @@ class StructuringOptimizationPass(OptimizationPass):
         simp = self.project.analyses.AILSimplifier(
             self._func,
             func_graph=graph,
+            use_callee_saved_regs_at_return=False,
             gp=self._func.info.get("gp", None) if self.project.arch.name in {"MIPS32", "MIPS64"} else None,
         )
         return simp.func_graph if simp.simplified else graph
angr/analyses/decompiler/optimization_passes/stack_canary_simplifier.py
@@ -178,24 +178,36 @@ class StackCanarySimplifier(OptimizationPass):
         # Done!

     def _find_canary_init_stmt(self):
-        first_block = self._get_block(self._func.addr)
-        if first_block is None:
-            return None
-
-        for idx, stmt in enumerate(first_block.statements):
-            if (
-                isinstance(stmt, ailment.Stmt.Store)
-                and isinstance(stmt.addr, ailment.Expr.StackBaseOffset)
-                and isinstance(stmt.data, ailment.Expr.Load)
-                and self._is_add(stmt.data.addr)
-            ):
-                # Check addr: must be fs+0x28
-                op0, op1 = stmt.data.addr.operands
-                if isinstance(op1, ailment.Expr.Register):
-                    op0, op1 = op1, op0
-                if isinstance(op0, ailment.Expr.Register) and isinstance(op1, ailment.Expr.Const):
-                    if op0.reg_offset == self.project.arch.get_register_offset("fs") and op1.value == 0x28:
-                        return first_block, idx
+        block_addr = self._func.addr
+        traversed = set()
+
+        while True:
+            traversed.add(block_addr)
+            first_block = self._get_block(block_addr)
+            if first_block is None:
+                break
+
+            for idx, stmt in enumerate(first_block.statements):
+                if (
+                    isinstance(stmt, ailment.Stmt.Store)
+                    and isinstance(stmt.addr, ailment.Expr.StackBaseOffset)
+                    and isinstance(stmt.data, ailment.Expr.Load)
+                    and self._is_add(stmt.data.addr)
+                ):
+                    # Check addr: must be fs+0x28
+                    op0, op1 = stmt.data.addr.operands
+                    if isinstance(op1, ailment.Expr.Register):
+                        op0, op1 = op1, op0
+                    if isinstance(op0, ailment.Expr.Register) and isinstance(op1, ailment.Expr.Const):
+                        if op0.reg_offset == self.project.arch.get_register_offset("fs") and op1.value == 0x28:
+                            return first_block, idx
+
+            succs = list(self._graph.successors(first_block))
+            if len(succs) == 1:
+                block_addr = succs[0].addr
+                if block_addr not in traversed:
+                    continue
+            break

         return None

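The rewrite generalizes the canary-initialization search: instead of inspecting only the function's first block, it follows a chain of single successors from the entry block, with a traversed set guarding against loops. A generic sketch of that traversal pattern, where get_block, successors, and matches are hypothetical callables supplied by the caller:

    def walk_single_successor_chain(entry_addr, get_block, successors, matches):
        # Scan statements block by block along a single-successor chain,
        # guarding against loops with a traversed set.
        addr, traversed = entry_addr, set()
        while addr is not None and addr not in traversed:
            traversed.add(addr)
            block = get_block(addr)
            if block is None:
                return None
            for idx, stmt in enumerate(block.statements):
                if matches(stmt):
                    return block, idx
            succs = successors(block)
            addr = succs[0].addr if len(succs) == 1 else None
        return None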
angr/analyses/decompiler/optimization_passes/switch_default_case_duplicator.py (new file)
@@ -0,0 +1,110 @@
+# pylint:disable=too-many-boolean-expressions
+from itertools import count
+import logging
+
+import networkx
+
+from angr.knowledge_plugins.cfg import IndirectJumpType
+from .optimization_pass import OptimizationPass, OptimizationPassStage
+
+
+_l = logging.getLogger(name=__name__)
+
+
+def s2u(s, bits):
+    if s > 0:
+        return s
+    return (1 << bits) + s
+
+
+class SwitchDefaultCaseDuplicator(OptimizationPass):
+    """
+    For each switch-case construct (identified by jump tables), duplicate the default-case node when we detect
+    situations where the default-case node is seemingly reused by edges outside the switch-case construct. This code
+    reuse is usually caused by compiler code deduplication.
+
+    Ideally this pass should be implemented as an ISC optimization reversion.
+    """
+
+    ARCHES = None
+    PLATFORMS = None
+    STAGE = OptimizationPassStage.BEFORE_REGION_IDENTIFICATION
+    NAME = "Duplicate default-case nodes to undo default-case node reuse caused by compiler code deduplication"
+    DESCRIPTION = __doc__.strip()
+
+    def __init__(self, func, **kwargs):
+        super().__init__(func, **kwargs)
+
+        self.node_idx = count(start=0)
+
+        self.analyze()
+
+    def _check(self):
+        jumptables = self.kb.cfgs.get_most_accurate().jump_tables
+        switch_jump_block_addrs = {
+            jumptable.addr
+            for jumptable in jumptables.values()
+            if jumptable.type
+            in {IndirectJumpType.Jumptable_AddressComputed, IndirectJumpType.Jumptable_AddressLoadedFromMemory}
+        }
+        jump_node_addrs = self._func.block_addrs_set.intersection(switch_jump_block_addrs)
+        if not jump_node_addrs:
+            return False, None
+
+        default_case_node_addrs = set()
+        for node_addr in jump_node_addrs:
+            node = self._func.get_node(node_addr)
+            if self._func.graph.in_degree[node] == 1:
+                pred = list(self._func.graph.predecessors(node))[0]
+                if self._func.graph.out_degree[pred] == 2:
+                    default_case_node = next(
+                        iter(nn for nn in self._func.graph.successors(pred) if nn.addr != node_addr)
+                    )
+                    if self._func.graph.out_degree[default_case_node] == 1:
+                        default_case_node_addrs.add((pred.addr, node_addr, default_case_node.addr))
+
+        if not default_case_node_addrs:
+            return False, None
+
+        cache = {"default_case_node_addrs": default_case_node_addrs}
+        return True, cache
+
+    def _analyze(self, cache=None):
+
+        default_case_node_addrs = cache["default_case_node_addrs"]
+
+        out_graph = None
+
+        for switch_head_addr, jump_node_addr, default_addr in default_case_node_addrs:
+            default_case_node = self._func.get_node(default_addr)
+            unexpected_pred_addrs = {
+                pred.addr
+                for pred in self._func.graph.predecessors(default_case_node)
+                if pred.addr not in {switch_head_addr, jump_node_addr}
+            }
+            if unexpected_pred_addrs:
+                default_case_block = self._get_block(default_addr)
+                default_case_succ_block = list(self._graph.successors(default_case_block))[0]
+
+                jump_nodes = self._get_blocks(jump_node_addr)
+                jump_node_descendants = set()
+                for jump_node in jump_nodes:
+                    jump_node_descendants |= networkx.descendants(self._graph, jump_node)
+
+                # duplicate default_case_node for each unexpected predecessor
+                for unexpected_pred_addr in unexpected_pred_addrs:
+                    for unexpected_pred in self._get_blocks(unexpected_pred_addr):
+                        # is this predecessor reachable from the jump node? if so, we believe this is a legitimate
+                        # edge and do not duplicate it.
+                        if unexpected_pred in jump_node_descendants:
+                            continue
+
+                        default_case_block_copy = default_case_block.copy()
+                        default_case_block_copy.idx = next(self.node_idx)
+                        if out_graph is None:
+                            out_graph = self._graph
+                        out_graph.remove_edge(unexpected_pred, default_case_block)
+                        out_graph.add_edge(unexpected_pred, default_case_block_copy)
+                        out_graph.add_edge(default_case_block_copy, default_case_succ_block)
+
+        self.out_graph = out_graph
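The s2u helper maps a signed integer to its two's-complement unsigned encoding at a given bit width (note that, as written, s == 0 also takes the 1 << bits branch). A few examples:

    assert s2u(5, 32) == 5
    assert s2u(-1, 32) == 0xFFFFFFFF
    assert s2u(-0x28, 64) == 0xFFFFFFFFFFFFFFD8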