PyPI - angr - Versions diffs - 9.2.156__cp310-cp310-manylinux2014_aarch64.whl → 9.2.157__cp310-cp310-manylinux2014_aarch64.whl - Mend

angr 9.2.156__cp310-cp310-manylinux2014_aarch64.whl → 9.2.157__cp310-cp310-manylinux2014_aarch64.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of angr might be problematic. Click here for more details.

Files changed (34)

angr/__init__.py +1 -1
angr/analyses/cfg/cfg_base.py +87 -71
angr/analyses/cfg/cfg_fast.py +5 -0
angr/analyses/decompiler/clinic.py +182 -104
angr/analyses/decompiler/decompiler.py +11 -0
angr/analyses/decompiler/dephication/graph_vvar_mapping.py +1 -1
angr/analyses/decompiler/structured_codegen/c.py +18 -5
angr/analyses/disassembly.py +5 -11
angr/analyses/s_propagator.py +2 -4
angr/analyses/stack_pointer_tracker.py +3 -7
angr/analyses/typehoon/simple_solver.py +3 -3
angr/analyses/variable_recovery/engine_base.py +2 -8
angr/analyses/variable_recovery/variable_recovery.py +4 -3
angr/calling_conventions.py +3 -3
angr/engines/hook.py +1 -1
angr/engines/icicle.py +229 -0
angr/engines/pcode/behavior.py +1 -4
angr/engines/pcode/emulate.py +1 -4
angr/engines/pcode/lifter.py +2 -10
angr/engines/vex/claripy/irop.py +2 -2
angr/knowledge_plugins/functions/function.py +18 -10
angr/knowledge_plugins/functions/function_manager.py +68 -5
angr/knowledge_plugins/variables/variable_manager.py +15 -3
angr/rustylib.cpython-310-aarch64-linux-gnu.so +0 -0
angr/sim_variable.py +31 -0
angr/storage/memory_mixins/address_concretization_mixin.py +2 -2
angr/storage/memory_mixins/convenient_mappings_mixin.py +1 -1
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/METADATA +7 -8
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/RECORD +33 -33
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/WHEEL +1 -1
angr/rustylib.pyi +0 -165
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/entry_points.txt +0 -0
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/licenses/LICENSE +0 -0
{angr-9.2.156.dist-info → angr-9.2.157.dist-info}/top_level.txt +0 -0

angr/__init__.py CHANGED Viewed

@@ -2,7 +2,7 @@
 # pylint: disable=wrong-import-position
 from __future__ import annotations
-__version__ = "9.2.156"
+__version__ = "9.2.157"
 if bytes is str:
     raise Exception(

angr/analyses/cfg/cfg_base.py CHANGED Viewed

@@ -1147,7 +1147,8 @@ class CFGBase(Analysis):
         graph = self.graph
         smallest_nodes = {}  # indexed by end address of the node
-        end_addresses_to_nodes = defaultdict(set)
+        end_addr_to_node = {}  # a dictionary from node key to node *if* only one node exists for the key
+        end_addr_to_nodes = defaultdict(list)  # a dictionary from node key to nodes *if* more than one node exist
         for n in graph.nodes():
             if n.is_simprocedure:
@@ -1155,76 +1156,89 @@ class CFGBase(Analysis):
             end_addr = n.addr + n.size
             key = (end_addr, n.callstack_key)
             # add the new item
-            end_addresses_to_nodes[key].add(n)
-        for key in list(end_addresses_to_nodes.keys()):
-            if len(end_addresses_to_nodes[key]) == 1:
-                smallest_nodes[key] = next(iter(end_addresses_to_nodes[key]))
-                del end_addresses_to_nodes[key]
+            if key not in end_addr_to_node:
+                # this is the first node of this key
+                end_addr_to_node[key] = n
+            else:
+                # this is the 2nd+ node of this key
+                if key not in end_addr_to_nodes:
+                    end_addr_to_nodes[key].append(end_addr_to_node[key])
+                end_addr_to_nodes[key].append(n)
+        # update smallest_nodes
+        for key, node in end_addr_to_node.items():
+            if key in end_addr_to_nodes:
+                continue
+            smallest_nodes[key] = node
+        del end_addr_to_node  # micro memory optimization
-        while end_addresses_to_nodes:
+        while end_addr_to_nodes:
             key_to_find = (None, None)
-            for tpl, x in end_addresses_to_nodes.items():
-                if len(x) > 1:
-                    key_to_find = tpl
-                    break
+            for tpl in list(end_addr_to_nodes):
+                x = end_addr_to_nodes[tpl]
+                if len(x) <= 1:
+                    continue
+                key_to_find = tpl
-            end_addr, callstack_key = key_to_find
-            all_nodes = end_addresses_to_nodes[key_to_find]
+                end_addr, callstack_key = key_to_find
+                all_nodes = end_addr_to_nodes[key_to_find]
-            all_nodes = sorted(all_nodes, key=lambda node: node.addr, reverse=True)
-            smallest_node = all_nodes[0]  # take the one that has the highest address
-            other_nodes = all_nodes[1:]
+                all_nodes = sorted(all_nodes, key=lambda node: node.addr, reverse=True)
+                smallest_node = all_nodes[0]  # take the one that has the highest address
+                other_nodes = all_nodes[1:]
-            self._normalize_core(
-                graph, callstack_key, smallest_node, other_nodes, smallest_nodes, end_addresses_to_nodes
-            )
+                self._normalize_core(
+                    graph, callstack_key, smallest_node, other_nodes, smallest_nodes, end_addr_to_nodes
+                )
-            del end_addresses_to_nodes[key_to_find]
-            # make sure the smallest node is stored in end_addresses
-            smallest_nodes[key_to_find] = smallest_node
-            # corner case
-            # sometimes two overlapping blocks may not be ending at the instruction. this might happen when one of the
-            # blocks (the bigger one) hits the instruction count limit or bytes limit before reaching the end address
-            # of the smaller block. in this case we manually pick up those blocks.
-            if not end_addresses_to_nodes:
-                # find if there are still overlapping blocks
-                sorted_smallest_nodes = defaultdict(list)  # callstack_key is the key of this dict
-                for k, node in smallest_nodes.items():
-                    _, callstack_key = k
-                    sorted_smallest_nodes[callstack_key].append(node)
-                for k in sorted_smallest_nodes:
-                    sorted_smallest_nodes[k] = sorted(sorted_smallest_nodes[k], key=lambda node: node.addr)
-                for callstack_key, lst in sorted_smallest_nodes.items():
-                    lst_len = len(lst)
-                    for i, node in enumerate(lst):
-                        if i == lst_len - 1:
-                            break
-                        next_node = lst[i + 1]
-                        if node is not next_node and node.addr <= next_node.addr < node.addr + node.size:
-                            # umm, those nodes are overlapping, but they must have different end addresses
-                            nodekey_a = node.addr + node.size, callstack_key
-                            nodekey_b = next_node.addr + next_node.size, callstack_key
-                            if nodekey_a == nodekey_b:
-                                # error handling: this will only happen if we have completely overlapping nodes
-                                # caused by different jumps (one of the jumps is probably incorrect), which usually
-                                # indicates an error in CFG recovery. we print a warning and skip this node
-                                l.warning(
-                                    "Found completely overlapping nodes %s. It usually indicates an error in CFG "
-                                    "recovery. Skip.",
-                                    node,
-                                )
-                                continue
-                            if nodekey_a in smallest_nodes and nodekey_b in smallest_nodes:
-                                # misuse end_addresses_to_nodes
-                                end_addresses_to_nodes[(node.addr + node.size, callstack_key)].add(node)
-                                end_addresses_to_nodes[(node.addr + node.size, callstack_key)].add(next_node)
-                            smallest_nodes.pop(nodekey_a, None)
-                            smallest_nodes.pop(nodekey_b, None)
+                del end_addr_to_nodes[key_to_find]
+                # make sure the smallest node is stored in end_addresses
+                smallest_nodes[key_to_find] = smallest_node
+                # corner case
+                # sometimes two overlapping blocks may not end at the instruction. this might happen when one of the
+                # blocks (the bigger one) hits the instruction count limit or bytes limit before reaching the end
+                # address of the smaller block. in this case we manually pick up those blocks.
+                if not end_addr_to_nodes:
+                    # find if there are still overlapping blocks
+                    sorted_smallest_nodes = defaultdict(list)  # callstack_key is the key of this dict
+                    for k, node in smallest_nodes.items():
+                        _, callstack_key = k
+                        sorted_smallest_nodes[callstack_key].append(node)
+                    for k in sorted_smallest_nodes:
+                        sorted_smallest_nodes[k] = sorted(sorted_smallest_nodes[k], key=lambda node: node.addr)
+                    for callstack_key, lst in sorted_smallest_nodes.items():
+                        lst_len = len(lst)
+                        for i, node in enumerate(lst):
+                            if i == lst_len - 1:
+                                break
+                            next_node = lst[i + 1]
+                            if node is not next_node and node.addr <= next_node.addr < node.addr + node.size:
+                                # umm, those nodes are overlapping, but they must have different end addresses
+                                nodekey_a = node.addr + node.size, callstack_key
+                                nodekey_b = next_node.addr + next_node.size, callstack_key
+                                if nodekey_a == nodekey_b:
+                                    # error handling: this will only happen if we have completely overlapping nodes
+                                    # caused by different jumps (one of the jumps is probably incorrect), which usually
+                                    # indicates an error in CFG recovery. we print a warning and skip this node
+                                    l.warning(
+                                        "Found completely overlapping nodes %s. It usually indicates an error in CFG "
+                                        "recovery. Skip.",
+                                        node,
+                                    )
+                                    continue
+                                if nodekey_a in smallest_nodes and nodekey_b in smallest_nodes:
+                                    # misuse end_addresses_to_nodes
+                                    key = node.addr + node.size, callstack_key
+                                    if node not in end_addr_to_nodes[key]:
+                                        end_addr_to_nodes[key].append(node)
+                                    if next_node not in end_addr_to_nodes[key]:
+                                        end_addr_to_nodes[key].append(next_node)
+                                smallest_nodes.pop(nodekey_a, None)
+                                smallest_nodes.pop(nodekey_b, None)
         self.normalized = True
@@ -1235,7 +1249,7 @@ class CFGBase(Analysis):
         smallest_node,
         other_nodes,
         smallest_nodes,
-        end_addresses_to_nodes,
+        end_addr_to_nodes,
     ):
         # Break other nodes
         for n in other_nodes:
@@ -1254,8 +1268,8 @@ class CFGBase(Analysis):
             # the logic below is a little convoluted. we check if key exists in either end_address_to_nodes or
             # smallest_nodes, since we don't always add the new node back to end_addresses_to_nodes dict - we only do so
             # when there are more than one node with that key.
-            if key in end_addresses_to_nodes:
-                new_node = next((i for i in end_addresses_to_nodes[key] if i.addr == n.addr), None)
+            if key in end_addr_to_nodes:
+                new_node = next((i for i in end_addr_to_nodes[key] if i.addr == n.addr), None)
             if new_node is None and key in smallest_nodes and smallest_nodes[key].addr == n.addr:
                 new_node = smallest_nodes[key]
@@ -1304,8 +1318,10 @@ class CFGBase(Analysis):
                 # Put the new node into end_addresses list
                 if key in smallest_nodes:
-                    end_addresses_to_nodes[key].add(smallest_nodes[key])
-                    end_addresses_to_nodes[key].add(new_node)
+                    if smallest_nodes[key] not in end_addr_to_nodes[key]:
+                        end_addr_to_nodes[key].append(smallest_nodes[key])
+                    if new_node not in end_addr_to_nodes[key]:
+                        end_addr_to_nodes[key].append(new_node)
                 else:
                     smallest_nodes[key] = new_node
@@ -1936,7 +1952,7 @@ class CFGBase(Analysis):
                     # skip empty blocks (that are usually caused by lifting failures)
                     continue
                 block = func_0.get_block(block_node.addr, block_node.size)
-                if block.vex.jumpkind not in ("Ijk_Boring", "Ijk_InvalICache"):
+                if block.vex_nostmt.jumpkind not in ("Ijk_Boring", "Ijk_InvalICache"):
                     continue
                 # Skip alignment blocks
                 if self._is_noop_block(self.project.arch, block):

angr/analyses/cfg/cfg_fast.py CHANGED Viewed

@@ -2841,6 +2841,11 @@ class CFGFast(ForwardAnalysis[CFGNode, CFGNode, CFGJob, int], CFGBase):  # pylin
     def _process_irsb_data_refs(self, irsb_addr, data_refs):
         assumption = self._decoding_assumptions.get(irsb_addr & ~1)
         for ref in data_refs:
+            # data_addr + data_size might overflow; we ignore such cases
+            max_addr = 0xFFFF_FFFF if self.project.arch.bits == 32 else 0xFFFF_FFFF_FFFF_FFFF
+            if ref.data_addr + ref.data_size > max_addr:
+                continue
             if ref.data_type_str == "integer(store)":
                 data_type_str = "integer"
                 is_store = True