reait 0.0.19__py3-none-any.whl → 1.0.0__py3-none-any.whl
This diff represents the content of two publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the versions as they appear in the public registry.
- reait/__init__.py +2 -0
- reait/api.py +523 -218
- reait/main.py +265 -295
- {reait-0.0.19.dist-info → reait-1.0.0.dist-info}/METADATA +40 -51
- reait-1.0.0.dist-info/RECORD +9 -0
- {reait-0.0.19.dist-info → reait-1.0.0.dist-info}/WHEEL +1 -1
- reait-0.0.19.dist-info/RECORD +0 -9
- {reait-0.0.19.dist-info → reait-1.0.0.dist-info}/LICENSE +0 -0
- {reait-0.0.19.dist-info → reait-1.0.0.dist-info}/entry_points.txt +0 -0
- {reait-0.0.19.dist-info → reait-1.0.0.dist-info}/top_level.txt +0 -0
reait/api.py
CHANGED
@@ -1,349 +1,654 @@
-
-from __future__ import print_function
+# -*- coding: utf-8 -*-
+from __future__ import print_function, annotations
+
+import json
+import tomli
+import logging
+import requests
+
 from hashlib import sha256
-from
+from datetime import datetime
+
 from sklearn.metrics.pairwise import cosine_similarity
-import
-import
-import
-import
-from numpy import array, vstack, mean, average, dot, arccos, pi
+from os import access, R_OK
+from os.path import basename, isfile, expanduser, getsize
+from requests import request, Response, HTTPError
+from numpy import array, vstack, dot, arccos, pi
 from pandas import DataFrame
-import
-import tomli
-from os.path import isfile
-from sys import exit
-from IPython import embed
-import lief
+from lief import parse, Binary, ELF, PE, MachO

-__version__ = "0.0
+__version__ = "1.0.0"

 re_conf = {
-
-
-
+    "apikey": "l1br3",
+    "host": "https://api.reveng.ai",
+    "model": "binnet-0.3-x86",
 }

-def reveng_req(r: requests.request, end_point: str, data=None, ex_headers: dict = None, params=None):
-    url = f"{re_conf['host']}/{end_point}"
-    headers = { "Authorization": f"{re_conf['apikey']}" }
-    if ex_headers:
-        headers.update(ex_headers)
-    return r(url, headers=headers, data=data, params=params)

+logger = logging.getLogger("REAIT")
+
+
+class ReaitError(HTTPError):
+    def __init__(self, reason: str, end_point: str = None):
+        response = Response()
+
+        response.reason = reason
+        response.status_code = 404
+        response._content = b'{"success": false, "error": "' + reason.encode() + b'"}'
+        response.url = f"{re_conf['host']}/{end_point if end_point[0] != '/' else end_point[1:]}" if end_point else None
+
+        super().__init__(reason, response=response)

-
+
+def reveng_req(r: request, end_point: str, data: dict = None, ex_headers: dict = None,
+               params: dict = None, json_data: dict = None, timeout: int = 60, files: dict = None) -> Response:
     """
-
+    Constructs and sends a Request
+    :param r: Method for the new Request
+    :param end_point: Endpoint to add to the base URL
+    :param ex_headers: Extended HTTP headers to add
+    :param data: Dictionary, list of tuples, bytes, or file-like object to send in the body
+    :param params: Dictionary, list of tuples or bytes to send in the query string for the query string
+    :param json_data: A JSON serializable Python object to send in the body
+    :param timeout: Number of seconds to stop waiting for a Response
+    :param files: Dictionary of files to send to the specified URL
     """
-
-
-
-    if
-
-
-
+    url = f"{re_conf['host']}/{end_point if end_point[0] != '/' else end_point[1:]}"
+    headers = {"Authorization": re_conf["apikey"]}
+
+    if ex_headers:
+        headers.update(ex_headers)
+
+    logger.debug("Making %s request %s:\n - headers: %s\n - data: %s\n - json_data: %s\n - params: %s\n - files: %s",
+                 r.__name__.upper(), url, headers, data, json_data, params, files)
+
+    response: Response = r(url, headers=headers, json=json_data, data=data, params=params, timeout=timeout, files=files)
+
+    logger.debug("Making %s response %s:\n - headers: %s\n - status_code: %d\n - content: %s",
+                 r.__name__.upper(), url, response.headers, response.status_code, response.text)
+
+    return response
+
+
+def re_hash_check(bin_id: str) -> bool:
+    res: Response = reveng_req(requests.get, "v1/search", json_data={"sha_256_hash": bin_id})
+
+    if res.ok:
+        return any(binary["sha_256_hash"] == bin_id for binary in res.json()["query_results"])
     else:
-
-        return
+        logger.warning("Bad Request: %s", res.text)

+    return False

-def RE_analyse(fpath: str, model: str = None, isa_options: str = None, platform_options: str = None, file_options: str = None, dynamic_execution: bool = False, command_line_args: str = None, scope: str = None, tags: str = None):
-    """
-    Start analysis job for binary file
-    """
-    filename = os.path.basename(fpath)
-    params={ 'file_name': filename }
-    for p_name in ('model', 'isa_options', 'platform_options', 'file_options', 'dynamic_execution', 'command_line_args', 'scope', 'tags'):
-        p_value = locals()[p_name]
-        if p_value:
-            params[p_name] = p_value

-
-
-
-
-
+# Bin_id is referred to as hash in this program - to maintain usage BID = id of a binary bin_id = hash
+# Assumes a file has been passed, correct hash only
+# Returns the BID of the binary_id (hash)
+def re_bid_search(bin_id: str) -> int:
+    res: Response = reveng_req(requests.get, "v1/search", json_data={"sha_256_hash": bin_id})

-
-
-
-
-
+    bid = -1
+
+    if res.ok:
+        # Filter the result who matches the SHA-256
+        binaries = list(filter(lambda binary: binary["sha_256_hash"] == bin_id, res.json()["query_results"]))
+
+        # Check only one record is returned
+        if len(binaries) == 1:
+            binary = binaries[0]
+            bid = binary["binary_id"]
+
+            logger.info("Only one record exists, selecting - ID: %d, Name: %s, Creation: %s, Model: %s, Status: %s",
+                        bid, binary["binary_name"], binary["creation"], binary["model_name"], binary["status"])
+        elif len(binaries) > 1:
+            binaries.sort(key=lambda binary: datetime.fromisoformat(binary["creation"]).timestamp(), reverse=True)
+
+            logger.info("%d matches found for hash: %s", len(binaries), bin_id)
+
+            options_dict = {}
+
+            for idx, binary in enumerate(binaries):
+                logger.info("[%d] - ID: %d, Name: %s, Creation: %s, Model: %s, Status: %s",
+                            idx, binary["binary_id"], binary["binary_name"], binary["creation"],
+                            binary["model_name"], binary["status"])
+
+                options_dict[idx] = binary["binary_id"]
+
+            try:
+                user_input = input("[+] Please enter the option you want to use for this operation:")
+
+                option_number = int(user_input)
+
+                bid = options_dict.get(option_number, -1)
+
+                if bid == -1:
+                    logger.warning("Invalid option.")
+            except Exception:
+                bid = options_dict[0]
+                logger.warning("Select the most recent analysis - ID: %d", bid)
+        else:
+            logger.warning("No matches found for hash: %s", bin_id)
+    else:
+        logger.warning("Bad Request: %s", res.text)

     res.raise_for_status()
+    return bid


-def
+def RE_delete(fpath: str, binary_id: int = 0) -> Response:
     """
-
+    Delete analysis results for Binary ID in command
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
     """
-
-    if
-        print("[+] Successfully uploaded binary to your account.")
-        print(f"[+] {fpath} - {binary_id(fpath)}")
-        return res
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id

-
-
-
-
+    end_point = f"v1/analyse/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.delete, end_point)
+
+    if res.ok:
+        logger.info("Securely deleted analysis ID %s - %s.", bid, bin_id)
+    elif res.status_code == 404:
+        logger.warning("Error analysis not found for ID %s - %s.", bid, bin_id)
+    else:
+        logger.error("Error deleting binary %s under. Server returned %d.", bin_id, res.status_code)

     res.raise_for_status()
+    return res
+
+
+def RE_analyse(fpath: str, model_name: str = None, isa_options: str = None,
+               platform_options: str = None, file_options: str = None, dynamic_execution: bool = False,
+               command_line_args: str = None, binary_scope: str = None, tags: list = None, priority: int = 0,
+               duplicate: bool = False, symbols: dict = None, debug_fpath: str = None) -> Response:
+    """
+    Start analysis job for binary file
+    :param fpath: File path for binary to analyse
+    :param model_name: Binary model name
+    :param isa_options: Executable ISA
+    :param file_options: File options
+    :param platform_options: OS platform
+    :param dynamic_execution: Enable dynamic execution in sandbox during analysis
+    :param command_line_args: Command line arguments to pass when running binary sample in the sandbox
+    :param binary_scope: Analysis visibility
+    :param tags: Assign tags to an analysis
+    :param priority: Priority to processing queue
+    :param duplicate: Duplicate an existing binary
+    :param symbols: JSON object containing the base address and the list of functions
+    :param debug_fpath: File path for debug file
+    """
+    bin_id = re_binary_id(fpath)
+    result = re_hash_check(bin_id)
+
+    end_point = "v1/analyse/"
+
+    if result and duplicate is False:
+        logger.error("Error, duplicate analysis for %s. To upload again, use the --duplicate flag.",
+                     bin_id)
+        raise ReaitError(f"Duplicate analysis for hash: {bin_id}", end_point)
+
+    filename = basename(fpath)
+
+    params = {"file_name": filename, "size_in_bytes": getsize(fpath), "sha_256_hash": bin_id,}
+
+    if debug_fpath and isfile(debug_fpath) and access(debug_fpath, R_OK):
+        try:
+            debug = RE_upload(debug_fpath).json()
+
+            if debug["success"]:
+                params["debug_hash"] = debug["sha_256_hash"]
+        except HTTPError:
+            pass
+
+    for p_name in ("model_name", "isa_options", "platform_options", "file_options",
+                   "dynamic_execution", "command_line_args", "binary_scope", "tags", "priority", "symbols",):
+        p_value = locals()[p_name]
+
+        if p_value:
+            params[p_name] = p_value

+    res: Response = reveng_req(requests.post, end_point, json_data=params)

-
-
-
-
-
-    res = reveng_req(requests.get, f"embeddings/{binary_id(fpath)}", params=params)
-    if res.status_code == 400:
-        print(f"[-] Analysis for {binary_id(fpath)} still in progress. Please check the logs (-l) and try again later.")
+    if res.ok:
+        logger.info("Successfully submitted binary for analysis. %s - %s", fpath, bin_id)
+    elif res.status_code == 400:
+        if "error" in res.json().keys():
+            logger.warning("Error analysing %s - %s", fpath, res.json()["error"])

     res.raise_for_status()
-    return res
+    return res


-def
+def RE_upload(fpath: str) -> Response:
     """
-
+    Upload binary to Server
+    :param fpath: File path for binary to analyse
     """
-
-
-
-
+    bin_id = re_binary_id(fpath)
+    result = re_hash_check(bin_id)
+
+    if result:
+        logger.info("File %s - %s already uploaded. Skipping upload...", fpath, bin_id)
+
+        res = Response()
+        res.status_code = 200
+        res.url = f"{re_conf['host']}/v1/upload"
+        res._content = ('{0}"success": true,'
+                        '"message": "File already uploaded!",'
+                        '"sha_256_hash": "{1}"{2}').format("{", bin_id, "}").encode()
+    else:
+        with open(fpath, "rb") as fd:
+            res: Response = reveng_req(requests.post, "v1/upload", files={"file": fd})
+
+        if res.ok:
+            logger.info("Successfully uploaded binary to your account. %s - %s", fpath, bin_id)
+        elif res.status_code == 400:
+            if "error" in res.json().keys():
+                logger.warning("Error uploading %s - %s", fpath, res.json()["error"])
+        elif res.status_code == 413:
+            logger.warning("File too large. Please upload files under 10MB.")
+        elif res.status_code == 500:
+            logger.error("Internal Server Error. Please contact support. Skipping upload...")

     res.raise_for_status()
-    return res
+    return res


-def
+def RE_embeddings(fpath: str, binary_id: int = 0) -> Response:
     """
-
+    Fetch symbol embeddings
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
     """
-
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id

-
-        params['end_vaddr']: end_vaddr
-    if base_vaddr:
-        params['base_vaddr']: base_vaddr
-    if model:
-        params['model']: model
+    end_point = f"v1/embeddings/binary/{bid}"

-
-
-
-
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    if res.status_code == 400:
+        logger.warning("Analysis for %s still in progress. Please check the logs (-l) and try again later.",
+                       bin_id)

     res.raise_for_status()
-    return res
+    return res


-def RE_logs(fpath: str,
+def RE_logs(fpath: str, binary_id: int = 0, console: bool = True) -> Response:
     """
-
+    Get the logs for an analysis associated to Binary ID in command
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
+    :param console: Show response in console
     """
-    bin_id =
-
-
-
-
-
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id
+
+    end_point = f"v1/logs/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    if res.ok and console:
+        logger.info("Logs found for %s:\n%s", bin_id, res.json()["logs"])
     elif res.status_code == 404:
-
-        return
+        logger.warning("Error, logs not found for %s.", bin_id)

     res.raise_for_status()
+    return res


-def RE_cves(fpath: str,
+def RE_cves(fpath: str, binary_id: int = 0) -> Response:
     """
-
+    Check for known CVEs in Binary
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
     """
-    bin_id =
-
-
-
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id
+
+    end_point = f"cves/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    if res.ok:
         cves = json.loads(res.text)
-
+        logger.info("Checking for known CVEs embedded inside %s", fpath)
+
         if len(cves) == 0:
-
+            logger.info("0 CVEs found.")
         else:
-
-            print_json(data=cves)
-        return
+            logger.warning("Warning CVEs found!\n%s", res.text)
     elif res.status_code == 404:
-
-        return
+        logger.warning("Error, binary analysis not found for %s.", bin_id)

     res.raise_for_status()
+    return res

-
+
+def RE_status(fpath: str, binary_id: int = 0, console: bool = False) -> Response:
     """
-
+    Get the status of an ongoing binary analysis
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
     """
-    bin_id =
-
-
-
-
-
-
-
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id
+
+    end_point = f"v1/analyse/status/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    if res.ok and console:
+        logger.info("Binary analysis status: %s", res.json()["status"])
+    if res.status_code == 400:
+        logger.warning(" Error, status not found for %s.", bin_id)

     res.raise_for_status()
+    return res


-def RE_compute_distance(embedding: list, embeddings: list, nns: int = 5):
+def RE_compute_distance(embedding: list, embeddings: list, nns: int = 5) -> list:
     """
-
+    Compute the cosine distance between source embedding and embedding from binary
+    :param embedding: Embedding vector as python list
+    :param embeddings: Symbol embeddings
+    :param nns: Number of nearest neighbors
     """
     df = DataFrame(data=embeddings)
     np_embedding = array(embedding).reshape(1, -1)
-    source_embeddings = vstack(df[
+    source_embeddings = vstack(df["embedding"].values)
     closest = cosine_similarity(source_embeddings, np_embedding).squeeze().argsort()[::-1][:nns]
     distances = cosine_similarity(source_embeddings[closest], np_embedding)
+
     # match closest embeddings with similarity
     closest_df = df.iloc[closest]
+
     # create json similarity object
     similarities = list(zip(distances, closest_df.index.tolist()))
-    json_sims = [{
+    json_sims = [{"similaritiy": float(d[0]),
+                  "vaddr": int(df.iloc[v]["vaddr"]),
+                  "name": str(df.iloc[v]["name"]),
+                  "size": int(df.iloc[v]["size"])
+                  } for d, v in similarities]
     return json_sims


-def
+def RE_nearest_symbols_batch(function_ids: list[int], nns: int = 5, collections: list[str] = None,
+                             distance: float = 0.1, debug_enabled: bool = False) -> Response:
     """
-
-
-
-
+    Get nearest functions to a passed function ids
+    :param function_ids: List of function ids
+    :param nns: Number of nearest neighbors
+    :param collections: List of collections RevEng.AI collection names to search through
+    :param distance: How close we want the ANN search to filter for
+    :param debug_enabled: ANN Symbol Search, only perform ANN on debug symbols if set
     """
-    params={
+    params = {"function_id_list": function_ids,
+              "result_per_function": nns,
+              "debug_mode": debug_enabled,
+              "distance": distance,}

     if collections:
-
+        # api param is collection, not collections
+        params["collection"] = collections
+
+    res: Response = reveng_req(requests.post, "v1/ann/symbol/batch", json_data=params)

-    res = reveng_req(requests.post, "ann/symbol", data=json.dumps(embedding), params=params)
     res.raise_for_status()
-
-    print_json(data=f_suggestions)
+    return res


-def
+def RE_nearest_functions(fpath: str, binary_id: int = 0, nns: int = 5,
+                         distance: float = 0.1, debug_enabled: bool = False) -> Response:
     """
-
-
-
-
+    Get the nearest functions
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
+    :param nns: Number of nearest neighbors
+    :param distance: How close we want the ANN search to filter for
+    :param debug_enabled: ANN Symbol Search, only perform ANN on debug symbols if set
     """
-
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id

-
-
+    end_point = f"v1/ann/symbol/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    params = {"result_per_function": nns,
+              "debug_mode": debug_enabled,
+              "distance": distance, }
+
+    res: Response = reveng_req(requests.post, end_point, json_data=params)
+
+    res.raise_for_status()
+    return res
+
+
+def RE_analyze_functions(fpath: str, binary_id: int = 0) -> Response:
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id
+
+    end_point = f"v1/analyse/functions/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    res.raise_for_status()
+    return res
+
+
+def RE_SBOM(fpath: str, binary_id: int = 0) -> Response:
+    """
+    Get Software Bill Of Materials for binary
+    :param fpath: File path for binary to analyse
+    :param binary_id: ID of binary
+    """
+    bin_id = re_binary_id(fpath)
+    bid = re_bid_search(bin_id) if binary_id == 0 else binary_id
+
+    end_point = f"sboms/{bid}"
+
+    if bid == -1:
+        raise ReaitError(f"No matches found for hash: {bin_id}", end_point)
+
+    res: Response = reveng_req(requests.get, end_point)
+
+    logger.info("SBOM for %s:\n%s", fpath, res.text)
+
+    res.raise_for_status()
+    return res
+
+
+def RE_functions_rename(function_id: int, new_name: str) -> Response:
+    """
+    Send the new name of a function to C2
+    :param function_id: ID of a function
+    :param new_name: New function name
+    """
+    res: Response = reveng_req(requests.post, f"v1/functions/rename/{function_id}",
+                               json_data={"new_name": new_name})
+
+    if res.ok:
+        logger.info("FunctionId %d has been renamed with '%s'.", function_id, new_name)
+    else:
+        logger.warning("Error, cannot rename FunctionId %d. %s", function_id, res.text)
+
+    res.raise_for_status()
+    return res
+
+
+def RE_settings() -> Response:
+    """
+    Get the configuration settings
+    """
+    res: Response = reveng_req(requests.get, "v1/config")

-    res = reveng_req(requests.post, "ann/binary", data=json.dumps(embedding), params=params)
     res.raise_for_status()
-
-
+    return res
+
+
+def RE_health() -> bool:
+    """
+    Health check & verify access to the API
+    """
+    res: Response = reveng_req(requests.get, "v1")
+
+    success = res.json()["success"]
+
+    if success:
+        logger.info(res.json()["message"])
+    else:
+        logger.warning(res.json()["error"])
+    return success


-def
+def RE_authentication() -> Response:
     """
-
-    :param fpath: File path for binaty to analyse
-    :param model_name: str model name of RevEng.AI AI model
+    Authentication Check
     """
-
+    res: Response = reveng_req(requests.get, "v1/authenticate")

-    res = reveng_req(requests.get, f"sboms/{binary_id(fpath)}", params=params)
     res.raise_for_status()
-
-    print_json(data=sbom)
+    return res


-def
-    """
-
-
-
-
-
+def re_binary_id(fpath: str) -> str:
+    """
+    Take the SHA-256 hash of binary file
+    :param fpath: File path for binary to analyse
+    """
+    if fpath and isfile(fpath) and access(fpath, R_OK):
+        hf = sha256()

+        with open(fpath, "rb") as fd:
+            c = fd.read()
+            hf.update(c)
+
+        return hf.hexdigest()
+    else:
+        logger.error("File '%s' doesn't exist or isn't readable", fpath)

-
+    return "undefined"
+
+
+def _binary_isa(binary: Binary, exec_type: str) -> str:
     """
-
+    Get ISA format
     """
-    if exec_type == "
-
-
+    if exec_type == "ELF":
+        arch = binary.header.machine_type
+
+        if arch == ELF.ARCH.i386:
             return "x86"
-        elif
+        elif arch == ELF.ARCH.x86_64:
             return "x86_64"
-
-
-
-
+        elif arch == ELF.ARCH.ARM:
+            return "ARM32"
+        elif arch == ELF.ARCH.AARCH64:
+            return "ARM64"
+    elif exec_type == "PE":
+        machine_type = binary.header.machine
+
+        if machine_type == PE.Header.MACHINE_TYPES.I386:
             return "x86"
-        elif machine_type ==
+        elif machine_type == PE.Header.MACHINE_TYPES.AMD64:
             return "x86_64"
-
-
-        machine_type
-
+        elif machine_type == PE.Header.MACHINE_TYPES.ARM:
+            return "ARM32"
+        elif machine_type == PE.Header.MACHINE_TYPES.ARM64:
+            return "ARM64"
+    elif exec_type == "Mach-O":
+        cpu_type = binary.header.cpu_type
+
+        if cpu_type == MachO.CPU_TYPES.x86:
             return "x86"
-        elif
+        elif cpu_type == MachO.CPU_TYPES.x86_64:
             return "x86_64"
-
-
+        elif cpu_type == MachO.CPU_TYPES.ARM:
+            return "ARM32"
+        elif cpu_type == MachO.CPU_TYPES.ARM64:
+            return "ARM64"
+
+    logger.error("Error, could not determine or unsupported ISA for binary format: %s.", exec_type)
+    raise RuntimeError(f"Error, could not determine or unsupported ISA for binary format: {exec_type}.")


-def _binary_format(
+def _binary_format(binary: Binary) -> str:
     """
-
+    Get executable file format
     """
-    if
-        return "
-    if
-        return "
-    if
-        return "
-
-    raise RuntimeError("Error, could not determine binary format")
+    if binary.format == Binary.FORMATS.PE:
+        return "PE"
+    if binary.format == Binary.FORMATS.ELF:
+        return "ELF"
+    if binary.format == Binary.FORMATS.MACHO:
+        return "Mach-O"

+    logger.error("Error, could not determine or unsupported binary format: %s.", binary.format)
+    raise RuntimeError(f"Error, could not determine or unsupported binary format: {binary.format}")


-def file_type(fpath: str):
+def file_type(fpath: str) -> tuple[str, str]:
     """
-
+    Determine ISA for binary
+    :param fpath: File path for binary to analyse
     """
-    binary =
+    binary = parse(fpath)

-
-
-
-
+    if not binary:
+        file_format = isa_format = "Unknown format"
+    else:
+        # handle PE and ELF files
+        file_format = _binary_format(binary)
+        isa_format = _binary_isa(binary, file_format)

+    return file_format, isa_format

-
+
+def parse_config() -> None:
+    """
+    Parse ~/.reait.toml config file
     """
-
-    """
-    if not os.path.exists(os.path.expanduser("~/.reait.toml")):
-        return
+    fpath = expanduser("~/.reait.toml")

-
-
-
-
-
+    if isfile(fpath) and access(fpath, R_OK):
+        with open(fpath) as fd:
+            config = tomli.loads(fd.read())
+
+        for key in ("apikey", "host", "model",):
+            if key in config:
+                re_conf[key] = config[key]
+    else:
+        logger.info("File %s doesn't exist or isn't readable", fpath)


-def angular_distance(x, y):
+def angular_distance(x, y) -> float:
     """
     Compute angular distance between two embedding vectors
-    Normalised
+    Normalised euclidian distance
     """
-    cos = dot(x, y) / ((dot(x, x) * dot(y, y))
-    return 1.0 - arccos(cos)/pi
+    cos = dot(x, y) / ((dot(x, x) * dot(y, y))**0.5)
+    return 1.0 - arccos(cos) / pi