tooluniverse 1.0.0__py3-none-any.whl → 1.0.2__py3-none-any.whl
This diff shows the changes between these publicly released package versions as they appear in their public registry, and is provided for informational purposes only.
Potentially problematic release: this version of tooluniverse might be problematic.
- tooluniverse/__init__.py +71 -57
- tooluniverse/alphafold_tool.py +51 -20
- tooluniverse/compose_scripts/tool_graph_generation.py +249 -0
- tooluniverse/compose_scripts/tool_metadata_generator.py +369 -0
- tooluniverse/data/agentic_tools.json +143 -28
- tooluniverse/data/alphafold_tools.json +203 -61
- tooluniverse/data/compose_tools.json +63 -0
- tooluniverse/data/special_tools.json +2 -0
- tooluniverse/test/test_alphafold_tool.py +66 -29
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/METADATA +115 -173
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/RECORD +16 -18
- tooluniverse/data/packages/software_tools.json +0 -4954
- tooluniverse/remote/expert_feedback_mcp/human_expert_mcp_server.py +0 -1611
- tooluniverse/remote/expert_feedback_mcp/simple_test.py +0 -34
- tooluniverse/remote/expert_feedback_mcp/start_web_interface.py +0 -91
- /tooluniverse/data/{clait_tools.json → adverse_event_tools.json} +0 -0
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/WHEEL +0 -0
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/entry_points.txt +0 -0
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/licenses/LICENSE +0 -0
- {tooluniverse-1.0.0.dist-info → tooluniverse-1.0.2.dist-info}/top_level.txt +0 -0
tooluniverse/__init__.py
CHANGED
@@ -1,4 +1,5 @@
 from importlib.metadata import version
+import warnings
 from typing import Any, Optional, List
 from .execute_function import ToolUniverse
 from .base_tool import BaseTool
@@ -148,65 +149,76 @@ MCPClientTool: Any
 MCPAutoLoaderTool: Any
 ADMETAITool: Any
 AlphaFoldRESTTool: Any
+ComposeTool: Any
 if not LAZY_LOADING_ENABLED:
-    # Import all tool classes immediately (old behavior)
-    [old lines 153-204: the previous top-level import block; content not captured in this view]
+    # Import all tool classes immediately (old behavior) with warning suppression  # noqa: E501
+    with warnings.catch_warnings():
+        warnings.filterwarnings("ignore", category=DeprecationWarning)
+        warnings.filterwarnings("ignore", category=RuntimeWarning)
+        warnings.filterwarnings("ignore", category=UserWarning)
+        warnings.filterwarnings("ignore", category=FutureWarning)
+
+        from .restful_tool import MonarchTool, MonarchDiseasesForMultiplePhenoTool
+        from .ctg_tool import ClinicalTrialsSearchTool, ClinicalTrialsDetailsTool
+        from .graphql_tool import (
+            OpentargetTool,
+            OpentargetGeneticsTool,
+            OpentargetToolDrugNameMatch,
+            DiseaseTargetScoreTool,
+        )
+        from .openfda_tool import (
+            FDADrugLabelTool,
+            FDADrugLabelSearchTool,
+            FDADrugLabelSearchIDTool,
+            FDADrugLabelGetDrugGenericNameTool,
+        )
+        from .openfda_adv_tool import (
+            FDADrugAdverseEventTool,
+            FDACountAdditiveReactionsTool,
+        )
+        from .chem_tool import ChEMBLTool
+        from .compose_tool import ComposeTool
+        from .europe_pmc_tool import EuropePMCTool
+        from .semantic_scholar_tool import SemanticScholarTool
+        from .pubtator_tool import PubTatorTool
+        from .efo_tool import EFOTool
+        from .agentic_tool import AgenticTool
+        from .dataset_tool import DatasetTool
+        from .dailymed_tool import SearchSPLTool, GetSPLBySetIDTool
+        from .hpa_tool import HPAGetGeneJSONTool, HPAGetGeneXMLTool
+        from .reactome_tool import ReactomeRESTTool
+        from .pubchem_tool import PubChemRESTTool
+        from .url_tool import URLHTMLTagTool, URLToPDFTextTool
+        from .medlineplus_tool import MedlinePlusRESTTool
+        from .uniprot_tool import UniProtRESTTool
+        from .package_tool import PackageTool
+        from .uspto_tool import USPTOOpenDataPortalTool
+        from .xml_tool import XMLDatasetTool
+        from .tool_finder_embedding import ToolFinderEmbedding
+        from .tool_finder_keyword import ToolFinderKeyword
+        from .tool_finder_llm import ToolFinderLLM
+        from .embedding_database import EmbeddingDatabase
+        from .embedding_sync import EmbeddingSync
+        from .rcsb_pdb_tool import RCSBTool
+        from .gwas_tool import (
+            GWASAssociationSearch,
+            GWASStudySearch,
+            GWASSNPSearch,
+            GWASAssociationByID,
+            GWASStudyByID,
+            GWASSNPByID,
+            GWASVariantsForTrait,
+            GWASAssociationsForTrait,
+            GWASAssociationsForSNP,
+            GWASStudiesForTrait,
+            GWASSNPsForGene,
+            GWASAssociationsForStudy,
+        )
 
-    [old lines 206-209: removed import lines; content not captured in this view]
+        # from .admetai_tool import ADMETAITool
+        from .mcp_client_tool import MCPClientTool, MCPAutoLoaderTool
+        from .admetai_tool import ADMETAITool
+        from .alphafold_tool import AlphaFoldRESTTool
 else:
     # With lazy loading, create lazy import proxies that import modules only when accessed
     MonarchTool = _LazyImportProxy("restful_tool", "MonarchTool")
@@ -238,6 +250,7 @@ else:
         "openfda_adv_tool", "FDACountAdditiveReactionsTool"
     )
     ChEMBLTool = _LazyImportProxy("chem_tool", "ChEMBLTool")
+    ComposeTool = _LazyImportProxy("compose_tool", "ComposeTool")
     EuropePMCTool = _LazyImportProxy("europe_pmc_tool", "EuropePMCTool")
     SemanticScholarTool = _LazyImportProxy(
         "semantic_scholar_tool", "SemanticScholarTool"
@@ -306,6 +319,7 @@ __all__ = [
     "FDADrugAdverseEventTool",
     "FDACountAdditiveReactionsTool",
     "ChEMBLTool",
+    "ComposeTool",
     "EuropePMCTool",
     "SemanticScholarTool",
     "PubTatorTool",
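Note on the lazy branch above: _LazyImportProxy is defined elsewhere in __init__.py and is unchanged by this release, so its body does not appear in the diff. As a rough, hypothetical sketch (not the package's actual implementation), a proxy with the two-argument (module, attribute) form used above can defer the real import until first use:

import importlib

class _LazyImportProxy:
    """Hypothetical sketch; tooluniverse's real proxy is not shown in this diff."""

    def __init__(self, module_name: str, attr_name: str):
        self._module_name = module_name  # e.g. "compose_tool"
        self._attr_name = attr_name      # e.g. "ComposeTool"
        self._resolved = None            # cached real class after first use

    def _resolve(self):
        if self._resolved is None:
            module = importlib.import_module(f"tooluniverse.{self._module_name}")
            self._resolved = getattr(module, self._attr_name)
        return self._resolved

    def __call__(self, *args, **kwargs):
        # Instantiating the proxy instantiates the real class.
        return self._resolve()(*args, **kwargs)

    def __getattr__(self, item):
        return getattr(self._resolve(), item)

Under this scheme, `import tooluniverse` stays cheap: a module such as compose_tool is only imported when ComposeTool is first called or inspected, which is why the eager branch needs the warnings.catch_warnings() wrapper while the lazy branch does not.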
tooluniverse/alphafold_tool.py
CHANGED
@@ -11,7 +11,7 @@ ALPHAFOLD_BASE_URL = "https://alphafold.ebi.ac.uk/api"
 class AlphaFoldRESTTool(BaseTool):
     """
     AlphaFold Protein Structure Database API tool.
-
+    Generic wrapper for AlphaFold API endpoints defined in alphafold_tools.json.
     """
 
     def __init__(self, tool_config):
@@ -20,28 +20,38 @@ class AlphaFoldRESTTool(BaseTool):
         parameter = tool_config.get("parameter", {})
 
         self.endpoint_template: str = fields["endpoint"]
-        self.param_schema: Dict[str, Any] = parameter.get("properties", {})
         self.required: List[str] = parameter.get("required", [])
         self.output_format: str = fields.get("return_format", "JSON")
 
-    def _build_url(self, arguments: Dict[str, Any]) -> Dict[str, Any]:
+    def _build_url(self, arguments: Dict[str, Any]) -> str | Dict[str, Any]:
+        # Example: endpoint_template = "/annotations/{qualifier}.json"
         url_path = self.endpoint_template
+        # Find placeholders like {qualifier} in the path
         placeholders = re.findall(r"\{([^{}]+)\}", url_path)
+        used = set()
+
+        # Replace placeholders with provided arguments
+        # ex. if arguments = {"qualifier": "P69905", "type": "MUTAGEN"}
         for ph in placeholders:
             if ph not in arguments or arguments[ph] is None:
                 return {"error": f"Missing required parameter '{ph}'"}
             url_path = url_path.replace(f"{{{ph}}}", str(arguments[ph]))
-
+            used.add(ph)
+        # Now url_path = "/annotations/P69905.json"
 
-        [old lines 36-40: removed code not fully captured in this view; only "#" and "if" fragments survive]
+        # Treat all remaining args as query parameters
+        # "type" wasn't a placeholder, so it becomes a query param
+        query_args = {k: v for k, v in arguments.items() if k not in used}
+        if query_args:
+            from urllib.parse import urlencode
 
-        [old lines 42-44: removed code not captured in this view]
+            url_path += "?" + urlencode(query_args)
+
+        # Final result = "https://alphafold.ebi.ac.uk/api/annotations/P69905.json?type=MUTAGEN"
+        return ALPHAFOLD_BASE_URL + url_path
+
+    def _make_request(self, url: str) -> Dict[str, Any]:
+        """Perform a GET request and handle common errors."""
         try:
             resp = requests.get(
                 url,
@@ -54,18 +64,36 @@ class AlphaFoldRESTTool(BaseTool):
         except Exception as e:
             return {"error": "Request to AlphaFold API failed", "detail": str(e)}
 
-        # Handle HTTP errors cleanly
         if resp.status_code == 404:
-            return {
-                "error": "No AlphaFold prediction found",
-                "uniprot_id": arguments.get("uniprot_id"),
-            }
+            return {"error": "Not found", "endpoint": url}
         if resp.status_code != 200:
             return {
                 "error": f"AlphaFold API returned {resp.status_code}",
                 "detail": resp.text,
+                "endpoint": url,
             }
 
+        return {"response": resp}
+
+    def run(self, arguments: Dict[str, Any]):
+        """Execute the tool with provided arguments."""
+        # Validate required params
+        missing = [k for k in self.required if k not in arguments]
+        if missing:
+            return {"error": f"Missing required parameter(s): {', '.join(missing)}"}
+
+        # Build URL
+        url = self._build_url(arguments)
+        if isinstance(url, dict) and "error" in url:
+            return {**url, "query": arguments}
+
+        # Make request
+        result = self._make_request(url)
+        if "error" in result:
+            return {**result, "query": arguments}
+
+        resp = result["response"]
+
         # Parse JSON
         if self.output_format.upper() == "JSON":
             try:
@@ -73,7 +101,8 @@ class AlphaFoldRESTTool(BaseTool):
                 if not data:
                     return {
                         "error": "AlphaFold returned an empty response",
-                        [old line 76: truncated in this view]
+                        "endpoint": url,
+                        "query": arguments,
                     }
 
                 return {
@@ -90,7 +119,9 @@ class AlphaFoldRESTTool(BaseTool):
                     "error": "Failed to parse JSON response",
                     "raw": resp.text,
                     "detail": str(e),
+                    "endpoint": url,
+                    "query": arguments,
                 }
 
-        # Fallback
-        return {"data": resp.text, "metadata": {"endpoint": url}}
+        # Fallback for non-JSON output
+        return {"data": resp.text, "metadata": {"endpoint": url, "query": arguments}}
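To make the new URL-building path concrete, here is a hypothetical invocation. The "fields"/"parameter" config layout is inferred from the constructor lines visible above, and the endpoint is illustrative only; the real tool definitions live in tooluniverse/data/alphafold_tools.json:

# Hypothetical tool config, for illustration only.
config = {
    "fields": {
        "endpoint": "/annotations/{qualifier}.json",  # path placeholder in braces
        "return_format": "JSON",
    },
    "parameter": {
        "properties": {"qualifier": {"type": "string"}},
        "required": ["qualifier"],
    },
}

tool = AlphaFoldRESTTool(config)
# "qualifier" fills the path placeholder; "type" is not a placeholder, so it
# is appended as a query parameter, yielding
# https://alphafold.ebi.ac.uk/api/annotations/P69905.json?type=MUTAGEN
result = tool.run({"qualifier": "P69905", "type": "MUTAGEN"})

Note that every error path in the refactored run() now echoes the failing "endpoint" and the original arguments under "query", which makes failures much easier to trace than in 1.0.0.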
tooluniverse/compose_scripts/tool_graph_generation.py
ADDED
@@ -0,0 +1,249 @@
+"""Tool Graph Generation Compose Script
+
+Efficiently evaluates directional data-flow relationships between all unique pairs
+of provided tool configs using one agentic tool:
+- ToolRelationshipDetector
+
+Outputs a graph structure with edges representing valid directional relationships.
+Each edge stores: source, target, rationale.
+
+Performance considerations:
+- Iterates i<j once (O(N^2/2) pairs)
+- Lightweight JSON serialization of minimal fields
+- Optional batching hook (currently sequential because call_tool likely remote)
+
+Arguments:
+    tool_configs (list[dict]) REQUIRED
+    max_tools (int) optional limit for debugging
+    output_path (str) path to write resulting graph JSON (default './tool_relationship_graph.json')
+    save_intermediate_every (int) checkpoint frequency (default 5000 pairs processed)
+
+Return:
+    dict with keys: nodes, edges, stats
+"""
+from __future__ import annotations
+
+import json
+import math
+import os
+import time
+from typing import Any, Dict, List, Tuple
+
+
+DETECTOR_NAME = "ToolRelationshipDetector"
+
+
+def compose(arguments, tooluniverse, call_tool):  # noqa: D401
+    tool_configs: List[dict] = arguments.get("tool_configs") or []
+    if not tool_configs:
+        return {"status": "error", "message": "tool_configs empty"}
+
+    max_tools = arguments.get("max_tools")
+    if isinstance(max_tools, int) and max_tools > 0:
+        tool_configs = tool_configs[:max_tools]
+
+    output_path = arguments.get("output_path", "./tool_relationship_graph.json")
+    checkpoint_every = int(arguments.get("save_intermediate_every", 5000))
+
+    # Prepare nodes list (unique tool names)
+    nodes = []
+    minimal_tool_map: Dict[str, dict] = {}
+    for cfg in tool_configs:
+        name = cfg.get("name")
+        if not name:
+            continue
+        if name in minimal_tool_map:
+            continue
+        minimal_tool = {
+            "name": name,
+            "description": cfg.get("description", ""),
+            "parameter": cfg.get("parameter", {}),
+            "type": cfg.get("type", cfg.get("toolType", "unknown")),
+        }
+        minimal_tool_map[name] = minimal_tool
+        nodes.append({"id": name, "name": name, "type": minimal_tool["type"]})
+
+    names = list(minimal_tool_map.keys())
+    n = len(names)
+    total_pairs = n * (n - 1) // 2
+
+    edges: List[dict] = []
+    processed_pairs = 0
+    llm_calls = 0
+    start_time = time.time()
+    batch_size = 100
+
+    # --- Resume from checkpoint ---
+    checkpoint_path = output_path + ".checkpoint.json"
+    load_path = None
+
+    # Prefer checkpoint file, otherwise use the main output file
+    if os.path.exists(checkpoint_path):
+        load_path = checkpoint_path
+    elif os.path.exists(output_path):
+        load_path = output_path
+
+    if load_path:
+        print(f"Attempting to resume from {load_path}")
+        try:
+            with open(load_path, "r", encoding="utf-8") as f:
+                existing_graph = json.load(f)
+
+            # Re-hydrate edges and find processed source tools
+            if "edges" in existing_graph and isinstance(existing_graph["edges"], list):
+                edges = existing_graph["edges"]
+
+            # Align the 'names' list order with the loaded graph to ensure correct loop continuation
+            if "nodes" in existing_graph and isinstance(existing_graph["nodes"], list):
+                loaded_node_order = [node.get("name") for node in existing_graph.get("nodes", [])]
+                if names == loaded_node_order:
+                    print("Current tool order matches the loaded graph.")
+                else:
+                    print("Reordering tools to match the loaded graph for correct resume.")
+                    # Create a map for quick lookup of current tool positions
+                    current_name_pos = {name: i for i, name in enumerate(names)}
+                    # Build the new 'names' list and 'minimal_tool_map' based on the loaded order
+                    new_names = [name for name in loaded_node_order if name in current_name_pos]
+                    # Find any new tools not in the original graph and append them
+                    new_tools_from_config = [name for name in names if name not in loaded_node_order]
+                    if new_tools_from_config:
+                        print(f"Appending {len(new_tools_from_config)} new tools to the list.")
+                        new_names.extend(new_tools_from_config)
+
+                    names = new_names
+                    assert(n == len(names))  # n should remain the same
+                    print("Tool order successfully realigned.")
+
+        except Exception as e:
+            print(f"Warning: Could not load or parse existing graph at {load_path}. Starting fresh. Error: {e}")
+            edges = []  # Reset edges if loading failed
+
+    # Core loop over unique unordered pairs (i<j). We'll batch the 'j' tools.
+    for i in range(n):
+        tool_a = minimal_tool_map[names[i]]
+        a_json = json.dumps(tool_a, ensure_ascii=False)
+        # This logic is to skip all tools until a specific one is found,
+        # skip that one, and then process all subsequent tools.
+        # This is useful for debugging or resuming from a specific point.
+        start_processing_flag_name = 'get_em_3d_fitting_and_reconstruction_details'
+
+        # Find the index of the tool to start after
+        try:
+            start_index = names.index(start_processing_flag_name)
+        except ValueError:
+            start_index = -1  # Flag tool not found, process all
+
+        if start_index != -1 and i <= start_index:
+            print(f"Skipping tool {tool_a['name']} with index {i} (target index is {start_index}).")
+            continue
+
+        # Batch the remaining tools to compare against tool_a
+        for j_batch_start in range(i + 1, n, batch_size):
+            j_batch_end = min(j_batch_start + batch_size, n)
+            other_tools_batch_names = names[j_batch_start:j_batch_end]
+
+            if not other_tools_batch_names:
+                continue
+
+            other_tools_list = [minimal_tool_map[name] for name in other_tools_batch_names]
+            other_tools_json = json.dumps(other_tools_list, ensure_ascii=False)
+
+            # Call detector with the batch
+            detector_args = {"tool_a": a_json, "other_tools": other_tools_json}
+            detector_res = {}
+            for _ in range(5):  # Retry up to 5 times
+                detector_raw = call_tool(DETECTOR_NAME, detector_args)
+                llm_calls += 1
+                detector_res = _parse_json(detector_raw)
+                if detector_res and "relationships" in detector_res:
+                    break
+
+            processed_pairs += len(other_tools_list)
+
+            relationships = detector_res.get("relationships", [])
+            if not isinstance(relationships, list):
+                relationships = []
+
+            print(f"Tool A: {tool_a['name']} vs {len(other_tools_list)} others => Found {len(relationships)} relationships")
+
+            for rel in relationships:
+                tool_b_name = rel.get("tool_b_name")
+                direction = rel.get("direction")
+                rationale = rel.get("rationale")
+
+                if not tool_b_name or tool_b_name not in minimal_tool_map:
+                    continue
+
+                if direction in ("A->B", "both"):
+                    edges.append({
+                        "source": tool_a["name"],
+                        "target": tool_b_name,
+                        "rationale": rationale,
+                    })
+                if direction in ("B->A", "both"):
+                    edges.append({
+                        "source": tool_b_name,
+                        "target": tool_a["name"],
+                        "rationale": rationale,
+                    })
+
+            # Progress reporting and checkpointing
+            if processed_pairs % 1000 < len(other_tools_list):  # Heuristic to report near the thousand marks
+                elapsed = time.time() - start_time
+                rate = processed_pairs / elapsed if elapsed > 0 else 0
+                print(f"[progress] pairs={processed_pairs}/{total_pairs} edges={len(edges)} llm_calls={llm_calls} rate={rate:.2f} pairs/s")
+            if processed_pairs // checkpoint_every > (processed_pairs - len(other_tools_list)) // checkpoint_every:
+                _maybe_checkpoint(output_path, nodes, edges)
+
+    graph = {
+        "nodes": nodes,
+        "edges": edges,
+        "stats": {
+            "tools": n,
+            "pairs_evaluated": processed_pairs,
+            "edges": len(edges),
+            "llm_calls": llm_calls,
+            "runtime_sec": round(time.time() - start_time, 2)
+        }
+    }
+
+    # Final save
+    try:
+        with open(output_path, "w", encoding="utf-8") as f:
+            json.dump(graph, f, indent=2)
+    except Exception as e:
+        return {"status": "error", "message": f"Failed to write output: {e}", "graph": graph}
+
+    return {"status": "success", "output_file": output_path, "graph": graph}
+
+
+def _maybe_checkpoint(base_path: str, nodes: List[dict], edges: List[dict]):
+    ck_path = base_path + ".checkpoint_new.json"
+    try:
+        with open(ck_path, "w", encoding="utf-8") as f:
+            json.dump({"nodes": nodes, "edges": edges}, f)
+        print(f"[checkpoint] saved {ck_path} nodes={len(nodes)} edges={len(edges)}")
+    except Exception as e:
+        print(f"[checkpoint] failed: {e}")
+
+
+def _parse_json(obj: Any) -> dict:
+    if isinstance(obj, dict):
+        # may be wrapped
+        if "result" in obj and isinstance(obj["result"], str):
+            try:
+                return json.loads(obj["result"])
+            except Exception:
+                return {}
+        if "content" in obj and isinstance(obj["content"], str):
+            try:
+                return json.loads(obj["content"])
+            except Exception:
+                return {}
+        return obj
+    if isinstance(obj, str):
+        try:
+            return json.loads(obj)
+        except Exception:
+            return {}
+    return {}
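To illustrate the contract this script expects from ToolRelationshipDetector, here is a minimal, hypothetical driver with a stubbed call_tool. The relationships payload shape (tool_b_name, direction, rationale, with directions "A->B", "B->A", or "both") mirrors how compose() consumes the detector output above; the stub itself is not part of the package:

from tooluniverse.compose_scripts.tool_graph_generation import compose

def fake_call_tool(tool_name, args):
    # A real deployment routes this to the ToolRelationshipDetector agentic
    # tool; here we hard-code one directional edge for demonstration.
    return {"relationships": [{
        "tool_b_name": "tool_b",
        "direction": "A->B",
        "rationale": "tool_a's output feeds tool_b's input",
    }]}

result = compose(
    {
        "tool_configs": [
            {"name": "tool_a", "description": "produces X", "parameter": {}},
            {"name": "tool_b", "description": "consumes X", "parameter": {}},
        ],
        "output_path": "./tool_relationship_graph.json",
    },
    tooluniverse=None,        # unused by this script
    call_tool=fake_call_tool,
)
print(result["graph"]["stats"])  # e.g. {'tools': 2, 'pairs_evaluated': 1, ...}

One behavior worth noting: the hard-coded start_processing_flag_name skip is a debugging leftover. When that tool name is absent from the input (as here), names.index raises ValueError, start_index stays -1, and every pair is processed.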