PyPI - aiagents4pharma - Versions diffs - 1.44.0__py3-none-any.whl → 1.45.1__py3-none-any.whl - Mend

aiagents4pharma 1.44.0__py3-none-any.whl → 1.45.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (289) hide show

aiagents4pharma/talk2knowledgegraphs/tools/multimodal_subgraph_extraction.py CHANGED Viewed

@@ -2,23 +2,25 @@
 Tool for performing multimodal subgraph extraction.
 """
-from typing import Type, Annotated
 import logging
 import pickle
-import numpy as np
-import pandas as pd
+from typing import Annotated
 import hydra
 import networkx as nx
-from pydantic import BaseModel, Field
-from langchain_core.tools import BaseTool
+import numpy as np
+import pandas as pd
+import torch
 from langchain_core.messages import ToolMessage
+from langchain_core.tools import BaseTool
 from langchain_core.tools.base import InjectedToolCallId
-from langgraph.types import Command
 from langgraph.prebuilt import InjectedState
-import torch
+from langgraph.types import Command
+from pydantic import BaseModel, Field
 from torch_geometric.data import Data
-from ..utils.extractions.multimodal_pcst import MultimodalPCSTPruning
 from ..utils.embeddings.ollama import EmbeddingWithOllama
+from ..utils.extractions.multimodal_pcst import MultimodalPCSTPruning
 from .load_arguments import ArgumentData
 # Initialize logger
@@ -38,14 +40,10 @@ class MultimodalSubgraphExtractionInput(BaseModel):
         arg_data: Argument for analytical process over graph data.
     """
-    tool_call_id: Annotated[str, InjectedToolCallId] = Field(
-        description="Tool call ID."
-    )
+    tool_call_id: Annotated[str, InjectedToolCallId] = Field(description="Tool call ID.")
     state: Annotated[dict, InjectedState] = Field(description="Injected state.")
     prompt: str = Field(description="Prompt to interact with the backend.")
-    arg_data: ArgumentData = Field(
-        description="Experiment over graph data.", default=None
-    )
+    arg_data: ArgumentData = Field(description="Experiment over graph data.", default=None)
 class MultimodalSubgraphExtractionTool(BaseTool):
@@ -56,12 +54,11 @@ class MultimodalSubgraphExtractionTool(BaseTool):
     name: str = "subgraph_extraction"
     description: str = "A tool for subgraph extraction based on user's prompt."
-    args_schema: Type[BaseModel] = MultimodalSubgraphExtractionInput
+    args_schema: type[BaseModel] = MultimodalSubgraphExtractionInput
-    def _prepare_query_modalities(self,
-                                  prompt_emb: list,
-                                  state: Annotated[dict, InjectedState],
-                                  pyg_graph: Data) -> pd.DataFrame:
+    def _prepare_query_modalities(
+        self, prompt_emb: list, state: Annotated[dict, InjectedState], pyg_graph: Data
+    ) -> pd.DataFrame:
         """
         Prepare the modality-specific query for subgraph extraction.
@@ -75,77 +72,90 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         """
         # Initialize dataframes
         multimodal_df = pd.DataFrame({"name": []})
-        query_df = pd.DataFrame({"node_id": [],
-                                 "node_type": [],
-                                 "x": [],
-                                 "desc_x": [],
-                                 "use_description": []})
+        query_df = pd.DataFrame(
+            {
+                "node_id": [],
+                "node_type": [],
+                "x": [],
+                "desc_x": [],
+                "use_description": [],
+            }
+        )
         # Loop over the uploaded files and find multimodal files
         for i in range(len(state["uploaded_files"])):
             # Check if multimodal file is uploaded
             if state["uploaded_files"][i]["file_type"] == "multimodal":
                 # Read the Excel file
-                multimodal_df = pd.read_excel(state["uploaded_files"][i]["file_path"],
-                                              sheet_name=None)
+                multimodal_df = pd.read_excel(
+                    state["uploaded_files"][i]["file_path"], sheet_name=None
+                )
         # Check if the multimodal_df is empty
         if len(multimodal_df) > 0:
             # Merge all obtained dataframes into a single dataframe
             multimodal_df = pd.concat(multimodal_df).reset_index()
             multimodal_df.drop(columns=["level_1"], inplace=True)
-            multimodal_df.rename(columns={"level_0": "q_node_type",
-                                        "name": "q_node_name"}, inplace=True)
+            multimodal_df.rename(
+                columns={"level_0": "q_node_type", "name": "q_node_name"}, inplace=True
+            )
             # Since an excel sheet name could not contain a `/`,
             # but the node type can be 'gene/protein' as exists in the PrimeKG
             multimodal_df["q_node_type"] = multimodal_df.q_node_type.apply(
-                lambda x: x.replace('-', '/')
+                lambda x: x.replace("-", "/")
             )
             # Convert PyG graph to a DataFrame for easier filtering
-            graph_df = pd.DataFrame({
-                "node_id": pyg_graph.node_id,
-                "node_name": pyg_graph.node_name,
-                "node_type": pyg_graph.node_type,
-                "x": pyg_graph.x,
-                "desc_x": pyg_graph.desc_x.tolist(),
-            })
+            graph_df = pd.DataFrame(
+                {
+                    "node_id": pyg_graph.node_id,
+                    "node_name": pyg_graph.node_name,
+                    "node_type": pyg_graph.node_type,
+                    "x": pyg_graph.x,
+                    "desc_x": pyg_graph.desc_x.tolist(),
+                }
+            )
             # Make a query dataframe by merging the graph_df and multimodal_df
-            query_df = graph_df.merge(multimodal_df, how='cross')
+            query_df = graph_df.merge(multimodal_df, how="cross")
             query_df = query_df[
                 query_df.apply(
-                    lambda x:
-                    (x['q_node_name'].lower() in x['node_name'].lower()) & # node name
-                    (x['node_type'] == x['q_node_type']), # node type
-                    axis=1
+                    lambda x: (x["q_node_name"].lower() in x["node_name"].lower())  # node name
+                    & (x["node_type"] == x["q_node_type"]),  # node type
+                    axis=1,
                 )
             ]
-            query_df = query_df[['node_id', 'node_type', 'x', 'desc_x']].reset_index(drop=True)
-            query_df['use_description'] = False # set to False for modal-specific embeddings
+            query_df = query_df[["node_id", "node_type", "x", "desc_x"]].reset_index(drop=True)
+            query_df["use_description"] = False  # set to False for modal-specific embeddings
             # Update the state by adding the the selected node IDs
             state["selections"] = query_df.groupby("node_type")["node_id"].apply(list).to_dict()
         # Append a user prompt to the query dataframe
-        query_df = pd.concat([
-            query_df,
-            pd.DataFrame({
-                'node_id': 'user_prompt',
-                'node_type': 'prompt',
-                'x': prompt_emb,
-                'desc_x': prompt_emb,
-                'use_description': True # set to True for user prompt embedding
-            })
-        ]).reset_index(drop=True)
+        query_df = pd.concat(
+            [
+                query_df,
+                pd.DataFrame(
+                    {
+                        "node_id": "user_prompt",
+                        "node_type": "prompt",
+                        "x": prompt_emb,
+                        "desc_x": prompt_emb,
+                        "use_description": True,  # set to True for user prompt embedding
+                    }
+                ),
+            ]
+        ).reset_index(drop=True)
         return query_df
-    def _perform_subgraph_extraction(self,
-                                     state: Annotated[dict, InjectedState],
-                                     cfg: dict,
-                                     pyg_graph: Data,
-                                     query_df: pd.DataFrame) -> dict:
+    def _perform_subgraph_extraction(
+        self,
+        state: Annotated[dict, InjectedState],
+        cfg: dict,
+        pyg_graph: Data,
+        query_df: pd.DataFrame,
+    ) -> dict:
         """
         Perform multimodal subgraph extraction based on modal-specific embeddings.
@@ -176,11 +186,13 @@ class MultimodalSubgraphExtractionTool(BaseTool):
                 num_clusters=cfg.num_clusters,
                 pruning=cfg.pruning,
                 verbosity_level=cfg.verbosity_level,
-                use_description=q[1]['use_description'],
-            ).extract_subgraph(pyg_graph,
-                               torch.tensor(q[1]['desc_x']), # description embedding
-                               torch.tensor(q[1]['x']), # modal-specific embedding
-                               q[1]['node_type'])
+                use_description=q[1]["use_description"],
+            ).extract_subgraph(
+                pyg_graph,
+                torch.tensor(q[1]["desc_x"]),  # description embedding
+                torch.tensor(q[1]["x"]),  # modal-specific embedding
+                q[1]["node_type"],
+            )
             # Append the extracted subgraph to the dictionary
             subgraphs["nodes"].append(subgraph["nodes"].tolist())
@@ -196,11 +208,9 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         return subgraphs
-    def _prepare_final_subgraph(self,
-                               state:Annotated[dict, InjectedState],
-                               subgraph: dict,
-                               graph: dict,
-                               cfg) -> dict:
+    def _prepare_final_subgraph(
+        self, state: Annotated[dict, InjectedState], subgraph: dict, graph: dict, cfg
+    ) -> dict:
         """
         Prepare the subgraph based on the extracted subgraph.
@@ -227,14 +237,8 @@ class MultimodalSubgraphExtractionTool(BaseTool):
             # Edge features
             edge_index=torch.LongTensor(
                 [
-                    [
-                        mapping[i]
-                        for i in graph["pyg"].edge_index[:, subgraph["edges"]][0].tolist()
-                    ],
-                    [
-                        mapping[i]
-                        for i in graph["pyg"].edge_index[:, subgraph["edges"]][1].tolist()
-                    ],
+                    [mapping[i] for i in graph["pyg"].edge_index[:, subgraph["edges"]][0].tolist()],
+                    [mapping[i] for i in graph["pyg"].edge_index[:, subgraph["edges"]][1].tolist()],
                 ]
             ),
             edge_attr=graph["pyg"].edge_attr[subgraph["edges"]],
@@ -247,8 +251,9 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         # Networkx DiGraph construction to be visualized in the frontend
         nx_graph = nx.DiGraph()
         # Add nodes with attributes
-        node_colors = {n: cfg.node_colors_dict[k]
-                       for k, v in state["selections"].items() for n in v}
+        node_colors = {
+            n: cfg.node_colors_dict[k] for k, v in state["selections"].items() for n in v
+        }
         for n in pyg_graph.node_name:
             nx_graph.add_node(n, color=node_colors.get(n, None))
@@ -256,7 +261,8 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         edges = zip(
             pyg_graph.edge_index[0].tolist(),
             pyg_graph.edge_index[1].tolist(),
-            pyg_graph.edge_type
+            pyg_graph.edge_type,
+            strict=False,
         )
         for src, dst, edge_type in edges:
             nx_graph.add_edge(
@@ -303,7 +309,8 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         # Load hydra configuration
         with hydra.initialize(version_base=None, config_path="../configs"):
             cfg = hydra.compose(
-                config_name="config", overrides=["tools/multimodal_subgraph_extraction=default"]
+                config_name="config",
+                overrides=["tools/multimodal_subgraph_extraction=default"],
             )
             cfg = cfg.tools.multimodal_subgraph_extraction
@@ -322,20 +329,14 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         query_df = self._prepare_query_modalities(
             [EmbeddingWithOllama(model_name=cfg.ollama_embeddings[0]).embed_query(prompt)],
             state,
-            initial_graph["pyg"]
+            initial_graph["pyg"],
         )
         # Perform subgraph extraction
-        subgraphs = self._perform_subgraph_extraction(state,
-                                                      cfg,
-                                                      initial_graph["pyg"],
-                                                      query_df)
+        subgraphs = self._perform_subgraph_extraction(state, cfg, initial_graph["pyg"], query_df)
         # Prepare subgraph as a NetworkX graph and textualized graph
-        final_subgraph = self._prepare_final_subgraph(state,
-                                                      subgraphs,
-                                                      initial_graph,
-                                                      cfg)
+        final_subgraph = self._prepare_final_subgraph(state, subgraphs, initial_graph, cfg)
         # Prepare the dictionary of extracted graph
         dic_extracted_graph = {
@@ -362,7 +363,8 @@ class MultimodalSubgraphExtractionTool(BaseTool):
         # Return the updated state of the tool
         return Command(
-            update=dic_updated_state_for_model | {
+            update=dic_updated_state_for_model
+            | {
                 # update the message history
                 "messages": [
                     ToolMessage(

aiagents4pharma/talk2knowledgegraphs/tools/subgraph_extraction.py CHANGED Viewed

@@ -2,29 +2,31 @@
 Tool for performing subgraph extraction.
 """
-from typing import Type, Annotated
 import logging
 import pickle
-import numpy as np
-import pandas as pd
+from typing import Annotated
 import hydra
 import networkx as nx
-from pydantic import BaseModel, Field
-from langchain.chains.retrieval import create_retrieval_chain
+import numpy as np
+import pandas as pd
+import torch
 from langchain.chains.combine_documents import create_stuff_documents_chain
+from langchain.chains.retrieval import create_retrieval_chain
+from langchain_community.document_loaders import PyPDFLoader
+from langchain_core.messages import ToolMessage
 from langchain_core.prompts import ChatPromptTemplate
-from langchain_core.vectorstores import InMemoryVectorStore
 from langchain_core.tools import BaseTool
-from langchain_core.messages import ToolMessage
 from langchain_core.tools.base import InjectedToolCallId
-from langchain_community.document_loaders import PyPDFLoader
+from langchain_core.vectorstores import InMemoryVectorStore
 from langchain_text_splitters import RecursiveCharacterTextSplitter
-from langgraph.types import Command
 from langgraph.prebuilt import InjectedState
-import torch
+from langgraph.types import Command
+from pydantic import BaseModel, Field
 from torch_geometric.data import Data
-from ..utils.extractions.pcst import PCSTPruning
 from ..utils.embeddings.ollama import EmbeddingWithOllama
+from ..utils.extractions.pcst import PCSTPruning
 from .load_arguments import ArgumentData
 # Initialize logger
@@ -43,14 +45,10 @@ class SubgraphExtractionInput(BaseModel):
         arg_data: Argument for analytical process over graph data.
     """
-    tool_call_id: Annotated[str, InjectedToolCallId] = Field(
-        description="Tool call ID."
-    )
+    tool_call_id: Annotated[str, InjectedToolCallId] = Field(description="Tool call ID.")
     state: Annotated[dict, InjectedState] = Field(description="Injected state.")
     prompt: str = Field(description="Prompt to interact with the backend.")
-    arg_data: ArgumentData = Field(
-        description="Experiment over graph data.", default=None
-    )
+    arg_data: ArgumentData = Field(description="Experiment over graph data.", default=None)
 class SubgraphExtractionTool(BaseTool):
@@ -61,7 +59,7 @@ class SubgraphExtractionTool(BaseTool):
     name: str = "subgraph_extraction"
     description: str = "A tool for subgraph extraction based on user's prompt."
-    args_schema: Type[BaseModel] = SubgraphExtractionInput
+    args_schema: type[BaseModel] = SubgraphExtractionInput
     def perform_endotype_filtering(
         self,
@@ -98,9 +96,7 @@ class SubgraphExtractionTool(BaseTool):
                     ]
                 )
-                qa_chain = create_stuff_documents_chain(
-                    state["llm_model"], prompt_template
-                )
+                qa_chain = create_stuff_documents_chain(state["llm_model"], prompt_template)
                 rag_chain = create_retrieval_chain(
                     InMemoryVectorStore.from_documents(
                         documents=splits, embedding=state["embedding_model"]
@@ -119,16 +115,13 @@ class SubgraphExtractionTool(BaseTool):
         # Prepare the prompt
         if len(all_genes) > 0:
-            prompt = " ".join(
-                [prompt, cfg.prompt_endotype_addition, ", ".join(all_genes)]
-            )
+            prompt = " ".join([prompt, cfg.prompt_endotype_addition, ", ".join(all_genes)])
         return prompt
-    def prepare_final_subgraph(self,
-                               subgraph: dict,
-                               pyg_graph: Data,
-                               textualized_graph: pd.DataFrame) -> dict:
+    def prepare_final_subgraph(
+        self, subgraph: dict, pyg_graph: Data, textualized_graph: pd.DataFrame
+    ) -> dict:
         """
         Prepare the subgraph based on the extracted subgraph.
@@ -153,14 +146,8 @@ class SubgraphExtractionTool(BaseTool):
             # Edge features
             edge_index=torch.LongTensor(
                 [
-                    [
-                        mapping[i]
-                        for i in pyg_graph.edge_index[:, subgraph["edges"]][0].tolist()
-                    ],
-                    [
-                        mapping[i]
-                        for i in pyg_graph.edge_index[:, subgraph["edges"]][1].tolist()
-                    ],
+                    [mapping[i] for i in pyg_graph.edge_index[:, subgraph["edges"]][0].tolist()],
+                    [mapping[i] for i in pyg_graph.edge_index[:, subgraph["edges"]][1].tolist()],
                 ]
             ),
             edge_attr=pyg_graph.edge_attr[subgraph["edges"]],
@@ -293,7 +280,8 @@ class SubgraphExtractionTool(BaseTool):
         # Return the updated state of the tool
         return Command(
-            update=dic_updated_state_for_model | {
+            update=dic_updated_state_for_model
+            | {
                 # update the message history
                 "messages": [
                     ToolMessage(

aiagents4pharma/talk2knowledgegraphs/tools/subgraph_summarization.py CHANGED Viewed

@@ -3,16 +3,17 @@ Tool for performing subgraph summarization.
 """
 import logging
-from typing import Type, Annotated
-from pydantic import BaseModel, Field
+from typing import Annotated
+import hydra
+from langchain_core.messages import ToolMessage
 from langchain_core.output_parsers import StrOutputParser
 from langchain_core.prompts import ChatPromptTemplate
-from langchain_core.messages import ToolMessage
-from langchain_core.tools.base import InjectedToolCallId
 from langchain_core.tools import BaseTool
-from langgraph.types import Command
+from langchain_core.tools.base import InjectedToolCallId
 from langgraph.prebuilt import InjectedState
-import hydra
+from langgraph.types import Command
+from pydantic import BaseModel, Field
 # Initialize logger
 logging.basicConfig(level=logging.INFO)
@@ -31,9 +32,7 @@ class SubgraphSummarizationInput(BaseModel):
         extraction_name: Name assigned to the subgraph extraction process
     """
-    tool_call_id: Annotated[str, InjectedToolCallId] = Field(
-        description="Tool call ID."
-    )
+    tool_call_id: Annotated[str, InjectedToolCallId] = Field(description="Tool call ID.")
     state: Annotated[dict, InjectedState] = Field(description="Injected state.")
     prompt: str = Field(description="Prompt to interact with the backend.")
     extraction_name: str = Field(
@@ -51,7 +50,7 @@ class SubgraphSummarizationTool(BaseTool):
     name: str = "subgraph_summarization"
     description: str = """A tool to perform subgraph summarization over textualized graph
                         for responding to user's follow-up prompt(s)."""
-    args_schema: Type[BaseModel] = SubgraphSummarizationInput
+    args_schema: type[BaseModel] = SubgraphSummarizationInput
     def _run(
         self,
@@ -69,9 +68,7 @@ class SubgraphSummarizationTool(BaseTool):
             prompt: The prompt to interact with the backend.
             extraction_name: The name assigned to the subgraph extraction process.
         """
-        logger.log(
-            logging.INFO, "Invoking subgraph_summarization tool for %s", extraction_name
-        )
+        logger.log(logging.INFO, "Invoking subgraph_summarization tool for %s", extraction_name)
         # Load hydra configuration
         with hydra.initialize(version_base=None, config_path="../configs"):

aiagents4pharma/talk2knowledgegraphs/utils/__init__.py CHANGED Viewed

@@ -1,8 +1,5 @@
-'''
+"""
 This file is used to import all the models in the package.
-'''
-from . import embeddings
-from . import enrichments
-from . import extractions
-from . import kg_utils
-from . import pubchem_utils
+"""
+from . import embeddings, enrichments, extractions, kg_utils, pubchem_utils

aiagents4pharma/talk2knowledgegraphs/utils/embeddings/__init__.py CHANGED Viewed

@@ -1,8 +1,5 @@
-'''
+"""
 This file is used to import all the models in the package.
-'''
-from . import embeddings
-from . import sentence_transformer
-from . import huggingface
-from . import ollama
-from . import nim_molmim
+"""
+from . import embeddings, huggingface, nim_molmim, ollama, sentence_transformer

aiagents4pharma/talk2knowledgegraphs/utils/embeddings/embeddings.py CHANGED Viewed

@@ -2,9 +2,12 @@
 Embeddings interface from LangChain Core.
 https://github.com/langchain-ai/langchain/blob/master/libs/core/langchain_core/embeddings/embeddings.py
 """
 from abc import ABC, abstractmethod
 from langchain_core.runnables.config import run_in_executor
 class Embeddings(ABC):
     """Interface for embedding models.
@@ -32,6 +35,7 @@ class Embeddings(ABC):
     however, implementations may choose to override the asynchronous methods with
     an async native implementation for performance reasons.
     """
     @abstractmethod
     def embed_documents(self, texts: list[str]) -> list[list[float]]:
         """Embed search docs.

aiagents4pharma/talk2knowledgegraphs/utils/embeddings/huggingface.py CHANGED Viewed

@@ -2,11 +2,12 @@
 Embedding class using HuggingFace model based on LangChain Embeddings class.
 """
-from typing import List
 import torch
-from transformers import AutoModel, AutoTokenizer, AutoConfig
+from transformers import AutoConfig, AutoModel, AutoTokenizer
 from .embeddings import Embeddings
 class EmbeddingWithHuggingFace(Embeddings):
     """
     Embedding class using HuggingFace model based on LangChain Embeddings class.
@@ -39,18 +40,14 @@ class EmbeddingWithHuggingFace(Embeddings):
         # Try to load the model from HuggingFace Hub
         try:
             AutoConfig.from_pretrained(self.model_name)
-        except EnvironmentError as e:
-            raise ValueError(
-                f"Model {self.model_name} is not available on HuggingFace Hub."
-            ) from e
+        except OSError as e:
+            raise ValueError(f"Model {self.model_name} is not available on HuggingFace Hub.") from e
         # Load HuggingFace tokenizer and model
         self.tokenizer = AutoTokenizer.from_pretrained(
             self.model_name, cache_dir=self.model_cache_dir
         )
-        self.model = AutoModel.from_pretrained(
-            self.model_name, cache_dir=self.model_cache_dir
-        )
+        self.model = AutoModel.from_pretrained(self.model_name, cache_dir=self.model_cache_dir)
     def meanpooling(self, output, mask) -> torch.Tensor:
         """
@@ -62,11 +59,11 @@ class EmbeddingWithHuggingFace(Embeddings):
             output: The output of the model.
             mask: The mask of the model.
         """
-        embeddings = output[0] # First element of model_output contains all token embeddings
+        embeddings = output[0]  # First element of model_output contains all token embeddings
         mask = mask.unsqueeze(-1).expand(embeddings.size()).float()
         return torch.sum(embeddings * mask, 1) / torch.clamp(mask.sum(1), min=1e-9)
-    def embed_documents(self, texts: List[str]) -> List[float]:
+    def embed_documents(self, texts: list[str]) -> list[float]:
         """
         Generate embedding for a list of input texts using HuggingFace model.
@@ -86,11 +83,11 @@ class EmbeddingWithHuggingFace(Embeddings):
                 return_tensors="pt",
             ).to(self.device)
             outputs = self.model.to(self.device)(**inputs)
-            embeddings = self.meanpooling(outputs, inputs['attention_mask']).cpu()
+            embeddings = self.meanpooling(outputs, inputs["attention_mask"]).cpu()
         return embeddings
-    def embed_query(self, text: str) -> List[float]:
+    def embed_query(self, text: str) -> list[float]:
         """
         Generate embeddings for an input text using HuggingFace model.
@@ -109,6 +106,6 @@ class EmbeddingWithHuggingFace(Embeddings):
                 return_tensors="pt",
             ).to(self.device)
             outputs = self.model.to(self.device)(**inputs)
-            embeddings = self.meanpooling(outputs, inputs['attention_mask']).cpu()[0]
+            embeddings = self.meanpooling(outputs, inputs["attention_mask"]).cpu()[0]
         return embeddings

aiagents4pharma/talk2knowledgegraphs/utils/embeddings/nim_molmim.py CHANGED Viewed

@@ -3,14 +3,17 @@ Embedding class using MOLMIM model from NVIDIA NIM.
 """
 import json
-from typing import List
 import requests
 from .embeddings import Embeddings
 class EmbeddingWithMOLMIM(Embeddings):
     """
     Embedding class using MOLMIM model from NVIDIA NIM
     """
     def __init__(self, base_url: str):
         """
         Initialize the EmbeddingWithMOLMIM class.
@@ -21,7 +24,7 @@ class EmbeddingWithMOLMIM(Embeddings):
         # Set base URL
         self.base_url = base_url
-    def embed_documents(self, texts: List[str]) -> List[float]:
+    def embed_documents(self, texts: list[str]) -> list[float]:
         """
         Generate embedding for a list of SMILES strings using MOLMIM model.
@@ -31,16 +34,13 @@ class EmbeddingWithMOLMIM(Embeddings):
         Returns:
             The list of embeddings for the given SMILES strings.
         """
-        headers = {
-            'accept': 'application/json',
-            'Content-Type': 'application/json'
-        }
+        headers = {"accept": "application/json", "Content-Type": "application/json"}
         data = json.dumps({"sequences": texts})
         response = requests.post(self.base_url, headers=headers, data=data, timeout=60)
         embeddings = response.json()["embeddings"]
         return embeddings
-    def embed_query(self, text: str) -> List[float]:
+    def embed_query(self, text: str) -> list[float]:
         """
         Generate embeddings for an input query using MOLMIM model.

aiagents4pharma 1.44.0__py3-none-any.whl → 1.45.1__py3-none-any.whl

aiagents4pharma 1.44.0__py3-none-any.whl → 1.45.1__py3-none-any.whl