nvidia-nat-llama-index 1.3.dev0__py3-none-any.whl → 1.3.0rc1__py3-none-any.whl

This diff compares two publicly released versions of the package as they appear in their respective public registries. It is provided for informational purposes only.
nat/plugins/llama_index/embedder.py
@@ -12,28 +12,58 @@
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
-# pylint: disable=unused-argument
 
 from nat.builder.builder import Builder
 from nat.builder.framework_enum import LLMFrameworkEnum
 from nat.cli.register_workflow import register_embedder_client
 from nat.data_models.retry_mixin import RetryMixin
+from nat.embedder.azure_openai_embedder import AzureOpenAIEmbedderModelConfig
 from nat.embedder.nim_embedder import NIMEmbedderModelConfig
+from nat.embedder.openai_embedder import OpenAIEmbedderModelConfig
 from nat.utils.exception_handlers.automatic_retries import patch_with_retry
 
 
+@register_embedder_client(config_type=AzureOpenAIEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def azure_openai_llama_index(embedder_config: AzureOpenAIEmbedderModelConfig, _builder: Builder):
+
+    from llama_index.embeddings.azure_openai import AzureOpenAIEmbedding
+
+    client = AzureOpenAIEmbedding(**embedder_config.model_dump(exclude={"type"}, by_alias=True, exclude_none=True))
+
+    if isinstance(embedder_config, RetryMixin):
+        client = patch_with_retry(client,
+                                  retries=embedder_config.num_retries,
+                                  retry_codes=embedder_config.retry_on_status_codes,
+                                  retry_on_messages=embedder_config.retry_on_errors)
+
+    yield client
+
+
 @register_embedder_client(config_type=NIMEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
-async def nim_llamaindex(embedder_config: NIMEmbedderModelConfig, builder: Builder):
+async def nim_llama_index(embedder_config: NIMEmbedderModelConfig, _builder: Builder):
 
     from llama_index.embeddings.nvidia import NVIDIAEmbedding  # pylint: disable=no-name-in-module
 
-    config_obj = {
-        **embedder_config.model_dump(exclude={"type", "model_name"}, by_alias=True),
-        "model":
-            embedder_config.model_name,
-    }
+    client = NVIDIAEmbedding(
+        **embedder_config.model_dump(exclude={"type", "model_name"}, by_alias=True, exclude_none=True),
+        model=embedder_config.model_name,
+    )
+
+    if isinstance(embedder_config, RetryMixin):
+        client = patch_with_retry(client,
+                                  retries=embedder_config.num_retries,
+                                  retry_codes=embedder_config.retry_on_status_codes,
+                                  retry_on_messages=embedder_config.retry_on_errors)
+
+    yield client
+
+
+@register_embedder_client(config_type=OpenAIEmbedderModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def openai_llama_index(embedder_config: OpenAIEmbedderModelConfig, _builder: Builder):
+
+    from llama_index.embeddings.openai import OpenAIEmbedding
 
-    client = NVIDIAEmbedding(**config_obj)
+    client = OpenAIEmbedding(**embedder_config.model_dump(exclude={"type"}, by_alias=True, exclude_none=True))
 
     if isinstance(embedder_config, RetryMixin):
         client = patch_with_retry(client,
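
Note: every embedder client above follows the same pattern: the Pydantic config is serialized with model_dump(exclude={"type"}, by_alias=True, exclude_none=True) and the resulting dict is splatted into the framework constructor. A minimal sketch of what those flags do, using a hypothetical stand-in config (DemoEmbedderConfig and its fields are illustrative, not the actual NAT models):

    from pydantic import BaseModel, Field

    # Hypothetical stand-in for an embedder config. "type" acts as the
    # discriminator and is stripped before client construction.
    class DemoEmbedderConfig(BaseModel):
        model_config = {"populate_by_name": True, "protected_namespaces": ()}

        type: str = "demo"
        model_name: str = Field(alias="model")   # serialized under its alias
        api_key: str | None = None               # dropped when left unset

    cfg = DemoEmbedderConfig(model_name="nv-embedqa")

    # exclude={"type"} drops the discriminator, by_alias=True renames
    # model_name -> model, and exclude_none=True omits unset optional fields.
    kwargs = cfg.model_dump(exclude={"type"}, by_alias=True, exclude_none=True)
    assert kwargs == {"model": "nv-embedqa"}

The added exclude_none=True is what replaces the old manual del of None-valued keys such as base_url, visible in the llm.py hunk below.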
nat/plugins/llama_index/llm.py
@@ -13,71 +13,97 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
+from collections.abc import Sequence
+from typing import TypeVar
+
 from nat.builder.builder import Builder
 from nat.builder.framework_enum import LLMFrameworkEnum
 from nat.cli.register_workflow import register_llm_client
+from nat.data_models.llm import LLMBaseConfig
 from nat.data_models.retry_mixin import RetryMixin
+from nat.data_models.thinking_mixin import ThinkingMixin
 from nat.llm.aws_bedrock_llm import AWSBedrockModelConfig
+from nat.llm.azure_openai_llm import AzureOpenAIModelConfig
 from nat.llm.nim_llm import NIMModelConfig
 from nat.llm.openai_llm import OpenAIModelConfig
+from nat.llm.utils.thinking import BaseThinkingInjector
+from nat.llm.utils.thinking import FunctionArgumentWrapper
+from nat.llm.utils.thinking import patch_with_thinking
 from nat.utils.exception_handlers.automatic_retries import patch_with_retry
+from nat.utils.type_utils import override
 
+ModelType = TypeVar("ModelType")
 
-@register_llm_client(config_type=NIMModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
-async def nim_llama_index(llm_config: NIMModelConfig, builder: Builder):
 
-    from llama_index.llms.nvidia import NVIDIA
+def _patch_llm_based_on_config(client: ModelType, llm_config: LLMBaseConfig) -> ModelType:
 
-    kwargs = llm_config.model_dump(exclude={"type"}, by_alias=True)
+    from llama_index.core.base.llms.types import ChatMessage
 
-    if ("base_url" in kwargs and kwargs["base_url"] is None):
-        del kwargs["base_url"]
+    class LlamaIndexThinkingInjector(BaseThinkingInjector):
 
-    llm = NVIDIA(**kwargs)
+        @override
+        def inject(self, messages: Sequence[ChatMessage], *args, **kwargs) -> FunctionArgumentWrapper:
+            new_messages = [ChatMessage(role="system", content=self.system_prompt)] + list(messages)
+            return FunctionArgumentWrapper(new_messages, *args, **kwargs)
 
     if isinstance(llm_config, RetryMixin):
-        llm = patch_with_retry(llm,
-                               retries=llm_config.num_retries,
-                               retry_codes=llm_config.retry_on_status_codes,
-                               retry_on_messages=llm_config.retry_on_errors)
+        client = patch_with_retry(client,
+                                  retries=llm_config.num_retries,
+                                  retry_codes=llm_config.retry_on_status_codes,
+                                  retry_on_messages=llm_config.retry_on_errors)
+
+    if isinstance(llm_config, ThinkingMixin) and llm_config.thinking_system_prompt is not None:
+        client = patch_with_thinking(
+            client,
+            LlamaIndexThinkingInjector(
+                system_prompt=llm_config.thinking_system_prompt,
+                function_names=[
+                    "chat",
+                    "stream_chat",
+                    "achat",
+                    "astream_chat",
+                ],
+            ))
+
+    return client
 
-    yield llm
 
+@register_llm_client(config_type=AWSBedrockModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def aws_bedrock_llama_index(llm_config: AWSBedrockModelConfig, _builder: Builder):
 
-@register_llm_client(config_type=OpenAIModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
-async def openai_llama_index(llm_config: OpenAIModelConfig, builder: Builder):
+    from llama_index.llms.bedrock import Bedrock
 
-    from llama_index.llms.openai import OpenAI
+    # LlamaIndex uses context_size instead of max_tokens
+    llm = Bedrock(**llm_config.model_dump(exclude={"type", "top_p", "thinking"}, by_alias=True))
 
-    kwargs = llm_config.model_dump(exclude={"type"}, by_alias=True)
+    yield _patch_llm_based_on_config(llm, llm_config)
 
-    if ("base_url" in kwargs and kwargs["base_url"] is None):
-        del kwargs["base_url"]
 
-    llm = OpenAI(**kwargs)
+@register_llm_client(config_type=AzureOpenAIModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def azure_openai_llama_index(llm_config: AzureOpenAIModelConfig, _builder: Builder):
 
-    if isinstance(llm_config, RetryMixin):
-        llm = patch_with_retry(llm,
-                               retries=llm_config.num_retries,
-                               retry_codes=llm_config.retry_on_status_codes,
-                               retry_on_messages=llm_config.retry_on_errors)
+    from llama_index.llms.azure_openai import AzureOpenAI
 
-    yield llm
+    llm = AzureOpenAI(**llm_config.model_dump(exclude={"type", "thinking"}, by_alias=True))
 
+    yield _patch_llm_based_on_config(llm, llm_config)
 
-@register_llm_client(config_type=AWSBedrockModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
-async def aws_bedrock_llama_index(llm_config: AWSBedrockModelConfig, builder: Builder):
 
-    from llama_index.llms.bedrock import Bedrock
+@register_llm_client(config_type=NIMModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def nim_llama_index(llm_config: NIMModelConfig, _builder: Builder):
 
-    kwargs = llm_config.model_dump(exclude={"type", "max_tokens"}, by_alias=True)
+    from llama_index.llms.nvidia import NVIDIA
 
-    llm = Bedrock(**kwargs)
+    llm = NVIDIA(**llm_config.model_dump(exclude={"type", "thinking"}, by_alias=True, exclude_none=True))
 
-    if isinstance(llm_config, RetryMixin):
-        llm = patch_with_retry(llm,
-                               retries=llm_config.num_retries,
-                               retry_codes=llm_config.retry_on_status_codes,
-                               retry_on_messages=llm_config.retry_on_errors)
+    yield _patch_llm_based_on_config(llm, llm_config)
+
+
+@register_llm_client(config_type=OpenAIModelConfig, wrapper_type=LLMFrameworkEnum.LLAMA_INDEX)
+async def openai_llama_index(llm_config: OpenAIModelConfig, _builder: Builder):
+
+    from llama_index.llms.openai import OpenAI
+
+    llm = OpenAI(**llm_config.model_dump(exclude={"type", "thinking"}, by_alias=True, exclude_none=True))
 
-    yield llm
+    yield _patch_llm_based_on_config(llm, llm_config)
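
The new _patch_llm_based_on_config helper applies up to two wrappers to a freshly built client: retry patching, as before, and, when the config carries a thinking_system_prompt, injection of that prompt as a leading system message on the chat entry points (chat, stream_chat, achat, astream_chat). A rough sketch of the injection idea against plain callables; wrap_with_system_prompt, the dict-shaped messages, and the messages-first calling convention are assumptions for illustration, not the NAT API:

    from functools import wraps

    def wrap_with_system_prompt(client, method_names, system_prompt):
        """Shadow each named method with a version that prepends a system message."""
        for name in method_names:
            original = getattr(client, name)

            @wraps(original)
            def patched(messages, *args, _original=original, **kwargs):
                # The real injector builds a framework ChatMessage; plain dicts
                # stand in here to keep the sketch self-contained.
                injected = [{"role": "system", "content": system_prompt}, *messages]
                return _original(injected, *args, **kwargs)

            setattr(client, name, patched)
        return client

Binding _original as a default argument avoids the classic late-binding bug when patching several methods in one loop.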
nat/plugins/llama_index/register.py
@@ -13,12 +13,11 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
-# pylint: disable=unused-import
 # flake8: noqa
 # isort:skip_file
 
 # Import any providers which need to be automatically registered here
 
+from . import embedder
 from . import llm
 from . import tool_wrapper
-from . import embedder
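
Importing the submodules is all register.py needs to do: each @register_llm_client / @register_embedder_client decorator runs at import time and records its factory in a registry keyed by config type. Schematically (REGISTRY and register_client are illustrative names, not the nat.cli.register_workflow API):

    # Toy registry showing why a bare import is enough to register providers.
    REGISTRY: dict[type, object] = {}

    def register_client(config_type: type):
        def decorator(fn):
            REGISTRY[config_type] = fn  # side effect fires at import time
            return fn
        return decorator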
nvidia_nat_llama_index-1.3.0rc1.dist-info/METADATA
@@ -1,18 +1,25 @@
 Metadata-Version: 2.4
 Name: nvidia-nat-llama-index
-Version: 1.3.dev0
+Version: 1.3.0rc1
 Summary: Subpackage for Llama-Index integration in NeMo Agent toolkit
 Keywords: ai,rag,agents
 Classifier: Programming Language :: Python
-Requires-Python: <3.13,>=3.11
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Requires-Python: <3.14,>=3.11
 Description-Content-Type: text/markdown
-Requires-Dist: nvidia-nat==v1.3-dev
-Requires-Dist: llama-index-core==0.12.21
-Requires-Dist: llama-index-embeddings-nvidia==0.3.1
-Requires-Dist: llama-index-llms-bedrock==0.3.8
-Requires-Dist: llama-index-llms-nvidia==0.3.1
-Requires-Dist: llama-index-readers-file==0.4.4
-Requires-Dist: llama-index==0.12.21
+Requires-Dist: nvidia-nat==v1.3.0-rc1
+Requires-Dist: llama-index-core~=0.12.21
+Requires-Dist: llama-index-embeddings-azure-openai~=0.3.9
+Requires-Dist: llama-index-embeddings-nvidia~=0.3.1
+Requires-Dist: llama-index-embeddings-openai~=0.3.1
+Requires-Dist: llama-index-llms-azure-openai~=0.3.2
+Requires-Dist: llama-index-llms-bedrock~=0.3.8
+Requires-Dist: llama-index-llms-nvidia~=0.3.1
+Requires-Dist: llama-index-llms-openai~=0.3.42
+Requires-Dist: llama-index-readers-file~=0.4.4
+Requires-Dist: llama-index~=0.12.21
 
 <!--
 SPDX-FileCopyrightText: Copyright (c) 2025, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
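
Besides the new Azure and OpenAI extras, the pins loosen from exact == versions to PEP 440 compatible-release specifiers: ~=0.12.21 means >=0.12.21 together with ==0.12.*, so later patch releases are accepted and the next minor release is not. This can be checked with the packaging library:

    from packaging.specifiers import SpecifierSet

    spec = SpecifierSet("~=0.12.21")   # equivalent to >=0.12.21, ==0.12.*
    assert "0.12.30" in spec           # later patches satisfy the pin
    assert "0.13.0" not in spec        # the next minor release does not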
nvidia_nat_llama_index-1.3.0rc1.dist-info/RECORD
@@ -0,0 +1,11 @@
+nat/meta/pypi.md,sha256=s9C3pgWB0HLIXTx5QPryNOWN0O2fIRIap0p9_zCHlTs,1112
+nat/plugins/llama_index/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+nat/plugins/llama_index/embedder.py,sha256=4c4uAa19UArqA_Npe5mwEnUhCaguTbyWcAntBzcPEeQ,3493
+nat/plugins/llama_index/llm.py,sha256=0M1m1sjGwVMNibiAzkH2_hnAfdC-Ptc6PM9IKDmfSL8,4500
+nat/plugins/llama_index/register.py,sha256=1x_b8u6cuQwh4Iz_7TcIFWXvLIL9IIKUPE-zR9d6ug8,859
+nat/plugins/llama_index/tool_wrapper.py,sha256=VFKMIIeLdWqHwW2Ax11E2w-_9w3ow6Iuhra1Hk78RYM,1387
+nvidia_nat_llama_index-1.3.0rc1.dist-info/METADATA,sha256=RwXDLjxwnnOjiWB-XC5y6olMd0ckHTzRIDlE3SAafyg,2058
+nvidia_nat_llama_index-1.3.0rc1.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+nvidia_nat_llama_index-1.3.0rc1.dist-info/entry_points.txt,sha256=2LqRRju5448P2v8B3y6TSPnk-nOd5T3AmV5JibCnoQc,68
+nvidia_nat_llama_index-1.3.0rc1.dist-info/top_level.txt,sha256=8-CJ2cP6-f0ZReXe5Hzqp-5pvzzHz-5Ds5H2bGqh1-U,4
+nvidia_nat_llama_index-1.3.0rc1.dist-info/RECORD,,
nvidia_nat_llama_index-1.3.dev0.dist-info/RECORD
@@ -1,11 +0,0 @@
-nat/meta/pypi.md,sha256=s9C3pgWB0HLIXTx5QPryNOWN0O2fIRIap0p9_zCHlTs,1112
-nat/plugins/llama_index/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-nat/plugins/llama_index/embedder.py,sha256=L7Wx9QJH2Sh0y6kmgisjtTZfDC9YcuuusKl0Tn_7JgA,1921
-nat/plugins/llama_index/llm.py,sha256=VyuIqks2G9Zcs9a0X7jJyASzSUdtL0Pns0v4_rFEsJE,3220
-nat/plugins/llama_index/register.py,sha256=DelI6uth8dO8h_7czPW4Akfr_ajXDBwhEa1dJzRf5u4,891
-nat/plugins/llama_index/tool_wrapper.py,sha256=VFKMIIeLdWqHwW2Ax11E2w-_9w3ow6Iuhra1Hk78RYM,1387
-nvidia_nat_llama_index-1.3.dev0.dist-info/METADATA,sha256=EP1nCqjUnjLBuvlh_JKpFIG_rebxwmKzo0MjDejM0MY,1694
-nvidia_nat_llama_index-1.3.dev0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-nvidia_nat_llama_index-1.3.dev0.dist-info/entry_points.txt,sha256=2LqRRju5448P2v8B3y6TSPnk-nOd5T3AmV5JibCnoQc,68
-nvidia_nat_llama_index-1.3.dev0.dist-info/top_level.txt,sha256=8-CJ2cP6-f0ZReXe5Hzqp-5pvzzHz-5Ds5H2bGqh1-U,4
-nvidia_nat_llama_index-1.3.dev0.dist-info/RECORD,,
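
For reference when reading the RECORD hunks above: each row is path,sha256=<digest>,size, where the digest is the urlsafe base64 of the file's SHA-256 with trailing '=' padding stripped (the RECORD file itself carries no hash, hence the trailing ',,'). A small sketch for recomputing one entry:

    import base64
    import hashlib

    def record_digest(path: str) -> str:
        """Recompute the sha256= token of a wheel RECORD row for verification."""
        with open(path, "rb") as f:
            digest = hashlib.sha256(f.read()).digest()
        return "sha256=" + base64.urlsafe_b64encode(digest).rstrip(b"=").decode()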