PyPI - datarobot-moderations - Versions diffs - 11.1.15__py3-none-any.whl → 11.1.16__py3-none-any.whl - Mend

datarobot-moderations 11.1.15__py3-none-any.whl → 11.1.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6) hide show

datarobot_dome/guard.py CHANGED Viewed

@@ -49,11 +49,13 @@ from datarobot_dome.constants import GuardStage
 from datarobot_dome.constants import GuardTimeoutAction
 from datarobot_dome.constants import GuardType
 from datarobot_dome.constants import OOTBType
+from datarobot_dome.guard_helpers import DEFAULT_OPEN_AI_API_VERSION
 from datarobot_dome.guard_helpers import ModerationDeepEvalLLM
 from datarobot_dome.guard_helpers import get_azure_openai_client
 from datarobot_dome.guard_helpers import get_chat_nvidia_llm
 from datarobot_dome.guard_helpers import get_datarobot_endpoint_and_token
-from datarobot_dome.guard_helpers import try_to_fallback_to_llm_gateway
+from datarobot_dome.guard_helpers import get_llm_gateway_client
+from datarobot_dome.guard_helpers import use_llm_gateway_inference
 from datarobot_dome.guards.guard_llm_mixin import GuardLLMMixin
 MAX_GUARD_NAME_LENGTH = 255
@@ -142,6 +144,7 @@ guard_intervention_trafaret = t.Dict(
 additional_guard_config_trafaret = t.Dict(
     {
         t.Key("cost", to_name="cost", optional=True): t.Or(cost_metric_trafaret, t.Null),
+        t.Key("tool_call", to_name="tool_call", optional=True): t.Or(t.Any(), t.Null),
     }
 )
@@ -484,12 +487,18 @@ class NeMoGuard(Guard, GuardLLMMixin):
         self.openai_api_base = config.get("openai_api_base")
         self.openai_deployment_id = config.get("openai_deployment_id")
         llm_id = None
+        credentials = None
+        use_llm_gateway = use_llm_gateway_inference(self._llm_type)
         try:
             self.openai_api_key = self.get_openai_api_key(config, self._llm_type)
             if self._llm_type != GuardLLMType.NIM and self.openai_api_key is None:
                 raise ValueError("OpenAI API key is required for NeMo Guardrails")
             if self.llm_type == GuardLLMType.OPENAI:
+                credentials = {
+                    "credential_type": "openai",
+                    "api_key": self.openai_api_key,
+                }
                 os.environ["OPENAI_API_KEY"] = self.openai_api_key
                 llm = None
             elif self.llm_type == GuardLLMType.AZURE_OPENAI:
@@ -497,6 +506,12 @@ class NeMoGuard(Guard, GuardLLMMixin):
                     raise ValueError("Azure OpenAI API base url is required for LLM Guard")
                 if self.openai_deployment_id is None:
                     raise ValueError("Azure OpenAI deployment ID is required for LLM Guard")
+                credentials = {
+                    "credential_type": "azure_openai",
+                    "api_base": self.openai_api_base,
+                    "api_version": DEFAULT_OPEN_AI_API_VERSION,
+                    "api_key": self.openai_api_key,
+                }
                 azure_openai_client = get_azure_openai_client(
                     openai_api_key=self.openai_api_key,
                     openai_api_base=self.openai_api_base,
@@ -537,15 +552,20 @@ class NeMoGuard(Guard, GuardLLMMixin):
                 raise ValueError(f"Invalid LLMType: {self.llm_type}")
         except Exception as e:
-            llm = try_to_fallback_to_llm_gateway(
-                # Currently only OPENAI and AZURE_OPENAI are supported by NeMoGuard
-                # For Bedrock and Vertex the model in the config is actually the LLM ID
-                # For OpenAI we use the default model defined in get_llm_gateway_client
-                # For Azure we use the deployment ID
+            # no valid user credentials provided, raise if not using LLM Gateway
+            credentials = None
+            if not use_llm_gateway:
+                raise e
+        if use_llm_gateway:
+            # Currently only OPENAI and AZURE_OPENAI are supported by NeMoGuard
+            # For Bedrock and Vertex the model in the config is actually the LLM ID
+            # For OpenAI we use the default model defined in get_llm_gateway_client
+            # For Azure we use the deployment ID
+            llm = get_llm_gateway_client(
                 llm_id=llm_id,
                 openai_deployment_id=self.openai_deployment_id,
-                llm_type=self.llm_type,
-                e=e,
+                credentials=credentials,
             )
         # Use guard stage to determine whether to read from prompt/response subdirectory

datarobot_dome/guard_helpers.py CHANGED Viewed

@@ -47,7 +47,7 @@ from datarobot_dome.llm import DataRobotLLM
 # but for ROUGE-1 guard, UI allows the user to configure value between
 # 0 and 1, so making scaling factor 1.
 SCALING_FACTOR = 1
-DEFAULT_OPEN_AI_API_VERSION = "2023-03-15-preview"
+DEFAULT_OPEN_AI_API_VERSION = "2024-10-21"
 _logger = logging.getLogger(LOGGER_NAME_PREFIX + ".guard_helpers")
@@ -195,8 +195,10 @@ def get_llm_gateway_client(
     model: str | None = None,
     llm_id: str | None = None,
     openai_deployment_id: str | None = None,
+    credentials: dict | None = None,
 ) -> ChatOpenAI:
     """The LLM gateway client enables chat completions with DR provided credentials and metering.
+    User provided credentials are optional and passed to the completion request as json string.
     Providing model is always required due to openai's chat api.
     llm_id and deployment_id override model if provided.
@@ -208,7 +210,8 @@ def get_llm_gateway_client(
         model=model or "azure/gpt-4o",
         api_key=datarobot_api_token,
         base_url=f"{datarobot_endpoint}/genai/llmgw",
-        max_retries=0,  # retries are handled by the LLM Gateway
+        # retries are handled by the LLM Gateway
+        max_retries=0,
         default_headers={
             # used for metering
             "Client-Id": "moderations",
@@ -217,28 +220,24 @@ def get_llm_gateway_client(
             # optional model overrides
             "deployment_id": openai_deployment_id,
             "llm_id": llm_id,
+            # optional user provided credentials
+            "credential_json": json.dumps(credentials) if credentials else None,
         },
     )
     return client
-def try_to_fallback_to_llm_gateway(
-    llm_id: str | None,
-    openai_deployment_id: str | None,
-    llm_type: GuardLLMType,
-    e: Exception,
-) -> ChatOpenAI:
-    # USE the LLM gateway if its runtime parameter is available and enabled
-    # DO NOT USE the gateway if user provided credentials are specified
-    # which is the case if no exception was raised trying to create the LLM
-    # DATAROBOT and NIM LLM types are not supported by the gateway
-    if not json.loads(os.environ.get("ENABLE_LLM_GATEWAY_INFERENCE", "false")) or llm_type in [
+def use_llm_gateway_inference(llm_type: GuardLLMType):
+    """
+    USE the LLM gateway if its runtime parameter is available and enabled
+    DATAROBOT and NIM LLM types are not supported by the gateway
+    """
+    if json.loads(os.environ.get("ENABLE_LLM_GATEWAY_INFERENCE", "false")) and llm_type not in [
         GuardLLMType.DATAROBOT,
         GuardLLMType.NIM,
     ]:
-        raise e
-    llm = get_llm_gateway_client(llm_id=llm_id, openai_deployment_id=openai_deployment_id)
-    return llm
+        return True
+    return False
 def get_azure_openai_client(

datarobot_dome/guards/guard_llm_mixin.py CHANGED Viewed

@@ -22,11 +22,13 @@ from datarobot_dome.constants import SECRET_DEFINITION_PREFIX
 from datarobot_dome.constants import GuardLLMType
 from datarobot_dome.constants import GuardType
 from datarobot_dome.constants import OOTBType
+from datarobot_dome.guard_helpers import DEFAULT_OPEN_AI_API_VERSION
 from datarobot_dome.guard_helpers import get_azure_openai_client
 from datarobot_dome.guard_helpers import get_bedrock_client
 from datarobot_dome.guard_helpers import get_datarobot_llm
+from datarobot_dome.guard_helpers import get_llm_gateway_client
 from datarobot_dome.guard_helpers import get_vertex_client
-from datarobot_dome.guard_helpers import try_to_fallback_to_llm_gateway
+from datarobot_dome.guard_helpers import use_llm_gateway_inference
 basic_credential_trafaret = t.Dict(
     {
@@ -156,6 +158,8 @@ class GuardLLMMixin:
         openai_api_base = config.get("openai_api_base")
         openai_deployment_id = config.get("openai_deployment_id")
         llm_id = None
+        credentials = None
+        use_llm_gateway = use_llm_gateway_inference(llm_type)
         try:
             if llm_type in [GuardLLMType.OPENAI, GuardLLMType.AZURE_OPENAI]:
                 openai_api_key = self.get_openai_api_key(config, llm_type)
@@ -163,6 +167,10 @@ class GuardLLMMixin:
                     raise ValueError("OpenAI API key is required for Faithfulness guard")
                 if llm_type == GuardLLMType.OPENAI:
+                    credentials = {
+                        "credential_type": "openai",
+                        "api_key": openai_api_key,
+                    }
                     os.environ["OPENAI_API_KEY"] = openai_api_key
                     llm = "default"
                 elif llm_type == GuardLLMType.AZURE_OPENAI:
@@ -170,6 +178,12 @@ class GuardLLMMixin:
                         raise ValueError("OpenAI API base url is required for LLM Guard")
                     if openai_deployment_id is None:
                         raise ValueError("OpenAI deployment ID is required for LLM Guard")
+                    credentials = {
+                        "credential_type": "azure_openai",
+                        "api_key": openai_api_key,
+                        "api_base": openai_api_base,
+                        "api_version": DEFAULT_OPEN_AI_API_VERSION,
+                    }
                     azure_openai_client = get_azure_openai_client(
                         openai_api_key=openai_api_key,
                         openai_api_base=openai_api_base,
@@ -182,9 +196,15 @@ class GuardLLMMixin:
                     raise ValueError("Google model is required for LLM Guard")
                 if config.get("google_region") is None:
                     raise ValueError("Google region is required for LLM Guard")
+                service_account_info = self.get_google_service_account(config)
+                credentials = {
+                    "credential_type": "google_vertex_ai",
+                    "region": config["google_region"],
+                    "service_account_info": service_account_info,
+                }
                 llm = get_vertex_client(
                     google_model=llm_id,
-                    google_service_account=self.get_google_service_account(config),
+                    google_service_account=service_account_info,
                     google_region=config["google_region"],
                 )
             elif llm_type == GuardLLMType.AMAZON:
@@ -194,6 +214,13 @@ class GuardLLMMixin:
                 if config.get("aws_region") is None:
                     raise ValueError("AWS region is required for LLM Guard")
                 credential_config = self.get_aws_account(config)
+                credentials = {
+                    "credential_type": "amazon_bedrock",
+                    "access_key_id": credential_config["aws_access_key_id"],
+                    "secret_access_key": credential_config["aws_secret_access_key"],
+                    "session_token": credential_config["aws_session_token"],
+                    "region": config["aws_region"],
+                }
                 llm = get_bedrock_client(
                     aws_model=llm_id,
                     aws_access_key_id=credential_config["aws_access_key_id"],
@@ -219,14 +246,19 @@ class GuardLLMMixin:
                 raise ValueError(f"Invalid LLMType: {llm_type}")
         except Exception as e:
-            llm = try_to_fallback_to_llm_gateway(
-                # For Bedrock and Vertex the model in the config is actually the LLM ID
-                # For OpenAI we use the default model defined in get_llm_gateway_client
-                # For Azure we use the deployment ID
+            # no valid user credentials provided, raise if not using LLM Gateway
+            credentials = None
+            if not use_llm_gateway:
+                raise e
+        if use_llm_gateway:
+            # For Bedrock and Vertex the model in the config is actually the LLM ID
+            # For OpenAI we use the default model defined in get_llm_gateway_client
+            # For Azure we use the deployment ID
+            llm = get_llm_gateway_client(
                 llm_id=llm_id,
                 openai_deployment_id=openai_deployment_id,
-                llm_type=llm_type,
-                e=e,
+                credentials=credentials,
             )
         return llm

{datarobot_moderations-11.1.15.dist-info → datarobot_moderations-11.1.16.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: datarobot-moderations
-Version: 11.1.15
+Version: 11.1.16
 Summary: DataRobot Monitoring and Moderation framework
 License: DataRobot Tool and Utility Agreement
 Author: DataRobot

{datarobot_moderations-11.1.15.dist-info → datarobot_moderations-11.1.16.dist-info}/RECORD RENAMED Viewed

@@ -3,11 +3,11 @@ datarobot_dome/async_http_client.py,sha256=wkB4irwvnchNGzO1bk2C_HWM-GOSB3AUn5TXK
 datarobot_dome/chat_helper.py,sha256=BzvtUyZSZxzOqq-5a2wQKhHhr2kMlcP1MFrHaDAeD_o,9671
 datarobot_dome/constants.py,sha256=mnSa8rUAha4XlsS2lwPmFCkH2RzfSL_MMkErsWHqIbA,9040
 datarobot_dome/drum_integration.py,sha256=nULpLYVMiS5vihfNUyuq-nvZpgXrQibQbVu2UMAscu8,42102
-datarobot_dome/guard.py,sha256=7T0a1gsWqVmVvEf4SLkVBi8lIRYl8PeMB7TnQGszWtc,32371
+datarobot_dome/guard.py,sha256=1INYx17n9ToiB5bzI-jIReUUuqkK_ucxpOx4jQLts6g,33264
 datarobot_dome/guard_executor.py,sha256=AOI8MZeZETHMoFgBePe0wa2vE9d2975MYQnEDHLZL7s,35462
-datarobot_dome/guard_helpers.py,sha256=YHhSUSuvxAgDdWPXiwYiHtrl-6ZlObE9n6CjYPQNSuA,16375
+datarobot_dome/guard_helpers.py,sha256=Bfdi8gow2_TAVzRHYUDqEfcG5bWx2KR1dnpxt9E850Y,16311
 datarobot_dome/guards/__init__.py,sha256=B5Rx8_CNCNsOpxBbRj27XOXCfRZmvmrAR-NzlzIKnDw,583
-datarobot_dome/guards/guard_llm_mixin.py,sha256=ON-zuVL3xhQmXv0rFkalWrW_Q67Wwya2IQerHO8WkKU,10694
+datarobot_dome/guards/guard_llm_mixin.py,sha256=VovlpNZjWIGamF4SSvLF5lzOFyApH5IoOiB_qtCmRg0,12216
 datarobot_dome/llm.py,sha256=L02OvTrflmD34-FrfXebfF-zzKTeuin7fpne1Cl5psg,5719
 datarobot_dome/metrics/__init__.py,sha256=B5Rx8_CNCNsOpxBbRj27XOXCfRZmvmrAR-NzlzIKnDw,583
 datarobot_dome/metrics/citation_metrics.py,sha256=q0hTMWuk6wy_jqk2UjFPON3kU94HN3W2vxr9giJ8O8E,3544
@@ -18,6 +18,6 @@ datarobot_dome/pipeline/llm_pipeline.py,sha256=fOp_OJnQMDUJH-LKv12kEqli-EqfHjAiS
 datarobot_dome/pipeline/pipeline.py,sha256=_pZ_4K2LMnfYCYj_ur9EwJzo3T-pbO6lFYz1O-_3uQ4,16491
 datarobot_dome/pipeline/vdb_pipeline.py,sha256=WTOGn1qe_ZvEcdlvHgeXxl2xTqp7GjfL13c6S-FmAfM,5146
 datarobot_dome/streaming.py,sha256=6nYvh6SoxPRLfO6GGdEoHsQuyLP9oX1lDMe8IeGo4lw,17801
-datarobot_moderations-11.1.15.dist-info/METADATA,sha256=zHt26VnmHpn-0cL-egKPqdcTvKPTittBNtVHLVylbHo,4827
-datarobot_moderations-11.1.15.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
-datarobot_moderations-11.1.15.dist-info/RECORD,,
+datarobot_moderations-11.1.16.dist-info/METADATA,sha256=WBOhNlF-pwpbJ2PvlkhwqlKbF3vtWkbNdu6vjqvmvaQ,4827
+datarobot_moderations-11.1.16.dist-info/WHEEL,sha256=b4K_helf-jlQoXBBETfwnf4B04YC67LOev0jo4fX5m8,88
+datarobot_moderations-11.1.16.dist-info/RECORD,,

{datarobot_moderations-11.1.15.dist-info → datarobot_moderations-11.1.16.dist-info}/WHEEL RENAMED Viewed

File without changes

datarobot-moderations 11.1.15__py3-none-any.whl → 11.1.16__py3-none-any.whl

datarobot-moderations 11.1.15__py3-none-any.whl → 11.1.16__py3-none-any.whl