PyPI - clarifai - Versions diffs - 11.3.0rc2__py3-none-any.whl → 11.4.0__py3-none-any.whl - Mend

clarifai 11.3.0rc2__py3-none-any.whl → 11.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (300)

clarifai/__init__.py +1 -1
clarifai/cli/__main__.py +1 -1
clarifai/cli/base.py +144 -136
clarifai/cli/compute_cluster.py +45 -31
clarifai/cli/deployment.py +93 -76
clarifai/cli/model.py +578 -180
clarifai/cli/nodepool.py +100 -82
clarifai/client/__init__.py +12 -2
clarifai/client/app.py +973 -911
clarifai/client/auth/helper.py +345 -342
clarifai/client/auth/register.py +7 -7
clarifai/client/auth/stub.py +107 -106
clarifai/client/base.py +185 -178
clarifai/client/compute_cluster.py +214 -180
clarifai/client/dataset.py +793 -698
clarifai/client/deployment.py +55 -50
clarifai/client/input.py +1223 -1088
clarifai/client/lister.py +47 -45
clarifai/client/model.py +1939 -1717
clarifai/client/model_client.py +525 -502
clarifai/client/module.py +82 -73
clarifai/client/nodepool.py +358 -213
clarifai/client/runner.py +58 -0
clarifai/client/search.py +342 -309
clarifai/client/user.py +419 -414
clarifai/client/workflow.py +294 -274
clarifai/constants/dataset.py +11 -17
clarifai/constants/model.py +8 -2
clarifai/datasets/export/inputs_annotations.py +233 -217
clarifai/datasets/upload/base.py +63 -51
clarifai/datasets/upload/features.py +43 -38
clarifai/datasets/upload/image.py +237 -207
clarifai/datasets/upload/loaders/coco_captions.py +34 -32
clarifai/datasets/upload/loaders/coco_detection.py +72 -65
clarifai/datasets/upload/loaders/imagenet_classification.py +57 -53
clarifai/datasets/upload/loaders/xview_detection.py +274 -132
clarifai/datasets/upload/multimodal.py +55 -46
clarifai/datasets/upload/text.py +55 -47
clarifai/datasets/upload/utils.py +250 -234
clarifai/errors.py +51 -50
clarifai/models/api.py +260 -238
clarifai/modules/css.py +50 -50
clarifai/modules/pages.py +33 -33
clarifai/rag/rag.py +312 -288
clarifai/rag/utils.py +91 -84
clarifai/runners/models/model_builder.py +906 -802
clarifai/runners/models/model_class.py +370 -331
clarifai/runners/models/model_run_locally.py +459 -419
clarifai/runners/models/model_runner.py +170 -162
clarifai/runners/models/model_servicer.py +78 -70
clarifai/runners/server.py +111 -101
clarifai/runners/utils/code_script.py +225 -187
clarifai/runners/utils/const.py +4 -1
clarifai/runners/utils/data_types/__init__.py +12 -0
clarifai/runners/utils/data_types/data_types.py +598 -0
clarifai/runners/utils/data_utils.py +387 -440
clarifai/runners/utils/loader.py +247 -227
clarifai/runners/utils/method_signatures.py +411 -386
clarifai/runners/utils/openai_convertor.py +108 -109
clarifai/runners/utils/serializers.py +175 -179
clarifai/runners/utils/url_fetcher.py +35 -35
clarifai/schema/search.py +56 -63
clarifai/urls/helper.py +125 -102
clarifai/utils/cli.py +129 -123
clarifai/utils/config.py +127 -87
clarifai/utils/constants.py +49 -0
clarifai/utils/evaluation/helpers.py +503 -466
clarifai/utils/evaluation/main.py +431 -393
clarifai/utils/evaluation/testset_annotation_parser.py +154 -144
clarifai/utils/logging.py +324 -306
clarifai/utils/misc.py +60 -56
clarifai/utils/model_train.py +165 -146
clarifai/utils/protobuf.py +126 -103
clarifai/versions.py +3 -1
clarifai/workflows/export.py +48 -50
clarifai/workflows/utils.py +39 -36
clarifai/workflows/validate.py +55 -43
{clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/METADATA +16 -6
clarifai-11.4.0.dist-info/RECORD +109 -0
{clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/WHEEL +1 -1
clarifai/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/__pycache__/errors.cpython-310.pyc +0 -0
clarifai/__pycache__/errors.cpython-311.pyc +0 -0
clarifai/__pycache__/versions.cpython-310.pyc +0 -0
clarifai/__pycache__/versions.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/base.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/base.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/base_cli.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/compute_cluster.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/compute_cluster.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/deployment.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/deployment.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/model.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/model.cpython-311.pyc +0 -0
clarifai/cli/__pycache__/model_cli.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/nodepool.cpython-310.pyc +0 -0
clarifai/cli/__pycache__/nodepool.cpython-311.pyc +0 -0
clarifai/client/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/client/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/client/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/client/__pycache__/app.cpython-310.pyc +0 -0
clarifai/client/__pycache__/app.cpython-311.pyc +0 -0
clarifai/client/__pycache__/app.cpython-39.pyc +0 -0
clarifai/client/__pycache__/base.cpython-310.pyc +0 -0
clarifai/client/__pycache__/base.cpython-311.pyc +0 -0
clarifai/client/__pycache__/compute_cluster.cpython-310.pyc +0 -0
clarifai/client/__pycache__/compute_cluster.cpython-311.pyc +0 -0
clarifai/client/__pycache__/dataset.cpython-310.pyc +0 -0
clarifai/client/__pycache__/dataset.cpython-311.pyc +0 -0
clarifai/client/__pycache__/deployment.cpython-310.pyc +0 -0
clarifai/client/__pycache__/deployment.cpython-311.pyc +0 -0
clarifai/client/__pycache__/input.cpython-310.pyc +0 -0
clarifai/client/__pycache__/input.cpython-311.pyc +0 -0
clarifai/client/__pycache__/lister.cpython-310.pyc +0 -0
clarifai/client/__pycache__/lister.cpython-311.pyc +0 -0
clarifai/client/__pycache__/model.cpython-310.pyc +0 -0
clarifai/client/__pycache__/model.cpython-311.pyc +0 -0
clarifai/client/__pycache__/module.cpython-310.pyc +0 -0
clarifai/client/__pycache__/module.cpython-311.pyc +0 -0
clarifai/client/__pycache__/nodepool.cpython-310.pyc +0 -0
clarifai/client/__pycache__/nodepool.cpython-311.pyc +0 -0
clarifai/client/__pycache__/search.cpython-310.pyc +0 -0
clarifai/client/__pycache__/search.cpython-311.pyc +0 -0
clarifai/client/__pycache__/user.cpython-310.pyc +0 -0
clarifai/client/__pycache__/user.cpython-311.pyc +0 -0
clarifai/client/__pycache__/workflow.cpython-310.pyc +0 -0
clarifai/client/__pycache__/workflow.cpython-311.pyc +0 -0
clarifai/client/auth/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/client/auth/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/client/auth/__pycache__/helper.cpython-310.pyc +0 -0
clarifai/client/auth/__pycache__/helper.cpython-311.pyc +0 -0
clarifai/client/auth/__pycache__/register.cpython-310.pyc +0 -0
clarifai/client/auth/__pycache__/register.cpython-311.pyc +0 -0
clarifai/client/auth/__pycache__/stub.cpython-310.pyc +0 -0
clarifai/client/auth/__pycache__/stub.cpython-311.pyc +0 -0
clarifai/client/cli/__init__.py +0 -0
clarifai/client/cli/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/client/cli/__pycache__/base_cli.cpython-310.pyc +0 -0
clarifai/client/cli/__pycache__/model_cli.cpython-310.pyc +0 -0
clarifai/client/cli/base_cli.py +0 -88
clarifai/client/cli/model_cli.py +0 -29
clarifai/constants/__pycache__/base.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/base.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/dataset.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/dataset.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/input.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/input.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/model.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/model.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/rag.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/rag.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/search.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/search.cpython-311.pyc +0 -0
clarifai/constants/__pycache__/workflow.cpython-310.pyc +0 -0
clarifai/constants/__pycache__/workflow.cpython-311.pyc +0 -0
clarifai/datasets/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/datasets/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/datasets/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/datasets/export/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/datasets/export/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/datasets/export/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/datasets/export/__pycache__/inputs_annotations.cpython-310.pyc +0 -0
clarifai/datasets/export/__pycache__/inputs_annotations.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/datasets/upload/__pycache__/base.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/base.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/features.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/features.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/image.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/image.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/multimodal.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/multimodal.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/text.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/text.cpython-311.pyc +0 -0
clarifai/datasets/upload/__pycache__/utils.cpython-310.pyc +0 -0
clarifai/datasets/upload/__pycache__/utils.cpython-311.pyc +0 -0
clarifai/datasets/upload/loaders/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/datasets/upload/loaders/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/datasets/upload/loaders/__pycache__/coco_detection.cpython-311.pyc +0 -0
clarifai/datasets/upload/loaders/__pycache__/imagenet_classification.cpython-311.pyc +0 -0
clarifai/models/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/modules/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/rag/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/rag/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/rag/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/rag/__pycache__/rag.cpython-310.pyc +0 -0
clarifai/rag/__pycache__/rag.cpython-311.pyc +0 -0
clarifai/rag/__pycache__/rag.cpython-39.pyc +0 -0
clarifai/rag/__pycache__/utils.cpython-310.pyc +0 -0
clarifai/rag/__pycache__/utils.cpython-311.pyc +0 -0
clarifai/runners/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/runners/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/runners/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/runners/dockerfile_template/Dockerfile.cpu.template +0 -31
clarifai/runners/dockerfile_template/Dockerfile.cuda.template +0 -42
clarifai/runners/dockerfile_template/Dockerfile.nim +0 -71
clarifai/runners/models/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/runners/models/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/runners/models/__pycache__/base_typed_model.cpython-310.pyc +0 -0
clarifai/runners/models/__pycache__/base_typed_model.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/base_typed_model.cpython-39.pyc +0 -0
clarifai/runners/models/__pycache__/model_builder.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/model_class.cpython-310.pyc +0 -0
clarifai/runners/models/__pycache__/model_class.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/model_run_locally.cpython-310-pytest-7.1.2.pyc +0 -0
clarifai/runners/models/__pycache__/model_run_locally.cpython-310.pyc +0 -0
clarifai/runners/models/__pycache__/model_run_locally.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/model_runner.cpython-310.pyc +0 -0
clarifai/runners/models/__pycache__/model_runner.cpython-311.pyc +0 -0
clarifai/runners/models/__pycache__/model_upload.cpython-310.pyc +0 -0
clarifai/runners/models/base_typed_model.py +0 -238
clarifai/runners/models/model_class_refract.py +0 -80
clarifai/runners/models/model_upload.py +0 -607
clarifai/runners/models/temp.py +0 -25
clarifai/runners/utils/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/__init__.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/buffered_stream.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/buffered_stream.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/buffered_stream.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/const.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/const.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/constants.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/constants.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/constants.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/data_handler.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/data_handler.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/data_handler.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/data_handler.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/data_utils.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/data_utils.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/data_utils.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/data_utils.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/grpc_server.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/grpc_server.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/grpc_server.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/health.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/health.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/health.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/loader.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/loader.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/logging.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/logging.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/logging.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/stream_source.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/stream_source.cpython-39.pyc +0 -0
clarifai/runners/utils/__pycache__/url_fetcher.cpython-310.pyc +0 -0
clarifai/runners/utils/__pycache__/url_fetcher.cpython-311.pyc +0 -0
clarifai/runners/utils/__pycache__/url_fetcher.cpython-38.pyc +0 -0
clarifai/runners/utils/__pycache__/url_fetcher.cpython-39.pyc +0 -0
clarifai/runners/utils/data_handler.py +0 -231
clarifai/runners/utils/data_handler_refract.py +0 -213
clarifai/runners/utils/data_types.py +0 -469
clarifai/runners/utils/logger.py +0 -0
clarifai/runners/utils/openai_format.py +0 -87
clarifai/schema/__pycache__/search.cpython-310.pyc +0 -0
clarifai/schema/__pycache__/search.cpython-311.pyc +0 -0
clarifai/urls/__pycache__/helper.cpython-310.pyc +0 -0
clarifai/urls/__pycache__/helper.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/utils/__pycache__/cli.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/cli.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/config.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/constants.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/constants.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/logging.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/logging.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/misc.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/misc.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/model_train.cpython-310.pyc +0 -0
clarifai/utils/__pycache__/model_train.cpython-311.pyc +0 -0
clarifai/utils/__pycache__/protobuf.cpython-311.pyc +0 -0
clarifai/utils/evaluation/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/utils/evaluation/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/utils/evaluation/__pycache__/helpers.cpython-311.pyc +0 -0
clarifai/utils/evaluation/__pycache__/main.cpython-311.pyc +0 -0
clarifai/utils/evaluation/__pycache__/main.cpython-39.pyc +0 -0
clarifai/workflows/__pycache__/__init__.cpython-310.pyc +0 -0
clarifai/workflows/__pycache__/__init__.cpython-311.pyc +0 -0
clarifai/workflows/__pycache__/__init__.cpython-39.pyc +0 -0
clarifai/workflows/__pycache__/export.cpython-310.pyc +0 -0
clarifai/workflows/__pycache__/export.cpython-311.pyc +0 -0
clarifai/workflows/__pycache__/utils.cpython-310.pyc +0 -0
clarifai/workflows/__pycache__/utils.cpython-311.pyc +0 -0
clarifai/workflows/__pycache__/validate.cpython-310.pyc +0 -0
clarifai/workflows/__pycache__/validate.cpython-311.pyc +0 -0
clarifai-11.3.0rc2.dist-info/RECORD +0 -322
{clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/entry_points.txt +0 -0
{clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info/licenses}/LICENSE +0 -0
{clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/top_level.txt +0 -0

clarifai/client/model_client.py CHANGED Viewed

@@ -9,20 +9,24 @@ from clarifai.constants.model import MAX_MODEL_PREDICT_INPUTS
 from clarifai.errors import UserError
 from clarifai.runners.utils import code_script, method_signatures
 from clarifai.runners.utils.data_utils import is_openai_chat_format
-from clarifai.runners.utils.method_signatures import (CompatibilitySerializer, deserialize,
-                                                      get_stream_from_signature, serialize,
-                                                      signatures_from_json)
+from clarifai.runners.utils.method_signatures import (
+    CompatibilitySerializer,
+    deserialize,
+    get_stream_from_signature,
+    serialize,
+    signatures_from_json,
+)
 from clarifai.utils.logging import logger
 from clarifai.utils.misc import BackoffIterator, status_is_retryable
 class ModelClient:
-  '''
-  Client for calling model predict, generate, and stream methods.
-  '''
-  def __init__(self, stub, request_template: service_pb2.PostModelOutputsRequest = None):
     '''
+    Client for calling model predict, generate, and stream methods.
+    '''
+    def __init__(self, stub, request_template: service_pb2.PostModelOutputsRequest = None):
+        '''
         Initialize the model client.
         Args:
@@ -30,501 +34,520 @@ class ModelClient:
             request_template: The template for the request to send to the model, including
             common fields like model_id, model_version, cluster, etc.
         '''
-    self.STUB = stub
-    self.request_template = request_template or service_pb2.PostModelOutputsRequest()
-    self._method_signatures = None
-    self._defined = False
+        self.STUB = stub
+        self.request_template = request_template or service_pb2.PostModelOutputsRequest()
+        self._method_signatures = None
+        self._defined = False
-  def fetch(self):
-    '''
-    Fetch function signature definitions from the model and define the functions in the client
-    '''
-    if self._defined:
-      return
-    try:
-      self._fetch_signatures()
-      self._define_functions()
-    finally:
-      self._defined = True
-  def __getattr__(self, name):
-    if not self._defined:
-      self.fetch()
-    return self.__getattribute__(name)
-  def _fetch_signatures(self):
-    '''
-      Fetch the method signatures from the model.
-      Returns:
-          Dict: The method signatures.
-      '''
-    try:
-      response = self.STUB.GetModelVersion(
-          service_pb2.GetModelVersionRequest(
-              user_app_id=self.request_template.user_app_id,
-              model_id=self.request_template.model_id,
-              version_id=self.request_template.version_id,
-          ))
-      method_signatures = None
-      if response.status.code == status_code_pb2.SUCCESS:
-        method_signatures = response.model_version.method_signatures
-      if response.status.code != status_code_pb2.SUCCESS:
-        raise Exception(f"Model failed with response {response!r}")
-      self._method_signatures = {}
-      for method_signature in method_signatures:
-        method_name = method_signature.name
-        # check for duplicate method names
-        if method_name in self._method_signatures:
-          raise ValueError(f"Duplicate method name {method_name}")
-        self._method_signatures[method_name] = method_signature
-      if not self._method_signatures:  # if no method signatures, try to fetch from the model
-        self._fetch_signatures_backup()
-    except Exception:
-      # try to fetch from the model
-      self._fetch_signatures_backup()
-      if not self._method_signatures:
-        raise ValueError("Failed to fetch method signatures from model and backup method")
-  def _fetch_signatures_backup(self):
-    '''
-      This is a temporary method of fetching the method signatures from the model.
-      Returns:
-          Dict: The method signatures.
-      '''
-    request = service_pb2.PostModelOutputsRequest()
-    request.CopyFrom(self.request_template)
-    # request.model.model_version.output_info.params['_method_name'] = '_GET_SIGNATURES'
-    inp = request.inputs.add()  # empty input for this method
-    inp.data.parts.add()  # empty part for this input
-    inp.data.metadata['_method_name'] = '_GET_SIGNATURES'
-    start_time = time.time()
-    backoff_iterator = BackoffIterator(10)
-    while True:
-      response = self.STUB.PostModelOutputs(request)
-      if status_is_retryable(
-          response.status.code) and time.time() - start_time < 60 * 10:  # 10 minutes
-        logger.info(f"Retrying model info fetch with response {response.status!r}")
-        time.sleep(next(backoff_iterator))
-        continue
-      break
-    if (response.status.code == status_code_pb2.INPUT_UNSUPPORTED_FORMAT or
-        (response.status.code == status_code_pb2.SUCCESS and
-         response.outputs[0].data.text.raw == '')):
-      # return codes/values from older models that don't support _GET_SIGNATURES
-      self._method_signatures = {}
-      self._define_compatability_functions()
-      return
-    if response.status.code != status_code_pb2.SUCCESS:
-      raise Exception(f"Model failed with response {response!r}")
-    self._method_signatures = signatures_from_json(response.outputs[0].data.text.raw)
-  def _define_functions(self):
-    '''
-    Define the functions based on the method signatures.
-    '''
-    for method_name, method_signature in self._method_signatures.items():
-      # define the function in this client instance
-      if resources_pb2.RunnerMethodType.Name(method_signature.method_type) == 'UNARY_UNARY':
-        call_func = self._predict
-      elif resources_pb2.RunnerMethodType.Name(method_signature.method_type) == 'UNARY_STREAMING':
-        call_func = self._generate
-      elif resources_pb2.RunnerMethodType.Name(
-          method_signature.method_type) == 'STREAMING_STREAMING':
-        call_func = self._stream
-      else:
-        raise ValueError(f"Unknown method type {method_signature.method_type}")
-      # method argnames, in order, collapsing nested keys to corresponding user function args
-      method_argnames = []
-      for var in method_signature.input_fields:
-        outer = var.name.split('.', 1)[0]
-        if outer in method_argnames:
-          continue
-        method_argnames.append(outer)
-      def bind_f(method_name, method_argnames, call_func):
-        def f(*args, **kwargs):
-          if len(args) > len(method_argnames):
-            raise TypeError(
-                f"{method_name}() takes {len(method_argnames)} positional arguments but {len(args)} were given"
+    def fetch(self):
+        '''
+        Fetch function signature definitions from the model and define the functions in the client
+        '''
+        if self._defined:
+            return
+        try:
+            self._fetch_signatures()
+            self._define_functions()
+        finally:
+            self._defined = True
+    def __getattr__(self, name):
+        if not self._defined:
+            self.fetch()
+        return self.__getattribute__(name)
+    def _fetch_signatures(self):
+        '''
+        Fetch the method signatures from the model.
+        Returns:
+            Dict: The method signatures.
+        '''
+        try:
+            response = self.STUB.GetModelVersion(
+                service_pb2.GetModelVersionRequest(
+                    user_app_id=self.request_template.user_app_id,
+                    model_id=self.request_template.model_id,
+                    version_id=self.request_template.version_id,
+                )
             )
-          if len(args) + len(kwargs) > len(method_argnames):
-            raise TypeError(
-                f"{method_name}() got an unexpected keyword argument {next(iter(kwargs))}")
-          if len(args) == 1 and (not kwargs) and isinstance(args[0], list):
-            batch_inputs = args[0]
-            # Validate each input is a dictionary
-            is_batch_input_valid = all(isinstance(input, dict) for input in batch_inputs)
-            if is_batch_input_valid and (not is_openai_chat_format(batch_inputs)):
-              # If the batch input is valid, call the function with the batch inputs and the method name
-              return call_func(batch_inputs, method_name)
-          for name, arg in zip(method_argnames, args):  # handle positional with zip shortest
-            if name in kwargs:
-              raise TypeError(f"Multiple values for argument {name}")
-            kwargs[name] = arg
-          return call_func(kwargs, method_name)
-        return f
-      # need to bind method_name to the value, not the mutating loop variable
-      f = bind_f(method_name, method_argnames, call_func)
-      # set names, annotations and docstrings
-      f.__name__ = method_name
-      f.__qualname__ = f'{self.__class__.__name__}.{method_name}'
-      input_annotations = code_script._get_annotations_source(method_signature)
-      return_annotation = input_annotations.pop('return', (None, None))[0]
-      sig = inspect.signature(f).replace(
-          parameters=[
-              inspect.Parameter(k, inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=v[0])
-              for k, v in input_annotations.items()
-          ],
-          return_annotation=return_annotation,
-      )
-      f.__signature__ = sig
-      f.__doc__ = method_signature.description
-      setattr(self, method_name, f)
-  def available_methods(self) -> List[str]:
-    """Get the available methods for this model.
-    Returns:
-        List[str]: The available methods.
-    """
-    if not self._defined:
-      self.fetch()
-    return self._method_signatures.keys()
-  def method_signature(self, method_name: str) -> str:
-    """Get the method signature for a method.
-    Args:
-        method_name (str): The name of the method.
-    Returns:
-        str: The method signature.
-    """
-    if not self._defined:
-      self.fetch()
-    return method_signatures.get_method_signature(self._method_signatures[method_name])
-  def generate_client_script(self) -> str:
-    """Generate a client script for this model.
-    Returns:
-        str: The client script.
-    """
-    if not self._defined:
-      self.fetch()
-    method_signatures = []
-    for _, method_signature in self._method_signatures.items():
-      method_signatures.append(method_signature)
-    return code_script.generate_client_script(
-        method_signatures,
-        user_id=self.request_template.user_app_id.user_id,
-        app_id=self.request_template.user_app_id.app_id,
-        model_id=self.request_template.model_id)
-  def _define_compatability_functions(self):
-    serializer = CompatibilitySerializer()
-    def predict(input: Any) -> Any:
-      proto = resources_pb2.Input()
-      serializer.serialize(proto.data, input)
-      # always use text.raw for compat
-      if proto.data.string_value:
-        proto.data.text.raw = proto.data.string_value
-        proto.data.string_value = ''
-      response = self._predict_by_proto([proto])
-      if response.status.code != status_code_pb2.SUCCESS:
-        raise Exception(f"Model predict failed with response {response!r}")
-      response_data = response.outputs[0].data
-      if response_data.text.raw:
-        response_data.string_value = response_data.text.raw
-        response_data.text.raw = ''
-      return serializer.deserialize(response_data)
-    self.predict = predict
-  def _predict(
-      self,
-      inputs,  # TODO set up functions according to fetched signatures?
-      method_name: str = 'predict',
-  ) -> Any:
-    input_signature = self._method_signatures[method_name].input_fields
-    output_signature = self._method_signatures[method_name].output_fields
-    batch_input = True
-    if isinstance(inputs, dict):
-      inputs = [inputs]
-      batch_input = False
-    proto_inputs = []
-    for input in inputs:
-      proto = resources_pb2.Input()
-      serialize(input, input_signature, proto.data)
-      proto_inputs.append(proto)
-    response = self._predict_by_proto(proto_inputs, method_name)
-    outputs = []
-    for output in response.outputs:
-      outputs.append(deserialize(output.data, output_signature, is_output=True))
-    if batch_input:
-      return outputs
-    return outputs[0]
-  def _predict_by_proto(
-      self,
-      inputs: List[resources_pb2.Input],
-      method_name: str = None,
-      inference_params: Dict = None,
-      output_config: Dict = None,
-  ) -> service_pb2.MultiOutputResponse:
-    """Predicts the model based on the given inputs.
-      Args:
-          inputs (List[resources_pb2.Input]): The inputs to predict.
-          method_name (str): The remote method name to call.
-          inference_params (Dict): Inference parameters to override.
-          output_config (Dict): Output configuration to override.
-      Returns:
-          service_pb2.MultiOutputResponse: The prediction response(s).
-      """
-    if not isinstance(inputs, list):
-      raise UserError('Invalid inputs, inputs must be a list of Input objects.')
-    if len(inputs) > MAX_MODEL_PREDICT_INPUTS:
-      raise UserError(f"Too many inputs. Max is {MAX_MODEL_PREDICT_INPUTS}.")
-    request = service_pb2.PostModelOutputsRequest()
-    request.CopyFrom(self.request_template)
-    request.inputs.extend(inputs)
-    if method_name:
-      # TODO put in new proto field?
-      for inp in request.inputs:
-        inp.data.metadata['_method_name'] = method_name
-    if inference_params:
-      request.model.model_version.output_info.params.update(inference_params)
-    if output_config:
-      request.model.model_version.output_info.output_config.MergeFrom(
-          resources_pb2.OutputConfig(**output_config))
-    start_time = time.time()
-    backoff_iterator = BackoffIterator(10)
-    while True:
-      response = self.STUB.PostModelOutputs(request)
-      if status_is_retryable(
-          response.status.code) and time.time() - start_time < 60 * 10:  # 10 minutes
-        logger.info("Model is still deploying, please wait...")
-        time.sleep(next(backoff_iterator))
-        continue
-      if response.status.code != status_code_pb2.SUCCESS:
-        raise Exception(f"Model predict failed with response {response!r}")
-      break
-    return response
-  def _generate(
-      self,
-      inputs,  # TODO set up functions according to fetched signatures?
-      method_name: str = 'generate',
-  ) -> Any:
-    input_signature = self._method_signatures[method_name].input_fields
-    output_signature = self._method_signatures[method_name].output_fields
-    batch_input = True
-    if isinstance(inputs, dict):
-      inputs = [inputs]
-      batch_input = False
-    proto_inputs = []
-    for input in inputs:
-      proto = resources_pb2.Input()
-      serialize(input, input_signature, proto.data)
-      proto_inputs.append(proto)
-    response_stream = self._generate_by_proto(proto_inputs, method_name)
-    for response in response_stream:
-      outputs = []
-      for output in response.outputs:
-        outputs.append(deserialize(output.data, output_signature, is_output=True))
-      if batch_input:
-        yield outputs
-      else:
-        yield outputs[0]
-  def _generate_by_proto(
-      self,
-      inputs: List[resources_pb2.Input],
-      method_name: str = None,
-      inference_params: Dict = {},
-      output_config: Dict = {},
-  ):
-    """Generate the stream output on model based on the given inputs.
-    Args:
-        inputs (list[Input]): The inputs to generate, must be less than 128.
-        method_name (str): The remote method name to call.
-        inference_params (dict): The inference params to override.
-        output_config (dict): The output config to override.
-    """
-    if not isinstance(inputs, list):
-      raise UserError('Invalid inputs, inputs must be a list of Input objects.')
-    if len(inputs) > MAX_MODEL_PREDICT_INPUTS:
-      raise UserError(f"Too many inputs. Max is {MAX_MODEL_PREDICT_INPUTS}."
-                     )  # TODO Use Chunker for inputs len > 128
-    request = service_pb2.PostModelOutputsRequest()
-    request.CopyFrom(self.request_template)
-    request.inputs.extend(inputs)
-    if method_name:
-      # TODO put in new proto field?
-      for inp in request.inputs:
-        inp.data.metadata['_method_name'] = method_name
-    if inference_params:
-      request.model.model_version.output_info.params.update(inference_params)
-    if output_config:
-      request.model.model_version.output_info.output_config.MergeFromDict(output_config)
-    start_time = time.time()
-    backoff_iterator = BackoffIterator(10)
-    started = False
-    while not started:
-      stream_response = self.STUB.GenerateModelOutputs(request)
-      try:
-        response = next(stream_response)  # get the first response
-      except StopIteration:
-        raise Exception("Model Generate failed with no response")
-      if status_is_retryable(response.status.code) and \
-              time.time() - start_time < 60 * 10:
-        logger.info("Model is still deploying, please wait...")
-        time.sleep(next(backoff_iterator))
-        continue
-      if response.status.code != status_code_pb2.SUCCESS:
-        raise Exception(f"Model Generate failed with response {response.status!r}")
-      started = True
-    yield response  # yield the first response
-    for response in stream_response:
-      if response.status.code != status_code_pb2.SUCCESS:
-        raise Exception(f"Model Generate failed with response {response.status!r}")
-      yield response
-  def _stream(
-      self,
-      inputs,
-      method_name: str = 'stream',
-  ) -> Any:
-    input_signature = self._method_signatures[method_name].input_fields
-    output_signature = self._method_signatures[method_name].output_fields
-    if isinstance(inputs, list):
-      assert len(inputs) == 1, 'streaming methods do not support batched calls'
-      inputs = inputs[0]
-    assert isinstance(inputs, dict)
-    kwargs = inputs
-    # find the streaming vars in the input signature, and the streaming input python param
-    stream_sig = get_stream_from_signature(input_signature)
-    if stream_sig is None:
-      raise ValueError("Streaming method must have a Stream input")
-    stream_argname = stream_sig.name
-    # get the streaming input generator from the user-provided function arg values
-    user_inputs_generator = kwargs.pop(stream_argname)
-    def _input_proto_stream():
-      # first item contains all the inputs and the first stream item
-      proto = resources_pb2.Input()
-      try:
-        item = next(user_inputs_generator)
-      except StopIteration:
-        return  # no items to stream
-      kwargs[stream_argname] = item
-      serialize(kwargs, input_signature, proto.data)
-      yield proto
-      # subsequent items are just the stream items
-      for item in user_inputs_generator:
-        proto = resources_pb2.Input()
-        serialize({stream_argname: item}, [stream_sig], proto.data)
-        yield proto
-    response_stream = self._stream_by_proto(_input_proto_stream(), method_name)
-    for response in response_stream:
-      assert len(response.outputs) == 1, 'streaming methods must have exactly one output'
-      yield deserialize(response.outputs[0].data, output_signature, is_output=True)
-  def _req_iterator(self,
-                    input_iterator: Iterator[List[resources_pb2.Input]],
-                    method_name: str = None,
-                    inference_params: Dict = {},
-                    output_config: Dict = {}):
-    request = service_pb2.PostModelOutputsRequest()
-    request.CopyFrom(self.request_template)
-    if inference_params:
-      request.model.model_version.output_info.params.update(inference_params)
-    if output_config:
-      request.model.model_version.output_info.output_config.MergeFromDict(output_config)
-    for inputs in input_iterator:
-      req = service_pb2.PostModelOutputsRequest()
-      req.CopyFrom(request)
-      if isinstance(inputs, list):
-        req.inputs.extend(inputs)
-      else:
-        req.inputs.append(inputs)
-      # TODO: put into new proto field?
-      if method_name:
-        for inp in req.inputs:
-          inp.data.metadata['_method_name'] = method_name
-      yield req
-  def _stream_by_proto(self,
-                       inputs: Iterator[List[resources_pb2.Input]],
-                       method_name: str = None,
-                       inference_params: Dict = {},
-                       output_config: Dict = {}):
-    """Generate the stream output on model based on the given stream of inputs.
-    """
-    # if not isinstance(inputs, Iterator[List[Input]]):
-    #   raise UserError('Invalid inputs, inputs must be a iterator of list of Input objects.')
-    request = self._req_iterator(inputs, method_name, inference_params, output_config)
-    start_time = time.time()
-    backoff_iterator = BackoffIterator(10)
-    generation_started = False
-    while True:
-      if generation_started:
-        break
-      stream_response = self.STUB.StreamModelOutputs(request)
-      for response in stream_response:
-        if status_is_retryable(response.status.code) and \
-                time.time() - start_time < 60 * 10:
-          logger.info("Model is still deploying, please wait...")
-          time.sleep(next(backoff_iterator))
-          break
+            method_signatures = None
+            if response.status.code == status_code_pb2.SUCCESS:
+                method_signatures = response.model_version.method_signatures
+            if response.status.code != status_code_pb2.SUCCESS:
+                raise Exception(f"Model failed with response {response!r}")
+            self._method_signatures = {}
+            for method_signature in method_signatures:
+                method_name = method_signature.name
+                # check for duplicate method names
+                if method_name in self._method_signatures:
+                    raise ValueError(f"Duplicate method name {method_name}")
+                self._method_signatures[method_name] = method_signature
+            if not self._method_signatures:  # if no method signatures, try to fetch from the model
+                self._fetch_signatures_backup()
+        except Exception:
+            # try to fetch from the model
+            self._fetch_signatures_backup()
+            if not self._method_signatures:
+                raise ValueError("Failed to fetch method signatures from model and backup method")
+    def _fetch_signatures_backup(self):
+        '''
+        This is a temporary method of fetching the method signatures from the model.
+        Returns:
+            Dict: The method signatures.
+        '''
+        request = service_pb2.PostModelOutputsRequest()
+        request.CopyFrom(self.request_template)
+        # request.model.model_version.output_info.params['_method_name'] = '_GET_SIGNATURES'
+        inp = request.inputs.add()  # empty input for this method
+        inp.data.parts.add()  # empty part for this input
+        inp.data.metadata['_method_name'] = '_GET_SIGNATURES'
+        start_time = time.time()
+        backoff_iterator = BackoffIterator(10)
+        while True:
+            response = self.STUB.PostModelOutputs(request)
+            if (
+                status_is_retryable(response.status.code) and time.time() - start_time < 60 * 10
+            ):  # 10 minutes
+                logger.info(f"Retrying model info fetch with response {response.status!r}")
+                time.sleep(next(backoff_iterator))
+                continue
+            break
+        if response.status.code == status_code_pb2.INPUT_UNSUPPORTED_FORMAT or (
+            response.status.code == status_code_pb2.SUCCESS
+            and response.outputs[0].data.text.raw == ''
+        ):
+            # return codes/values from older models that don't support _GET_SIGNATURES
+            self._method_signatures = {}
+            self._define_compatability_functions()
+            return
         if response.status.code != status_code_pb2.SUCCESS:
-          raise Exception(f"Model Predict failed with response {response.status!r}")
-        else:
-          if not generation_started:
-            generation_started = True
-          yield response
+            raise Exception(f"Model failed with response {response!r}")
+        self._method_signatures = signatures_from_json(response.outputs[0].data.text.raw)
+    def _define_functions(self):
+        '''
+        Define the functions based on the method signatures.
+        '''
+        for method_name, method_signature in self._method_signatures.items():
+            # define the function in this client instance
+            if resources_pb2.RunnerMethodType.Name(method_signature.method_type) == 'UNARY_UNARY':
+                call_func = self._predict
+            elif (
+                resources_pb2.RunnerMethodType.Name(method_signature.method_type)
+                == 'UNARY_STREAMING'
+            ):
+                call_func = self._generate
+            elif (
+                resources_pb2.RunnerMethodType.Name(method_signature.method_type)
+                == 'STREAMING_STREAMING'
+            ):
+                call_func = self._stream
+            else:
+                raise ValueError(f"Unknown method type {method_signature.method_type}")
+            # method argnames, in order, collapsing nested keys to corresponding user function args
+            method_argnames = []
+            for var in method_signature.input_fields:
+                outer = var.name.split('.', 1)[0]
+                if outer in method_argnames:
+                    continue
+                method_argnames.append(outer)
+            def bind_f(method_name, method_argnames, call_func):
+                def f(*args, **kwargs):
+                    if len(args) > len(method_argnames):
+                        raise TypeError(
+                            f"{method_name}() takes {len(method_argnames)} positional arguments but {len(args)} were given"
+                        )
+                    if len(args) + len(kwargs) > len(method_argnames):
+                        raise TypeError(
+                            f"{method_name}() got an unexpected keyword argument {next(iter(kwargs))}"
+                        )
+                    if len(args) == 1 and (not kwargs) and isinstance(args[0], list):
+                        batch_inputs = args[0]
+                        # Validate each input is a dictionary
+                        is_batch_input_valid = all(
+                            isinstance(input, dict) for input in batch_inputs
+                        )
+                        if is_batch_input_valid and (not is_openai_chat_format(batch_inputs)):
+                            # If the batch input is valid, call the function with the batch inputs and the method name
+                            return call_func(batch_inputs, method_name)
+                    for name, arg in zip(
+                        method_argnames, args
+                    ):  # handle positional with zip shortest
+                        if name in kwargs:
+                            raise TypeError(f"Multiple values for argument {name}")
+                        kwargs[name] = arg
+                    return call_func(kwargs, method_name)
+                return f
+            # need to bind method_name to the value, not the mutating loop variable
+            f = bind_f(method_name, method_argnames, call_func)
+            # set names, annotations and docstrings
+            f.__name__ = method_name
+            f.__qualname__ = f'{self.__class__.__name__}.{method_name}'
+            input_annotations = code_script._get_annotations_source(method_signature)
+            return_annotation = input_annotations.pop('return', (None, None))[0]
+            sig = inspect.signature(f).replace(
+                parameters=[
+                    inspect.Parameter(k, inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=v[0])
+                    for k, v in input_annotations.items()
+                ],
+                return_annotation=return_annotation,
+            )
+            f.__signature__ = sig
+            f.__doc__ = method_signature.description
+            setattr(self, method_name, f)
+    def available_methods(self) -> List[str]:
+        """Get the available methods for this model.
+        Returns:
+            List[str]: The available methods.
+        """
+        if not self._defined:
+            self.fetch()
+        return self._method_signatures.keys()
+    def method_signature(self, method_name: str) -> str:
+        """Get the method signature for a method.
+        Args:
+            method_name (str): The name of the method.
+        Returns:
+            str: The method signature.
+        """
+        if not self._defined:
+            self.fetch()
+        return method_signatures.get_method_signature(self._method_signatures[method_name])
+    def generate_client_script(self) -> str:
+        """Generate a client script for this model.
+        Returns:
+            str: The client script.
+        """
+        if not self._defined:
+            self.fetch()
+        method_signatures = []
+        for _, method_signature in self._method_signatures.items():
+            method_signatures.append(method_signature)
+        return code_script.generate_client_script(
+            method_signatures,
+            user_id=self.request_template.user_app_id.user_id,
+            app_id=self.request_template.user_app_id.app_id,
+            model_id=self.request_template.model_id,
+        )
+    def _define_compatability_functions(self):
+        serializer = CompatibilitySerializer()
+        def predict(input: Any) -> Any:
+            proto = resources_pb2.Input()
+            serializer.serialize(proto.data, input)
+            # always use text.raw for compat
+            if proto.data.string_value:
+                proto.data.text.raw = proto.data.string_value
+                proto.data.string_value = ''
+            response = self._predict_by_proto([proto])
+            if response.status.code != status_code_pb2.SUCCESS:
+                raise Exception(f"Model predict failed with response {response!r}")
+            response_data = response.outputs[0].data
+            if response_data.text.raw:
+                response_data.string_value = response_data.text.raw
+                response_data.text.raw = ''
+            return serializer.deserialize(response_data)
+        self.predict = predict
+    def _predict(
+        self,
+        inputs,  # TODO set up functions according to fetched signatures?
+        method_name: str = 'predict',
+    ) -> Any:
+        input_signature = self._method_signatures[method_name].input_fields
+        output_signature = self._method_signatures[method_name].output_fields
+        batch_input = True
+        if isinstance(inputs, dict):
+            inputs = [inputs]
+            batch_input = False
+        proto_inputs = []
+        for input in inputs:
+            proto = resources_pb2.Input()
+            serialize(input, input_signature, proto.data)
+            proto_inputs.append(proto)
+        response = self._predict_by_proto(proto_inputs, method_name)
+        outputs = []
+        for output in response.outputs:
+            outputs.append(deserialize(output.data, output_signature, is_output=True))
+        if batch_input:
+            return outputs
+        return outputs[0]
+    def _predict_by_proto(
+        self,
+        inputs: List[resources_pb2.Input],
+        method_name: str = None,
+        inference_params: Dict = None,
+        output_config: Dict = None,
+    ) -> service_pb2.MultiOutputResponse:
+        """Predicts the model based on the given inputs.
+        Args:
+            inputs (List[resources_pb2.Input]): The inputs to predict.
+            method_name (str): The remote method name to call.
+            inference_params (Dict): Inference parameters to override.
+            output_config (Dict): Output configuration to override.
+        Returns:
+            service_pb2.MultiOutputResponse: The prediction response(s).
+        """
+        if not isinstance(inputs, list):
+            raise UserError('Invalid inputs, inputs must be a list of Input objects.')
+        if len(inputs) > MAX_MODEL_PREDICT_INPUTS:
+            raise UserError(f"Too many inputs. Max is {MAX_MODEL_PREDICT_INPUTS}.")
+        request = service_pb2.PostModelOutputsRequest()
+        request.CopyFrom(self.request_template)
+        request.inputs.extend(inputs)
+        if method_name:
+            # TODO put in new proto field?
+            for inp in request.inputs:
+                inp.data.metadata['_method_name'] = method_name
+        if inference_params:
+            request.model.model_version.output_info.params.update(inference_params)
+        if output_config:
+            request.model.model_version.output_info.output_config.MergeFrom(
+                resources_pb2.OutputConfig(**output_config)
+            )
+        start_time = time.time()
+        backoff_iterator = BackoffIterator(10)
+        while True:
+            response = self.STUB.PostModelOutputs(request)
+            if (
+                status_is_retryable(response.status.code) and time.time() - start_time < 60 * 10
+            ):  # 10 minutes
+                logger.info("Model is still deploying, please wait...")
+                time.sleep(next(backoff_iterator))
+                continue
+            if response.status.code != status_code_pb2.SUCCESS:
+                raise Exception(f"Model predict failed with response {response!r}")
+            break
+        return response
+    def _generate(
+        self,
+        inputs,  # TODO set up functions according to fetched signatures?
+        method_name: str = 'generate',
+    ) -> Any:
+        input_signature = self._method_signatures[method_name].input_fields
+        output_signature = self._method_signatures[method_name].output_fields
+        batch_input = True
+        if isinstance(inputs, dict):
+            inputs = [inputs]
+            batch_input = False
+        proto_inputs = []
+        for input in inputs:
+            proto = resources_pb2.Input()
+            serialize(input, input_signature, proto.data)
+            proto_inputs.append(proto)
+        response_stream = self._generate_by_proto(proto_inputs, method_name)
+        for response in response_stream:
+            outputs = []
+            for output in response.outputs:
+                outputs.append(deserialize(output.data, output_signature, is_output=True))
+            if batch_input:
+                yield outputs
+            else:
+                yield outputs[0]
+    def _generate_by_proto(
+        self,
+        inputs: List[resources_pb2.Input],
+        method_name: str = None,
+        inference_params: Dict = {},
+        output_config: Dict = {},
+    ):
+        """Generate the stream output on model based on the given inputs.
+        Args:
+            inputs (list[Input]): The inputs to generate, must be less than 128.
+            method_name (str): The remote method name to call.
+            inference_params (dict): The inference params to override.
+            output_config (dict): The output config to override.
+        """
+        if not isinstance(inputs, list):
+            raise UserError('Invalid inputs, inputs must be a list of Input objects.')
+        if len(inputs) > MAX_MODEL_PREDICT_INPUTS:
+            raise UserError(
+                f"Too many inputs. Max is {MAX_MODEL_PREDICT_INPUTS}."
+            )  # TODO Use Chunker for inputs len > 128
+        request = service_pb2.PostModelOutputsRequest()
+        request.CopyFrom(self.request_template)
+        request.inputs.extend(inputs)
+        if method_name:
+            # TODO put in new proto field?
+            for inp in request.inputs:
+                inp.data.metadata['_method_name'] = method_name
+        if inference_params:
+            request.model.model_version.output_info.params.update(inference_params)
+        if output_config:
+            request.model.model_version.output_info.output_config.MergeFromDict(output_config)
+        start_time = time.time()
+        backoff_iterator = BackoffIterator(10)
+        started = False
+        while not started:
+            stream_response = self.STUB.GenerateModelOutputs(request)
+            try:
+                response = next(stream_response)  # get the first response
+            except StopIteration:
+                raise Exception("Model Generate failed with no response")
+            if status_is_retryable(response.status.code) and time.time() - start_time < 60 * 10:
+                logger.info("Model is still deploying, please wait...")
+                time.sleep(next(backoff_iterator))
+                continue
+            if response.status.code != status_code_pb2.SUCCESS:
+                raise Exception(f"Model Generate failed with response {response.status!r}")
+            started = True
+        yield response  # yield the first response
+        for response in stream_response:
+            if response.status.code != status_code_pb2.SUCCESS:
+                raise Exception(f"Model Generate failed with response {response.status!r}")
+            yield response
+    def _stream(
+        self,
+        inputs,
+        method_name: str = 'stream',
+    ) -> Any:
+        input_signature = self._method_signatures[method_name].input_fields
+        output_signature = self._method_signatures[method_name].output_fields
+        if isinstance(inputs, list):
+            assert len(inputs) == 1, 'streaming methods do not support batched calls'
+            inputs = inputs[0]
+        assert isinstance(inputs, dict)
+        kwargs = inputs
+        # find the streaming vars in the input signature, and the streaming input python param
+        stream_sig = get_stream_from_signature(input_signature)
+        if stream_sig is None:
+            raise ValueError("Streaming method must have a Stream input")
+        stream_argname = stream_sig.name
+        # get the streaming input generator from the user-provided function arg values
+        user_inputs_generator = kwargs.pop(stream_argname)
+        def _input_proto_stream():
+            # first item contains all the inputs and the first stream item
+            proto = resources_pb2.Input()
+            try:
+                item = next(user_inputs_generator)
+            except StopIteration:
+                return  # no items to stream
+            kwargs[stream_argname] = item
+            serialize(kwargs, input_signature, proto.data)
+            yield proto
+            # subsequent items are just the stream items
+            for item in user_inputs_generator:
+                proto = resources_pb2.Input()
+                serialize({stream_argname: item}, [stream_sig], proto.data)
+                yield proto
+        response_stream = self._stream_by_proto(_input_proto_stream(), method_name)
+        for response in response_stream:
+            assert len(response.outputs) == 1, 'streaming methods must have exactly one output'
+            yield deserialize(response.outputs[0].data, output_signature, is_output=True)
+    def _req_iterator(
+        self,
+        input_iterator: Iterator[List[resources_pb2.Input]],
+        method_name: str = None,
+        inference_params: Dict = {},
+        output_config: Dict = {},
+    ):
+        request = service_pb2.PostModelOutputsRequest()
+        request.CopyFrom(self.request_template)
+        if inference_params:
+            request.model.model_version.output_info.params.update(inference_params)
+        if output_config:
+            request.model.model_version.output_info.output_config.MergeFromDict(output_config)
+        for inputs in input_iterator:
+            req = service_pb2.PostModelOutputsRequest()
+            req.CopyFrom(request)
+            if isinstance(inputs, list):
+                req.inputs.extend(inputs)
+            else:
+                req.inputs.append(inputs)
+            # TODO: put into new proto field?
+            if method_name:
+                for inp in req.inputs:
+                    inp.data.metadata['_method_name'] = method_name
+            yield req
+    def _stream_by_proto(
+        self,
+        inputs: Iterator[List[resources_pb2.Input]],
+        method_name: str = None,
+        inference_params: Dict = {},
+        output_config: Dict = {},
+    ):
+        """Generate the stream output on model based on the given stream of inputs."""
+        # if not isinstance(inputs, Iterator[List[Input]]):
+        #   raise UserError('Invalid inputs, inputs must be a iterator of list of Input objects.')
+        request = self._req_iterator(inputs, method_name, inference_params, output_config)
+        start_time = time.time()
+        backoff_iterator = BackoffIterator(10)
+        generation_started = False
+        while True:
+            if generation_started:
+                break
+            stream_response = self.STUB.StreamModelOutputs(request)
+            for response in stream_response:
+                if (
+                    status_is_retryable(response.status.code)
+                    and time.time() - start_time < 60 * 10
+                ):
+                    logger.info("Model is still deploying, please wait...")
+                    time.sleep(next(backoff_iterator))
+                    break
+                if response.status.code != status_code_pb2.SUCCESS:
+                    raise Exception(f"Model Predict failed with response {response.status!r}")
+                else:
+                    if not generation_started:
+                        generation_started = True
+                    yield response

clarifai 11.3.0rc2__py3-none-any.whl → 11.4.0__py3-none-any.whl

clarifai 11.3.0rc2__py3-none-any.whl → 11.4.0__py3-none-any.whl