clarifai 11.3.0rc2__py3-none-any.whl → 11.4.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (300)
  1. clarifai/__init__.py +1 -1
  2. clarifai/cli/__main__.py +1 -1
  3. clarifai/cli/base.py +144 -136
  4. clarifai/cli/compute_cluster.py +45 -31
  5. clarifai/cli/deployment.py +93 -76
  6. clarifai/cli/model.py +578 -180
  7. clarifai/cli/nodepool.py +100 -82
  8. clarifai/client/__init__.py +12 -2
  9. clarifai/client/app.py +973 -911
  10. clarifai/client/auth/helper.py +345 -342
  11. clarifai/client/auth/register.py +7 -7
  12. clarifai/client/auth/stub.py +107 -106
  13. clarifai/client/base.py +185 -178
  14. clarifai/client/compute_cluster.py +214 -180
  15. clarifai/client/dataset.py +793 -698
  16. clarifai/client/deployment.py +55 -50
  17. clarifai/client/input.py +1223 -1088
  18. clarifai/client/lister.py +47 -45
  19. clarifai/client/model.py +1939 -1717
  20. clarifai/client/model_client.py +525 -502
  21. clarifai/client/module.py +82 -73
  22. clarifai/client/nodepool.py +358 -213
  23. clarifai/client/runner.py +58 -0
  24. clarifai/client/search.py +342 -309
  25. clarifai/client/user.py +419 -414
  26. clarifai/client/workflow.py +294 -274
  27. clarifai/constants/dataset.py +11 -17
  28. clarifai/constants/model.py +8 -2
  29. clarifai/datasets/export/inputs_annotations.py +233 -217
  30. clarifai/datasets/upload/base.py +63 -51
  31. clarifai/datasets/upload/features.py +43 -38
  32. clarifai/datasets/upload/image.py +237 -207
  33. clarifai/datasets/upload/loaders/coco_captions.py +34 -32
  34. clarifai/datasets/upload/loaders/coco_detection.py +72 -65
  35. clarifai/datasets/upload/loaders/imagenet_classification.py +57 -53
  36. clarifai/datasets/upload/loaders/xview_detection.py +274 -132
  37. clarifai/datasets/upload/multimodal.py +55 -46
  38. clarifai/datasets/upload/text.py +55 -47
  39. clarifai/datasets/upload/utils.py +250 -234
  40. clarifai/errors.py +51 -50
  41. clarifai/models/api.py +260 -238
  42. clarifai/modules/css.py +50 -50
  43. clarifai/modules/pages.py +33 -33
  44. clarifai/rag/rag.py +312 -288
  45. clarifai/rag/utils.py +91 -84
  46. clarifai/runners/models/model_builder.py +906 -802
  47. clarifai/runners/models/model_class.py +370 -331
  48. clarifai/runners/models/model_run_locally.py +459 -419
  49. clarifai/runners/models/model_runner.py +170 -162
  50. clarifai/runners/models/model_servicer.py +78 -70
  51. clarifai/runners/server.py +111 -101
  52. clarifai/runners/utils/code_script.py +225 -187
  53. clarifai/runners/utils/const.py +4 -1
  54. clarifai/runners/utils/data_types/__init__.py +12 -0
  55. clarifai/runners/utils/data_types/data_types.py +598 -0
  56. clarifai/runners/utils/data_utils.py +387 -440
  57. clarifai/runners/utils/loader.py +247 -227
  58. clarifai/runners/utils/method_signatures.py +411 -386
  59. clarifai/runners/utils/openai_convertor.py +108 -109
  60. clarifai/runners/utils/serializers.py +175 -179
  61. clarifai/runners/utils/url_fetcher.py +35 -35
  62. clarifai/schema/search.py +56 -63
  63. clarifai/urls/helper.py +125 -102
  64. clarifai/utils/cli.py +129 -123
  65. clarifai/utils/config.py +127 -87
  66. clarifai/utils/constants.py +49 -0
  67. clarifai/utils/evaluation/helpers.py +503 -466
  68. clarifai/utils/evaluation/main.py +431 -393
  69. clarifai/utils/evaluation/testset_annotation_parser.py +154 -144
  70. clarifai/utils/logging.py +324 -306
  71. clarifai/utils/misc.py +60 -56
  72. clarifai/utils/model_train.py +165 -146
  73. clarifai/utils/protobuf.py +126 -103
  74. clarifai/versions.py +3 -1
  75. clarifai/workflows/export.py +48 -50
  76. clarifai/workflows/utils.py +39 -36
  77. clarifai/workflows/validate.py +55 -43
  78. {clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/METADATA +16 -6
  79. clarifai-11.4.0.dist-info/RECORD +109 -0
  80. {clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/WHEEL +1 -1
  81. clarifai/__pycache__/__init__.cpython-310.pyc +0 -0
  82. clarifai/__pycache__/__init__.cpython-311.pyc +0 -0
  83. clarifai/__pycache__/__init__.cpython-39.pyc +0 -0
  84. clarifai/__pycache__/errors.cpython-310.pyc +0 -0
  85. clarifai/__pycache__/errors.cpython-311.pyc +0 -0
  86. clarifai/__pycache__/versions.cpython-310.pyc +0 -0
  87. clarifai/__pycache__/versions.cpython-311.pyc +0 -0
  88. clarifai/cli/__pycache__/__init__.cpython-310.pyc +0 -0
  89. clarifai/cli/__pycache__/__init__.cpython-311.pyc +0 -0
  90. clarifai/cli/__pycache__/base.cpython-310.pyc +0 -0
  91. clarifai/cli/__pycache__/base.cpython-311.pyc +0 -0
  92. clarifai/cli/__pycache__/base_cli.cpython-310.pyc +0 -0
  93. clarifai/cli/__pycache__/compute_cluster.cpython-310.pyc +0 -0
  94. clarifai/cli/__pycache__/compute_cluster.cpython-311.pyc +0 -0
  95. clarifai/cli/__pycache__/deployment.cpython-310.pyc +0 -0
  96. clarifai/cli/__pycache__/deployment.cpython-311.pyc +0 -0
  97. clarifai/cli/__pycache__/model.cpython-310.pyc +0 -0
  98. clarifai/cli/__pycache__/model.cpython-311.pyc +0 -0
  99. clarifai/cli/__pycache__/model_cli.cpython-310.pyc +0 -0
  100. clarifai/cli/__pycache__/nodepool.cpython-310.pyc +0 -0
  101. clarifai/cli/__pycache__/nodepool.cpython-311.pyc +0 -0
  102. clarifai/client/__pycache__/__init__.cpython-310.pyc +0 -0
  103. clarifai/client/__pycache__/__init__.cpython-311.pyc +0 -0
  104. clarifai/client/__pycache__/__init__.cpython-39.pyc +0 -0
  105. clarifai/client/__pycache__/app.cpython-310.pyc +0 -0
  106. clarifai/client/__pycache__/app.cpython-311.pyc +0 -0
  107. clarifai/client/__pycache__/app.cpython-39.pyc +0 -0
  108. clarifai/client/__pycache__/base.cpython-310.pyc +0 -0
  109. clarifai/client/__pycache__/base.cpython-311.pyc +0 -0
  110. clarifai/client/__pycache__/compute_cluster.cpython-310.pyc +0 -0
  111. clarifai/client/__pycache__/compute_cluster.cpython-311.pyc +0 -0
  112. clarifai/client/__pycache__/dataset.cpython-310.pyc +0 -0
  113. clarifai/client/__pycache__/dataset.cpython-311.pyc +0 -0
  114. clarifai/client/__pycache__/deployment.cpython-310.pyc +0 -0
  115. clarifai/client/__pycache__/deployment.cpython-311.pyc +0 -0
  116. clarifai/client/__pycache__/input.cpython-310.pyc +0 -0
  117. clarifai/client/__pycache__/input.cpython-311.pyc +0 -0
  118. clarifai/client/__pycache__/lister.cpython-310.pyc +0 -0
  119. clarifai/client/__pycache__/lister.cpython-311.pyc +0 -0
  120. clarifai/client/__pycache__/model.cpython-310.pyc +0 -0
  121. clarifai/client/__pycache__/model.cpython-311.pyc +0 -0
  122. clarifai/client/__pycache__/module.cpython-310.pyc +0 -0
  123. clarifai/client/__pycache__/module.cpython-311.pyc +0 -0
  124. clarifai/client/__pycache__/nodepool.cpython-310.pyc +0 -0
  125. clarifai/client/__pycache__/nodepool.cpython-311.pyc +0 -0
  126. clarifai/client/__pycache__/search.cpython-310.pyc +0 -0
  127. clarifai/client/__pycache__/search.cpython-311.pyc +0 -0
  128. clarifai/client/__pycache__/user.cpython-310.pyc +0 -0
  129. clarifai/client/__pycache__/user.cpython-311.pyc +0 -0
  130. clarifai/client/__pycache__/workflow.cpython-310.pyc +0 -0
  131. clarifai/client/__pycache__/workflow.cpython-311.pyc +0 -0
  132. clarifai/client/auth/__pycache__/__init__.cpython-310.pyc +0 -0
  133. clarifai/client/auth/__pycache__/__init__.cpython-311.pyc +0 -0
  134. clarifai/client/auth/__pycache__/helper.cpython-310.pyc +0 -0
  135. clarifai/client/auth/__pycache__/helper.cpython-311.pyc +0 -0
  136. clarifai/client/auth/__pycache__/register.cpython-310.pyc +0 -0
  137. clarifai/client/auth/__pycache__/register.cpython-311.pyc +0 -0
  138. clarifai/client/auth/__pycache__/stub.cpython-310.pyc +0 -0
  139. clarifai/client/auth/__pycache__/stub.cpython-311.pyc +0 -0
  140. clarifai/client/cli/__init__.py +0 -0
  141. clarifai/client/cli/__pycache__/__init__.cpython-310.pyc +0 -0
  142. clarifai/client/cli/__pycache__/base_cli.cpython-310.pyc +0 -0
  143. clarifai/client/cli/__pycache__/model_cli.cpython-310.pyc +0 -0
  144. clarifai/client/cli/base_cli.py +0 -88
  145. clarifai/client/cli/model_cli.py +0 -29
  146. clarifai/constants/__pycache__/base.cpython-310.pyc +0 -0
  147. clarifai/constants/__pycache__/base.cpython-311.pyc +0 -0
  148. clarifai/constants/__pycache__/dataset.cpython-310.pyc +0 -0
  149. clarifai/constants/__pycache__/dataset.cpython-311.pyc +0 -0
  150. clarifai/constants/__pycache__/input.cpython-310.pyc +0 -0
  151. clarifai/constants/__pycache__/input.cpython-311.pyc +0 -0
  152. clarifai/constants/__pycache__/model.cpython-310.pyc +0 -0
  153. clarifai/constants/__pycache__/model.cpython-311.pyc +0 -0
  154. clarifai/constants/__pycache__/rag.cpython-310.pyc +0 -0
  155. clarifai/constants/__pycache__/rag.cpython-311.pyc +0 -0
  156. clarifai/constants/__pycache__/search.cpython-310.pyc +0 -0
  157. clarifai/constants/__pycache__/search.cpython-311.pyc +0 -0
  158. clarifai/constants/__pycache__/workflow.cpython-310.pyc +0 -0
  159. clarifai/constants/__pycache__/workflow.cpython-311.pyc +0 -0
  160. clarifai/datasets/__pycache__/__init__.cpython-310.pyc +0 -0
  161. clarifai/datasets/__pycache__/__init__.cpython-311.pyc +0 -0
  162. clarifai/datasets/__pycache__/__init__.cpython-39.pyc +0 -0
  163. clarifai/datasets/export/__pycache__/__init__.cpython-310.pyc +0 -0
  164. clarifai/datasets/export/__pycache__/__init__.cpython-311.pyc +0 -0
  165. clarifai/datasets/export/__pycache__/__init__.cpython-39.pyc +0 -0
  166. clarifai/datasets/export/__pycache__/inputs_annotations.cpython-310.pyc +0 -0
  167. clarifai/datasets/export/__pycache__/inputs_annotations.cpython-311.pyc +0 -0
  168. clarifai/datasets/upload/__pycache__/__init__.cpython-310.pyc +0 -0
  169. clarifai/datasets/upload/__pycache__/__init__.cpython-311.pyc +0 -0
  170. clarifai/datasets/upload/__pycache__/__init__.cpython-39.pyc +0 -0
  171. clarifai/datasets/upload/__pycache__/base.cpython-310.pyc +0 -0
  172. clarifai/datasets/upload/__pycache__/base.cpython-311.pyc +0 -0
  173. clarifai/datasets/upload/__pycache__/features.cpython-310.pyc +0 -0
  174. clarifai/datasets/upload/__pycache__/features.cpython-311.pyc +0 -0
  175. clarifai/datasets/upload/__pycache__/image.cpython-310.pyc +0 -0
  176. clarifai/datasets/upload/__pycache__/image.cpython-311.pyc +0 -0
  177. clarifai/datasets/upload/__pycache__/multimodal.cpython-310.pyc +0 -0
  178. clarifai/datasets/upload/__pycache__/multimodal.cpython-311.pyc +0 -0
  179. clarifai/datasets/upload/__pycache__/text.cpython-310.pyc +0 -0
  180. clarifai/datasets/upload/__pycache__/text.cpython-311.pyc +0 -0
  181. clarifai/datasets/upload/__pycache__/utils.cpython-310.pyc +0 -0
  182. clarifai/datasets/upload/__pycache__/utils.cpython-311.pyc +0 -0
  183. clarifai/datasets/upload/loaders/__pycache__/__init__.cpython-311.pyc +0 -0
  184. clarifai/datasets/upload/loaders/__pycache__/__init__.cpython-39.pyc +0 -0
  185. clarifai/datasets/upload/loaders/__pycache__/coco_detection.cpython-311.pyc +0 -0
  186. clarifai/datasets/upload/loaders/__pycache__/imagenet_classification.cpython-311.pyc +0 -0
  187. clarifai/models/__pycache__/__init__.cpython-39.pyc +0 -0
  188. clarifai/modules/__pycache__/__init__.cpython-39.pyc +0 -0
  189. clarifai/rag/__pycache__/__init__.cpython-310.pyc +0 -0
  190. clarifai/rag/__pycache__/__init__.cpython-311.pyc +0 -0
  191. clarifai/rag/__pycache__/__init__.cpython-39.pyc +0 -0
  192. clarifai/rag/__pycache__/rag.cpython-310.pyc +0 -0
  193. clarifai/rag/__pycache__/rag.cpython-311.pyc +0 -0
  194. clarifai/rag/__pycache__/rag.cpython-39.pyc +0 -0
  195. clarifai/rag/__pycache__/utils.cpython-310.pyc +0 -0
  196. clarifai/rag/__pycache__/utils.cpython-311.pyc +0 -0
  197. clarifai/runners/__pycache__/__init__.cpython-310.pyc +0 -0
  198. clarifai/runners/__pycache__/__init__.cpython-311.pyc +0 -0
  199. clarifai/runners/__pycache__/__init__.cpython-39.pyc +0 -0
  200. clarifai/runners/dockerfile_template/Dockerfile.cpu.template +0 -31
  201. clarifai/runners/dockerfile_template/Dockerfile.cuda.template +0 -42
  202. clarifai/runners/dockerfile_template/Dockerfile.nim +0 -71
  203. clarifai/runners/models/__pycache__/__init__.cpython-310.pyc +0 -0
  204. clarifai/runners/models/__pycache__/__init__.cpython-311.pyc +0 -0
  205. clarifai/runners/models/__pycache__/__init__.cpython-39.pyc +0 -0
  206. clarifai/runners/models/__pycache__/base_typed_model.cpython-310.pyc +0 -0
  207. clarifai/runners/models/__pycache__/base_typed_model.cpython-311.pyc +0 -0
  208. clarifai/runners/models/__pycache__/base_typed_model.cpython-39.pyc +0 -0
  209. clarifai/runners/models/__pycache__/model_builder.cpython-311.pyc +0 -0
  210. clarifai/runners/models/__pycache__/model_class.cpython-310.pyc +0 -0
  211. clarifai/runners/models/__pycache__/model_class.cpython-311.pyc +0 -0
  212. clarifai/runners/models/__pycache__/model_run_locally.cpython-310-pytest-7.1.2.pyc +0 -0
  213. clarifai/runners/models/__pycache__/model_run_locally.cpython-310.pyc +0 -0
  214. clarifai/runners/models/__pycache__/model_run_locally.cpython-311.pyc +0 -0
  215. clarifai/runners/models/__pycache__/model_runner.cpython-310.pyc +0 -0
  216. clarifai/runners/models/__pycache__/model_runner.cpython-311.pyc +0 -0
  217. clarifai/runners/models/__pycache__/model_upload.cpython-310.pyc +0 -0
  218. clarifai/runners/models/base_typed_model.py +0 -238
  219. clarifai/runners/models/model_class_refract.py +0 -80
  220. clarifai/runners/models/model_upload.py +0 -607
  221. clarifai/runners/models/temp.py +0 -25
  222. clarifai/runners/utils/__pycache__/__init__.cpython-310.pyc +0 -0
  223. clarifai/runners/utils/__pycache__/__init__.cpython-311.pyc +0 -0
  224. clarifai/runners/utils/__pycache__/__init__.cpython-38.pyc +0 -0
  225. clarifai/runners/utils/__pycache__/__init__.cpython-39.pyc +0 -0
  226. clarifai/runners/utils/__pycache__/buffered_stream.cpython-310.pyc +0 -0
  227. clarifai/runners/utils/__pycache__/buffered_stream.cpython-38.pyc +0 -0
  228. clarifai/runners/utils/__pycache__/buffered_stream.cpython-39.pyc +0 -0
  229. clarifai/runners/utils/__pycache__/const.cpython-310.pyc +0 -0
  230. clarifai/runners/utils/__pycache__/const.cpython-311.pyc +0 -0
  231. clarifai/runners/utils/__pycache__/constants.cpython-310.pyc +0 -0
  232. clarifai/runners/utils/__pycache__/constants.cpython-38.pyc +0 -0
  233. clarifai/runners/utils/__pycache__/constants.cpython-39.pyc +0 -0
  234. clarifai/runners/utils/__pycache__/data_handler.cpython-310.pyc +0 -0
  235. clarifai/runners/utils/__pycache__/data_handler.cpython-311.pyc +0 -0
  236. clarifai/runners/utils/__pycache__/data_handler.cpython-38.pyc +0 -0
  237. clarifai/runners/utils/__pycache__/data_handler.cpython-39.pyc +0 -0
  238. clarifai/runners/utils/__pycache__/data_utils.cpython-310.pyc +0 -0
  239. clarifai/runners/utils/__pycache__/data_utils.cpython-311.pyc +0 -0
  240. clarifai/runners/utils/__pycache__/data_utils.cpython-38.pyc +0 -0
  241. clarifai/runners/utils/__pycache__/data_utils.cpython-39.pyc +0 -0
  242. clarifai/runners/utils/__pycache__/grpc_server.cpython-310.pyc +0 -0
  243. clarifai/runners/utils/__pycache__/grpc_server.cpython-38.pyc +0 -0
  244. clarifai/runners/utils/__pycache__/grpc_server.cpython-39.pyc +0 -0
  245. clarifai/runners/utils/__pycache__/health.cpython-310.pyc +0 -0
  246. clarifai/runners/utils/__pycache__/health.cpython-38.pyc +0 -0
  247. clarifai/runners/utils/__pycache__/health.cpython-39.pyc +0 -0
  248. clarifai/runners/utils/__pycache__/loader.cpython-310.pyc +0 -0
  249. clarifai/runners/utils/__pycache__/loader.cpython-311.pyc +0 -0
  250. clarifai/runners/utils/__pycache__/logging.cpython-310.pyc +0 -0
  251. clarifai/runners/utils/__pycache__/logging.cpython-38.pyc +0 -0
  252. clarifai/runners/utils/__pycache__/logging.cpython-39.pyc +0 -0
  253. clarifai/runners/utils/__pycache__/stream_source.cpython-310.pyc +0 -0
  254. clarifai/runners/utils/__pycache__/stream_source.cpython-39.pyc +0 -0
  255. clarifai/runners/utils/__pycache__/url_fetcher.cpython-310.pyc +0 -0
  256. clarifai/runners/utils/__pycache__/url_fetcher.cpython-311.pyc +0 -0
  257. clarifai/runners/utils/__pycache__/url_fetcher.cpython-38.pyc +0 -0
  258. clarifai/runners/utils/__pycache__/url_fetcher.cpython-39.pyc +0 -0
  259. clarifai/runners/utils/data_handler.py +0 -231
  260. clarifai/runners/utils/data_handler_refract.py +0 -213
  261. clarifai/runners/utils/data_types.py +0 -469
  262. clarifai/runners/utils/logger.py +0 -0
  263. clarifai/runners/utils/openai_format.py +0 -87
  264. clarifai/schema/__pycache__/search.cpython-310.pyc +0 -0
  265. clarifai/schema/__pycache__/search.cpython-311.pyc +0 -0
  266. clarifai/urls/__pycache__/helper.cpython-310.pyc +0 -0
  267. clarifai/urls/__pycache__/helper.cpython-311.pyc +0 -0
  268. clarifai/utils/__pycache__/__init__.cpython-310.pyc +0 -0
  269. clarifai/utils/__pycache__/__init__.cpython-311.pyc +0 -0
  270. clarifai/utils/__pycache__/__init__.cpython-39.pyc +0 -0
  271. clarifai/utils/__pycache__/cli.cpython-310.pyc +0 -0
  272. clarifai/utils/__pycache__/cli.cpython-311.pyc +0 -0
  273. clarifai/utils/__pycache__/config.cpython-311.pyc +0 -0
  274. clarifai/utils/__pycache__/constants.cpython-310.pyc +0 -0
  275. clarifai/utils/__pycache__/constants.cpython-311.pyc +0 -0
  276. clarifai/utils/__pycache__/logging.cpython-310.pyc +0 -0
  277. clarifai/utils/__pycache__/logging.cpython-311.pyc +0 -0
  278. clarifai/utils/__pycache__/misc.cpython-310.pyc +0 -0
  279. clarifai/utils/__pycache__/misc.cpython-311.pyc +0 -0
  280. clarifai/utils/__pycache__/model_train.cpython-310.pyc +0 -0
  281. clarifai/utils/__pycache__/model_train.cpython-311.pyc +0 -0
  282. clarifai/utils/__pycache__/protobuf.cpython-311.pyc +0 -0
  283. clarifai/utils/evaluation/__pycache__/__init__.cpython-311.pyc +0 -0
  284. clarifai/utils/evaluation/__pycache__/__init__.cpython-39.pyc +0 -0
  285. clarifai/utils/evaluation/__pycache__/helpers.cpython-311.pyc +0 -0
  286. clarifai/utils/evaluation/__pycache__/main.cpython-311.pyc +0 -0
  287. clarifai/utils/evaluation/__pycache__/main.cpython-39.pyc +0 -0
  288. clarifai/workflows/__pycache__/__init__.cpython-310.pyc +0 -0
  289. clarifai/workflows/__pycache__/__init__.cpython-311.pyc +0 -0
  290. clarifai/workflows/__pycache__/__init__.cpython-39.pyc +0 -0
  291. clarifai/workflows/__pycache__/export.cpython-310.pyc +0 -0
  292. clarifai/workflows/__pycache__/export.cpython-311.pyc +0 -0
  293. clarifai/workflows/__pycache__/utils.cpython-310.pyc +0 -0
  294. clarifai/workflows/__pycache__/utils.cpython-311.pyc +0 -0
  295. clarifai/workflows/__pycache__/validate.cpython-310.pyc +0 -0
  296. clarifai/workflows/__pycache__/validate.cpython-311.pyc +0 -0
  297. clarifai-11.3.0rc2.dist-info/RECORD +0 -322
  298. {clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/entry_points.txt +0 -0
  299. {clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info/licenses}/LICENSE +0 -0
  300. {clarifai-11.3.0rc2.dist-info → clarifai-11.4.0.dist-info}/top_level.txt +0 -0
clarifai/utils/evaluation/helpers.py
@@ -13,515 +13,552 @@ from clarifai.client.dataset import Dataset
 from clarifai.client.model import Model

 try:
-  import pandas as pd
+    import pandas as pd
 except ImportError:
-  raise ImportError("Can not import pandas. Please run `pip install pandas` to install it")
+    raise ImportError("Can not import pandas. Please run `pip install pandas` to install it")

 try:
-  from loguru import logger
+    from loguru import logger
 except ImportError:
-  from ..logging import logger
+    from ..logging import logger

 MACRO_AVG = "macro_avg"


 class EvalType(Enum):
-  UNDEFINED = 0
-  CLASSIFICATION = 1
-  DETECTION = 2
-  CLUSTERING = 3
-  SEGMENTATION = 4
-  TRACKER = 5
+    UNDEFINED = 0
+    CLASSIFICATION = 1
+    DETECTION = 2
+    CLUSTERING = 3
+    SEGMENTATION = 4
+    TRACKER = 5


 def get_eval_type(model_type):
-  if "classifier" in model_type:
-    return EvalType.CLASSIFICATION
-  elif "visual-detector" in model_type:
-    return EvalType.DETECTION
-  elif "segmenter" in model_type:
-    return EvalType.SEGMENTATION
-  elif "embedder" in model_type:
-    return EvalType.CLUSTERING
-  elif "tracker" in model_type:
-    return EvalType.TRACKER
-  else:
-    return EvalType.UNDEFINED
+    if "classifier" in model_type:
+        return EvalType.CLASSIFICATION
+    elif "visual-detector" in model_type:
+        return EvalType.DETECTION
+    elif "segmenter" in model_type:
+        return EvalType.SEGMENTATION
+    elif "embedder" in model_type:
+        return EvalType.CLUSTERING
+    elif "tracker" in model_type:
+        return EvalType.TRACKER
+    else:
+        return EvalType.UNDEFINED


 def to_file_name(x) -> str:
-  return x.replace('/', '--')
+    return x.replace('/', '--')


 @dataclass
 class _BaseEvalResultHandler:
-  model: Model
-  eval_data: List[resources_pb2.EvalMetrics] = field(default_factory=list)
-
-  def evaluate_and_wait(self, dataset: Dataset, eval_info: dict = None):
-    from tqdm import tqdm
-    dataset_id = dataset.id
-    dataset_app_id = dataset.app_id
-    dataset_user_id = dataset.user_id
-    _ = self.model.evaluate(
-        dataset_id=dataset_id,
-        dataset_app_id=dataset_app_id,
-        dataset_user_id=dataset_user_id,
-        eval_info=eval_info)
-    latest_eval = self.model.list_evaluations()[0]
-    excepted = 10
-    desc = f"Please wait for the evaluation process between model {self.get_model_name()} and dataset {dataset_user_id}/{dataset_app_id}/{dataset_id} to complete."
-    bar = tqdm(total=excepted, desc=desc, leave=False, ncols=0)
-    while latest_eval.status.code in [
-        status_code_pb2.MODEL_EVALUATING, status_code_pb2.MODEL_QUEUED_FOR_EVALUATION
-    ]:
-      latest_eval = self.model.list_evaluations()[0]
-      time.sleep(1)
-      bar.update(1)
-
-    if latest_eval.status.code == status_code_pb2.MODEL_EVALUATED:
-      return latest_eval
-    else:
-      raise Exception(
-          f"Model has failed to evaluate \n {latest_eval.status}.\nPlease check your dataset inputs!"
-      )
-
-  def find_eval_id(self,
-                   datasets: List[Dataset] = [],
-                   attempt_evaluate: bool = False,
-                   eval_info: dict = None):
-    list_eval_outputs = self.model.list_evaluations()
-    self.eval_data = []
-    for dataset in datasets:
-      dataset.app_id = dataset.app_id or self.model.auth_helper.app_id
-      dataset.user_id = dataset.user_id or self.model.auth_helper.user_id
-      dataset_assert_msg = dataset.dataset_info
-      # checking if dataset exists
-      out = dataset.list_versions()
-      try:
-        next(iter(out))
-      except Exception as e:
-        if any(["CONN_DOES_NOT_EXIST" in _e for _e in e.args]):
-          raise Exception(
-              f"Dataset {dataset_assert_msg} does not exists. Please check datasets args")
+    model: Model
+    eval_data: List[resources_pb2.EvalMetrics] = field(default_factory=list)
+
+    def evaluate_and_wait(self, dataset: Dataset, eval_info: dict = None):
+        from tqdm import tqdm
+
+        dataset_id = dataset.id
+        dataset_app_id = dataset.app_id
+        dataset_user_id = dataset.user_id
+        _ = self.model.evaluate(
+            dataset_id=dataset_id,
+            dataset_app_id=dataset_app_id,
+            dataset_user_id=dataset_user_id,
+            eval_info=eval_info,
+        )
+        latest_eval = self.model.list_evaluations()[0]
+        excepted = 10
+        desc = f"Please wait for the evaluation process between model {self.get_model_name()} and dataset {dataset_user_id}/{dataset_app_id}/{dataset_id} to complete."
+        bar = tqdm(total=excepted, desc=desc, leave=False, ncols=0)
+        while latest_eval.status.code in [
+            status_code_pb2.MODEL_EVALUATING,
+            status_code_pb2.MODEL_QUEUED_FOR_EVALUATION,
+        ]:
+            latest_eval = self.model.list_evaluations()[0]
+            time.sleep(1)
+            bar.update(1)
+
+        if latest_eval.status.code == status_code_pb2.MODEL_EVALUATED:
+            return latest_eval
         else:
-          # caused by sdk failure
-          pass
-      # checking if model is evaluated with this dataset
-      _is_found = False
-      for each in list_eval_outputs:
-        if each.status.code == status_code_pb2.MODEL_EVALUATED:
-          eval_dataset = each.ground_truth_dataset
-          # if version_id is empty -> get latest eval result of dataset,app,user id
-          if dataset.app_id == eval_dataset.app_id and dataset.id == eval_dataset.id and dataset.user_id == eval_dataset.user_id and (
-              not dataset.version.id or dataset.version.id == eval_dataset.version.id):
-            # append to eval_data
-            self.eval_data.append(each)
-            _is_found = True
-            break
-
-      # if not evaluated, but user wants to proceed it
-      if not _is_found:
-        if attempt_evaluate:
-          self.eval_data.append(self.evaluate_and_wait(dataset, eval_info=eval_info))
-        # otherwise raise error
+            raise Exception(
+                f"Model has failed to evaluate \n {latest_eval.status}.\nPlease check your dataset inputs!"
+            )
+
+    def find_eval_id(
+        self, datasets: List[Dataset] = [], attempt_evaluate: bool = False, eval_info: dict = None
+    ):
+        list_eval_outputs = self.model.list_evaluations()
+        self.eval_data = []
+        for dataset in datasets:
+            dataset.app_id = dataset.app_id or self.model.auth_helper.app_id
+            dataset.user_id = dataset.user_id or self.model.auth_helper.user_id
+            dataset_assert_msg = dataset.dataset_info
+            # checking if dataset exists
+            out = dataset.list_versions()
+            try:
+                next(iter(out))
+            except Exception as e:
+                if any(["CONN_DOES_NOT_EXIST" in _e for _e in e.args]):
+                    raise Exception(
+                        f"Dataset {dataset_assert_msg} does not exists. Please check datasets args"
+                    )
+                else:
+                    # caused by sdk failure
+                    pass
+            # checking if model is evaluated with this dataset
+            _is_found = False
+            for each in list_eval_outputs:
+                if each.status.code == status_code_pb2.MODEL_EVALUATED:
+                    eval_dataset = each.ground_truth_dataset
+                    # if version_id is empty -> get latest eval result of dataset,app,user id
+                    if (
+                        dataset.app_id == eval_dataset.app_id
+                        and dataset.id == eval_dataset.id
+                        and dataset.user_id == eval_dataset.user_id
+                        and (
+                            not dataset.version.id or dataset.version.id == eval_dataset.version.id
+                        )
+                    ):
+                        # append to eval_data
+                        self.eval_data.append(each)
+                        _is_found = True
+                        break
+
+            # if not evaluated, but user wants to proceed it
+            if not _is_found:
+                if attempt_evaluate:
+                    self.eval_data.append(self.evaluate_and_wait(dataset, eval_info=eval_info))
+                # otherwise raise error
+                else:
+                    raise Exception(
+                        f"Model {self.model.model_info.name} in app {self.model.model_info.app_id} is not evaluated yet with dataset {dataset_assert_msg}"
+                    )
+
+    @staticmethod
+    def proto_to_dict(value):
+        return MessageToDict(value, preserving_proto_field_name=True)
+
+    @staticmethod
+    def _f1(x: float, y: float):
+        z = x + y
+        return 2 * x * y / z if z else 0.0
+
+    def _get_eval(self, index=0, **kwargs):
+        logger.info(
+            f"Model {self.get_model_name(pretify=True)}: retrieving {kwargs} metrics of dataset: {self.get_dataset_name_by_index(index)}"
+        )
+        result = self.model.get_eval_by_id(eval_id=self.eval_data[index].id, **kwargs)
+        for k, v in kwargs.items():
+            if v:
+                getattr(self.eval_data[index], k).MergeFrom(getattr(result, k))
+
+    def get_eval_data(self, metric_name: str, index=0):
+        if metric_name == 'binary_metrics':
+            if len(self.eval_data[index].binary_metrics) == 0:
+                self._get_eval(index, binary_metrics=True)
+        elif metric_name == 'label_counts':
+            if self.proto_to_dict(self.eval_data[index].label_counts) == {}:
+                self._get_eval(index, label_counts=True)
+        elif metric_name == 'confusion_matrix':
+            if self.eval_data[index].confusion_matrix.ByteSize() == 0:
+                self._get_eval(index, confusion_matrix=True)
+        elif metric_name == 'metrics_by_class':
+            if len(self.eval_data[index].metrics_by_class) == 0:
+                self._get_eval(index, metrics_by_class=True)
+        elif metric_name == 'metrics_by_area':
+            if len(self.eval_data[index].metrics_by_area) == 0:
+                self._get_eval(index, metrics_by_area=True)
+
+        return getattr(self.eval_data[index], metric_name)
+
+    def get_threshold_index(self, threshold_list: list, selected_value: float = 0.5) -> int:
+        assert 0 <= selected_value <= 1 and isinstance(selected_value, float)
+        threshold_list = [round(each, 2) for each in threshold_list]
+
+        def parse_precision(x):
+            return len(str(x).split(".")[1])
+
+        precision = parse_precision(selected_value)
+        if precision > 2:
+            selected_value = round(selected_value, 2)
+            logger.warning("Round the selected value to .2 decimals")
+        return threshold_list.index(selected_value)
+
+    def get_dataset_name_by_index(self, index=0, pretify=True):
+        out = self.eval_data[index].ground_truth_dataset
+        if pretify:
+            app_id = out.app_id
+            dataset = out.id
+            # out = f"{app_id}/{dataset}/{ver[:5]}" if ver else f"{app_id}/{dataset}"
+            if self.model.model_info.app_id == app_id:
+                out = dataset
+            else:
+                out = f"{app_id}/{dataset}"
+
+        return out
+
+    def get_model_name(self, pretify=True):
+        model = self.model.model_info
+        if pretify:
+            app_id = model.app_id
+            name = model.id
+            ver = model.model_version.id
+            model = f"{app_id}/{name}/{ver[:5]}" if ver else f"{app_id}/{name}"
+
+        return model
+
+    def _process_curve(
+        self, data: resources_pb2.BinaryMetrics, metric_name: str, x: str, y: str
+    ) -> Dict[str, Dict[str, np.array]]:
+        """Postprocess curve"""
+        x_arr = []
+        y_arr = []
+        threshold = []
+        outputs = []
+
+        def _make_df(xcol, ycol, concept_col, th_col):
+            return pd.DataFrame({x: xcol, y: ycol, 'concept': concept_col, 'threshold': th_col})
+
+        for bd in data:
+            concept_id = bd.concept.id
+            metric = eval(f'bd.{metric_name}')
+            if metric.ByteSize() == 0:
+                continue
+            _x = np.array(eval(f'metric.{x}'))
+            _y = np.array(eval(f'metric.{y}'))
+            threshold = np.array(metric.thresholds)
+            x_arr.append(_x)
+            y_arr.append(_y)
+            concept_cols = [concept_id for _ in range(len(_x))]
+            outputs.append(_make_df(_x, _y, concept_cols, threshold))
+
+        avg_x = np.mean(x_arr, axis=0)
+        avg_y = np.mean(y_arr, axis=0)
+        if np.isnan(avg_x).all():
+            return None
         else:
-          raise Exception(
-              f"Model {self.model.model_info.name} in app {self.model.model_info.app_id} is not evaluated yet with dataset {dataset_assert_msg}"
-          )
-
-  @staticmethod
-  def proto_to_dict(value):
-    return MessageToDict(value, preserving_proto_field_name=True)
-
-  @staticmethod
-  def _f1(x: float, y: float):
-    z = x + y
-    return 2 * x * y / z if z else 0.
-
-  def _get_eval(self, index=0, **kwargs):
-    logger.info(
-        f"Model {self.get_model_name(pretify=True)}: retrieving {kwargs} metrics of dataset: {self.get_dataset_name_by_index(index)}"
-    )
-    result = self.model.get_eval_by_id(eval_id=self.eval_data[index].id, **kwargs)
-    for k, v in kwargs.items():
-      if v:
-        getattr(self.eval_data[index], k).MergeFrom(getattr(result, k))
-
-  def get_eval_data(self, metric_name: str, index=0):
-    if metric_name == 'binary_metrics':
-      if len(self.eval_data[index].binary_metrics) == 0:
-        self._get_eval(index, binary_metrics=True)
-    elif metric_name == 'label_counts':
-      if self.proto_to_dict(self.eval_data[index].label_counts) == {}:
-        self._get_eval(index, label_counts=True)
-    elif metric_name == 'confusion_matrix':
-      if self.eval_data[index].confusion_matrix.ByteSize() == 0:
-        self._get_eval(index, confusion_matrix=True)
-    elif metric_name == 'metrics_by_class':
-      if len(self.eval_data[index].metrics_by_class) == 0:
-        self._get_eval(index, metrics_by_class=True)
-    elif metric_name == 'metrics_by_area':
-      if len(self.eval_data[index].metrics_by_area) == 0:
-        self._get_eval(index, metrics_by_area=True)
-
-    return getattr(self.eval_data[index], metric_name)
-
-  def get_threshold_index(self, threshold_list: list, selected_value: float = 0.5) -> int:
-    assert 0 <= selected_value <= 1 and isinstance(selected_value, float)
-    threshold_list = [round(each, 2) for each in threshold_list]
-
-    def parse_precision(x):
-      return len(str(x).split(".")[1])
-
-    precision = parse_precision(selected_value)
-    if precision > 2:
-      selected_value = round(selected_value, 2)
-      logger.warning("Round the selected value to .2 decimals")
-    return threshold_list.index(selected_value)
-
-  def get_dataset_name_by_index(self, index=0, pretify=True):
-    out = self.eval_data[index].ground_truth_dataset
-    if pretify:
-      app_id = out.app_id
-      dataset = out.id
-      #out = f"{app_id}/{dataset}/{ver[:5]}" if ver else f"{app_id}/{dataset}"
-      if self.model.model_info.app_id == app_id:
-        out = dataset
-      else:
-        out = f"{app_id}/{dataset}"
-
-    return out
-
-  def get_model_name(self, pretify=True):
-    model = self.model.model_info
-    if pretify:
-      app_id = model.app_id
-      name = model.id
-      ver = model.model_version.id
-      model = f"{app_id}/{name}/{ver[:5]}" if ver else f"{app_id}/{name}"
-
-    return model
-
-  def _process_curve(self, data: resources_pb2.BinaryMetrics, metric_name: str, x: str,
-                     y: str) -> Dict[str, Dict[str, np.array]]:
-    """ Postprocess curve
-    """
-    x_arr = []
-    y_arr = []
-    threshold = []
-    outputs = []
-
-    def _make_df(xcol, ycol, concept_col, th_col):
-      return pd.DataFrame({x: xcol, y: ycol, 'concept': concept_col, 'threshold': th_col})
-
-    for bd in data:
-      concept_id = bd.concept.id
-      metric = eval(f'bd.{metric_name}')
-      if metric.ByteSize() == 0:
-        continue
-      _x = np.array(eval(f'metric.{x}'))
-      _y = np.array(eval(f'metric.{y}'))
-      threshold = np.array(metric.thresholds)
-      x_arr.append(_x)
-      y_arr.append(_y)
-      concept_cols = [concept_id for _ in range(len(_x))]
-      outputs.append(_make_df(_x, _y, concept_cols, threshold))
-
-    avg_x = np.mean(x_arr, axis=0)
-    avg_y = np.mean(y_arr, axis=0)
-    if np.isnan(avg_x).all():
-      return None
-    else:
-      avg_cols = [MACRO_AVG for _ in range(len(avg_x))]
-      outputs.append(_make_df(avg_x, avg_y, avg_cols, threshold))
+            avg_cols = [MACRO_AVG for _ in range(len(avg_x))]
+            outputs.append(_make_df(avg_x, avg_y, avg_cols, threshold))

-    return pd.concat(outputs, axis=0)
+        return pd.concat(outputs, axis=0)

-  def parse_concept_ids(self, *args, **kwargs) -> List[str]:
-    raise NotImplementedError
+    def parse_concept_ids(self, *args, **kwargs) -> List[str]:
+        raise NotImplementedError

-  def detailed_summary(self, *args, **kwargs):
-    raise NotImplementedError
+    def detailed_summary(self, *args, **kwargs):
+        raise NotImplementedError

-  def pr_curve(self, *args, **kwargs):
-    raise NotImplementedError
+    def pr_curve(self, *args, **kwargs):
+        raise NotImplementedError

-  def roc_curve(self, *args, **kwargs):
-    raise NotImplementedError
+    def roc_curve(self, *args, **kwargs):
+        raise NotImplementedError

-  def confusion_matrix(self, *args, **kwargs):
-    raise NotImplementedError
+    def confusion_matrix(self, *args, **kwargs):
+        raise NotImplementedError


 @dataclass
 class PlaceholderHandler(_BaseEvalResultHandler):
+    def parse_concept_ids(self, *args, **kwargs) -> List[str]:
+        return None

-  def parse_concept_ids(self, *args, **kwargs) -> List[str]:
-    return None
+    def detailed_summary(self, *args, **kwargs):
+        return None

-  def detailed_summary(self, *args, **kwargs):
-    return None
-
-  def pr_curve(self, *args, **kwargs):
-    return None
+    def pr_curve(self, *args, **kwargs):
+        return None


 @dataclass
 class ClassificationResultHandler(_BaseEvalResultHandler):
-
-  def parse_concept_ids(self, index=0) -> List[str]:
-    eval_data = self.get_eval_data(metric_name='label_counts', index=index)
-    concept_ids = [temp.concept.id for temp in eval_data.positive_label_counts]
-    return concept_ids
-
-  def detailed_summary(self, index=0, confidence_threshold: float = 0.5,
-                       **kwargs) -> Union[None, Tuple[pd.DataFrame, pd.DataFrame]]:
-    """Making detailed table per concept and for total concept
-
-    Args:
-      index (int, optional): Index of eval dataset. Defaults to 0.
-      confidence_threshold (float, optional): confidence threshold. Defaults to 0.5.
-
-    Returns:
-      tuple: concepts dataframe, total dataframe
-    """
-    eval_data = self.get_eval_data('binary_metrics', index=index)
-    summary = self.get_eval_data('summary', index=index)
-
-    total_labeled = 0
-    total_predicted = 0
-    total_tp = 0
-    total_fn = 0
-    total_fp = 0
-    metrics = []
-
-    for bd in eval_data:
-      concept_id = bd.concept.id
-      if bd.precision_recall_curve.ByteSize() == 0:
-        continue
-      pr_th_index = self.get_threshold_index(
-          list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold)
-      roc_th_index = self.get_threshold_index(
-          list(bd.roc_curve.thresholds), selected_value=confidence_threshold)
-      if pr_th_index is None or roc_th_index is None:
-        continue
-      num_pos_labeled = bd.num_pos
-      num_neg_labeled = bd.num_neg
-      # TP/(TP+FP)
-      precision = bd.precision_recall_curve.precision[pr_th_index]
-      # TP/(TP+FN)
-      recall = bd.precision_recall_curve.recall[pr_th_index]
-      # FP/(FP+TN)
-      fpr = bd.roc_curve.fpr[roc_th_index]
-      # TP/(TP+FN)
-      tpr = bd.roc_curve.tpr[roc_th_index]
-      # TP+FN
-      tp = int(tpr * num_pos_labeled)
-      fn = num_pos_labeled - tp
-      fp = int(fpr * num_neg_labeled)
-      num_pos_pred = tp + fp
-      f1 = self._f1(recall, precision)
-
-      total_labeled += num_pos_labeled
-      total_predicted += num_pos_pred
-      total_fn += fn
-      total_tp += tp
-      total_fp += fp
-      # roc auc, total labelled, predicted, tp, fn, fp, recall, precision, f1
-      _d = OrderedDict({
-          "Concept": concept_id,
-          "Accuracy (ROC AUC)": round(bd.roc_auc, 3),
-          "Total Labeled": num_pos_labeled,
-          "Total Predicted": num_pos_pred,
-          "True Positives": tp,
-          "False Negatives": fn,
-          "False Positives": fp,
-          "Recall": recall,
-          "Precision": precision,
-          "F1": f1
-      })
-      metrics.append(pd.DataFrame(_d, index=[0]))
-
-    # If no valid data is found, return None
-    if not metrics:
-      return None
-    # Make per concept df
-    df = pd.concat(metrics, axis=0)
-    # Make total df
-    sum_df_total = sum(df["Total Labeled"])
-    precision = sum(df.Precision * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.
-    recall = sum(df.Recall * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.
-    f1 = self._f1(recall, precision)
-    df_total = pd.DataFrame(
-        [
+    def parse_concept_ids(self, index=0) -> List[str]:
+        eval_data = self.get_eval_data(metric_name='label_counts', index=index)
+        concept_ids = [temp.concept.id for temp in eval_data.positive_label_counts]
+        return concept_ids
+
+    def detailed_summary(
+        self, index=0, confidence_threshold: float = 0.5, **kwargs
+    ) -> Union[None, Tuple[pd.DataFrame, pd.DataFrame]]:
+        """Making detailed table per concept and for total concept
+
+        Args:
+            index (int, optional): Index of eval dataset. Defaults to 0.
+            confidence_threshold (float, optional): confidence threshold. Defaults to 0.5.
+
+        Returns:
+            tuple: concepts dataframe, total dataframe
+        """
+        eval_data = self.get_eval_data('binary_metrics', index=index)
+        summary = self.get_eval_data('summary', index=index)
+
+        total_labeled = 0
+        total_predicted = 0
+        total_tp = 0
+        total_fn = 0
+        total_fp = 0
+        metrics = []
+
+        for bd in eval_data:
+            concept_id = bd.concept.id
+            if bd.precision_recall_curve.ByteSize() == 0:
+                continue
+            pr_th_index = self.get_threshold_index(
+                list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold
+            )
+            roc_th_index = self.get_threshold_index(
+                list(bd.roc_curve.thresholds), selected_value=confidence_threshold
+            )
+            if pr_th_index is None or roc_th_index is None:
+                continue
+            num_pos_labeled = bd.num_pos
+            num_neg_labeled = bd.num_neg
+            # TP/(TP+FP)
+            precision = bd.precision_recall_curve.precision[pr_th_index]
+            # TP/(TP+FN)
+            recall = bd.precision_recall_curve.recall[pr_th_index]
+            # FP/(FP+TN)
+            fpr = bd.roc_curve.fpr[roc_th_index]
+            # TP/(TP+FN)
+            tpr = bd.roc_curve.tpr[roc_th_index]
+            # TP+FN
+            tp = int(tpr * num_pos_labeled)
+            fn = num_pos_labeled - tp
+            fp = int(fpr * num_neg_labeled)
+            num_pos_pred = tp + fp
+            f1 = self._f1(recall, precision)
+
+            total_labeled += num_pos_labeled
+            total_predicted += num_pos_pred
+            total_fn += fn
+            total_tp += tp
+            total_fp += fp
+            # roc auc, total labelled, predicted, tp, fn, fp, recall, precision, f1
+            _d = OrderedDict(
+                {
+                    "Concept": concept_id,
+                    "Accuracy (ROC AUC)": round(bd.roc_auc, 3),
+                    "Total Labeled": num_pos_labeled,
+                    "Total Predicted": num_pos_pred,
+                    "True Positives": tp,
+                    "False Negatives": fn,
+                    "False Positives": fp,
+                    "Recall": recall,
+                    "Precision": precision,
+                    "F1": f1,
+                }
+            )
+            metrics.append(pd.DataFrame(_d, index=[0]))
+
+        # If no valid data is found, return None
+        if not metrics:
+            return None
+        # Make per concept df
+        df = pd.concat(metrics, axis=0)
+        # Make total df
+        sum_df_total = sum(df["Total Labeled"])
+        precision = sum(df.Precision * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.0
+        recall = sum(df.Recall * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.0
+        f1 = self._f1(recall, precision)
+        df_total = pd.DataFrame(
             [
-                'Total', summary.macro_avg_roc_auc, total_labeled, total_predicted, total_tp,
-                total_fn, total_fp, recall, precision, f1
+                [
+                    'Total',
+                    summary.macro_avg_roc_auc,
+                    total_labeled,
+                    total_predicted,
+                    total_tp,
+                    total_fn,
+                    total_fp,
+                    recall,
+                    precision,
+                    f1,
+                ],
             ],
-        ],
-        columns=df.columns,
-        index=[0])
-
-    return df, df_total
-
-  def pr_curve(self, index=0, **kwargs) -> Union[None, pd.DataFrame]:
-    """Making PR curve
-
-    Args:
-      index (int, optional): Index of eval dataset. Defaults to 0.
-
-    Returns:
-      dictionary: Keys are concept ids and 'macro_avg'. Values are dictionaries of {precision: np.array, recall: np.array}
-    """
-    eval_data = self.get_eval_data(metric_name='binary_metrics', index=index)
-    outputs = self._process_curve(
-        eval_data, metric_name='precision_recall_curve', x='recall', y='precision')
-    return outputs
-
-  def roc_curve(self, index=0, **kwargs) -> Union[None, pd.DataFrame]:
-    eval_data = self.get_eval_data(metric_name='binary_metrics', index=index)
-    outputs = self._process_curve(eval_data, metric_name='roc_curve', x='tpr', y='fpr')
-    return outputs
-
-  def confusion_matrix(self, index=0, **kwargs):
-    eval_data = self.get_eval_data(metric_name='confusion_matrix', index=index)
-    concept_ids = self.parse_concept_ids(index)
-    concept_ids.sort()
-    data = np.zeros((len(concept_ids), len(concept_ids)), np.float32)
-    for entry in eval_data.matrix:
-      p = entry.predicted_concept.id
-      a = entry.actual_concept.id
-      if p in concept_ids and a in concept_ids:
-        data[concept_ids.index(a), concept_ids.index(p)] = np.around(entry.value, decimals=3)
-      else:
-        continue
-    rownames = pd.MultiIndex.from_arrays([concept_ids], names=['Actual'])
-    colnames = pd.MultiIndex.from_arrays([concept_ids], names=['Predicted'])
-    df = pd.DataFrame(data, columns=colnames, index=rownames)
-
-    return df
+            columns=df.columns,
+            index=[0],
+        )
+
+        return df, df_total
+
+    def pr_curve(self, index=0, **kwargs) -> Union[None, pd.DataFrame]:
+        """Making PR curve
+
+        Args:
+            index (int, optional): Index of eval dataset. Defaults to 0.
+
+        Returns:
+            dictionary: Keys are concept ids and 'macro_avg'. Values are dictionaries of {precision: np.array, recall: np.array}
+        """
+        eval_data = self.get_eval_data(metric_name='binary_metrics', index=index)
+        outputs = self._process_curve(
+            eval_data, metric_name='precision_recall_curve', x='recall', y='precision'
+        )
+        return outputs
+
+    def roc_curve(self, index=0, **kwargs) -> Union[None, pd.DataFrame]:
+        eval_data = self.get_eval_data(metric_name='binary_metrics', index=index)
+        outputs = self._process_curve(eval_data, metric_name='roc_curve', x='tpr', y='fpr')
+        return outputs
+
+    def confusion_matrix(self, index=0, **kwargs):
+        eval_data = self.get_eval_data(metric_name='confusion_matrix', index=index)
+        concept_ids = self.parse_concept_ids(index)
+        concept_ids.sort()
+        data = np.zeros((len(concept_ids), len(concept_ids)), np.float32)
+        for entry in eval_data.matrix:
+            p = entry.predicted_concept.id
+            a = entry.actual_concept.id
+            if p in concept_ids and a in concept_ids:
+                data[concept_ids.index(a), concept_ids.index(p)] = np.around(
+                    entry.value, decimals=3
+                )
+            else:
+                continue
+        rownames = pd.MultiIndex.from_arrays([concept_ids], names=['Actual'])
+        colnames = pd.MultiIndex.from_arrays([concept_ids], names=['Predicted'])
+        df = pd.DataFrame(data, columns=colnames, index=rownames)
+
+        return df


 @dataclass
 class DetectionResultHandler(_BaseEvalResultHandler):
-  AREA_LIST = ["all", "medium", "small"]
-  IOU_LIST = list(np.arange(0.5, 1., 0.1))
-
-  def parse_concept_ids(self, index=0) -> List[str]:
-    eval_data = self.get_eval_data(metric_name='metrics_by_class', index=index)
-    concept_ids = [temp.concept.id for temp in eval_data]
-    return concept_ids
-
-  def detailed_summary(self,
-                       index=0,
-                       confidence_threshold: float = 0.5,
-                       iou_threshold: float = 0.5,
-                       area: str = "all",
-                       bypass_const: bool = False,
-                       **kwargs):
-    if not bypass_const:
-      assert iou_threshold in self.IOU_LIST, f"Expected iou_threshold in {self.IOU_LIST}, got {iou_threshold}"
-      assert area in self.AREA_LIST, f"Expected area in {self.AREA_LIST}, got {area}"
-
-    eval_data = self.get_eval_data('metrics_by_class', index=index)
-    #summary = self.get_eval_data('summary', index=index)
-    metrics = []
-    for bd in eval_data:
-      # total label
-      _iou = round(bd.iou, 1)
-      if not (area and bd.area_name == area) or not (iou_threshold and iou_threshold == _iou):
-        continue
-      concept_id = bd.concept.id
-      total = round(bd.num_tot, 3)
-      # TP / (TP + FP)
-      if len(bd.precision_recall_curve.precision) > 0:
-        pr_th_index = self.get_threshold_index(
-            list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold)
-        p = round(bd.precision_recall_curve.precision[pr_th_index], 3)
-      else:
-        p = 0
-      # TP / (TP + FN)
-      if len(bd.precision_recall_curve.recall) > 0:
-        pr_th_index = self.get_threshold_index(
-            list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold)
-        r = round(bd.precision_recall_curve.recall[pr_th_index], 3)
-      else:
-        r = 0
-      tp = int(round(r * total, 0))
-      fn = total - tp
-      fp = float(tp) / p - tp if p else 0
-      fp = int(round(fp, 1))
-      f1 = self._f1(r, p)
-      _d = {
-          "Concept": concept_id,
-          "Average Precision": round(float(bd.avg_precision), 3),
-          "Total Labeled": total,
-          "True Positives": tp,
-          "False Positives": fp,
-          "False Negatives": fn,
-          "Recall": r,
-          "Precision": p,
-          "F1": f1,
-      }
-      metrics.append(pd.DataFrame(_d, index=[0]))
-
-    if not metrics:
-      return None
-
-    df = pd.concat(metrics, axis=0)
-    df_total = defaultdict()
-    sum_df_total = df["Total Labeled"].sum()
-    df_total["Concept"] = "Total"
-    df_total["Average Precision"] = df["Average Precision"].mean()
-    df_total["Total Labeled"] = sum_df_total
-    df_total["True Positives"] = df["True Positives"].sum()
-    df_total["False Positives"] = df["False Positives"].sum()
-    df_total["False Negatives"] = df["False Negatives"].sum()
-    df_total["Recall"] = sum(
-        df.Recall * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.
-    df_total["Precision"] = df_total["True Positives"] / (
-        df_total["True Positives"] + df_total["False Positives"]) if sum_df_total else 0.
-    df_total["F1"] = self._f1(df_total["Recall"], df_total["Precision"])
-    df_total = pd.DataFrame(df_total, index=[0])
-
-    return [df, df_total]
-
-  def pr_curve(self,
-               index=0,
-               iou_threshold: float = 0.5,
-               area: str = "all",
-               bypass_const=False,
-               **kwargs):
-
-    if not bypass_const:
-      assert iou_threshold in self.IOU_LIST, f"Expected iou_threshold in {self.IOU_LIST}, got {iou_threshold}"
-      assert area in self.AREA_LIST, f"Expected area in {self.AREA_LIST}, got {area}"
-
-    eval_data = self.get_eval_data(metric_name='metrics_by_class', index=index)
-    _valid_eval_data = []
-    for bd in eval_data:
-      _iou = round(bd.iou, 1)
-      if not (area and bd.area_name == area) or not (iou_threshold and iou_threshold == _iou):
-        continue
-      _valid_eval_data.append(bd)
-
-    outputs = self._process_curve(
-        _valid_eval_data, metric_name='precision_recall_curve', x='recall', y='precision')
-    return outputs
-
-  def roc_curve(self, index=0, **kwargs) -> None:
-    return None
-
-  def confusion_matrix(self, index=0, **kwargs) -> None:
-    return None
+    AREA_LIST = ["all", "medium", "small"]
+    IOU_LIST = list(np.arange(0.5, 1.0, 0.1))
+
+    def parse_concept_ids(self, index=0) -> List[str]:
+        eval_data = self.get_eval_data(metric_name='metrics_by_class', index=index)
+        concept_ids = [temp.concept.id for temp in eval_data]
+        return concept_ids
+
+    def detailed_summary(
+        self,
+        index=0,
+        confidence_threshold: float = 0.5,
+        iou_threshold: float = 0.5,
+        area: str = "all",
+        bypass_const: bool = False,
+        **kwargs,
+    ):
+        if not bypass_const:
+            assert iou_threshold in self.IOU_LIST, (
+                f"Expected iou_threshold in {self.IOU_LIST}, got {iou_threshold}"
+            )
+            assert area in self.AREA_LIST, f"Expected area in {self.AREA_LIST}, got {area}"
+
+        eval_data = self.get_eval_data('metrics_by_class', index=index)
+        # summary = self.get_eval_data('summary', index=index)
+        metrics = []
+        for bd in eval_data:
+            # total label
+            _iou = round(bd.iou, 1)
+            if not (area and bd.area_name == area) or not (
+                iou_threshold and iou_threshold == _iou
+            ):
+                continue
+            concept_id = bd.concept.id
+            total = round(bd.num_tot, 3)
+            # TP / (TP + FP)
+            if len(bd.precision_recall_curve.precision) > 0:
+                pr_th_index = self.get_threshold_index(
+                    list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold
+                )
+                p = round(bd.precision_recall_curve.precision[pr_th_index], 3)
+            else:
+                p = 0
+            # TP / (TP + FN)
+            if len(bd.precision_recall_curve.recall) > 0:
+                pr_th_index = self.get_threshold_index(
+                    list(bd.precision_recall_curve.thresholds), selected_value=confidence_threshold
+                )
+                r = round(bd.precision_recall_curve.recall[pr_th_index], 3)
+            else:
+                r = 0
+            tp = int(round(r * total, 0))
+            fn = total - tp
+            fp = float(tp) / p - tp if p else 0
+            fp = int(round(fp, 1))
+            f1 = self._f1(r, p)
+            _d = {
+                "Concept": concept_id,
+                "Average Precision": round(float(bd.avg_precision), 3),
+                "Total Labeled": total,
+                "True Positives": tp,
+                "False Positives": fp,
+                "False Negatives": fn,
+                "Recall": r,
+                "Precision": p,
+                "F1": f1,
+            }
+            metrics.append(pd.DataFrame(_d, index=[0]))
+
+        if not metrics:
+            return None
+
+        df = pd.concat(metrics, axis=0)
+        df_total = defaultdict()
+        sum_df_total = df["Total Labeled"].sum()
+        df_total["Concept"] = "Total"
+        df_total["Average Precision"] = df["Average Precision"].mean()
+        df_total["Total Labeled"] = sum_df_total
+        df_total["True Positives"] = df["True Positives"].sum()
+        df_total["False Positives"] = df["False Positives"].sum()
+        df_total["False Negatives"] = df["False Negatives"].sum()
+        df_total["Recall"] = (
+            sum(df.Recall * df["Total Labeled"]) / sum_df_total if sum_df_total else 0.0
+        )
+        df_total["Precision"] = (
+            df_total["True Positives"] / (df_total["True Positives"] + df_total["False Positives"])
+            if sum_df_total
+            else 0.0
+        )
+        df_total["F1"] = self._f1(df_total["Recall"], df_total["Precision"])
+        df_total = pd.DataFrame(df_total, index=[0])
+
+        return [df, df_total]
+
+    def pr_curve(
+        self, index=0, iou_threshold: float = 0.5, area: str = "all", bypass_const=False, **kwargs
+    ):
+        if not bypass_const:
+            assert iou_threshold in self.IOU_LIST, (
+                f"Expected iou_threshold in {self.IOU_LIST}, got {iou_threshold}"
+            )
+            assert area in self.AREA_LIST, f"Expected area in {self.AREA_LIST}, got {area}"
+
+        eval_data = self.get_eval_data(metric_name='metrics_by_class', index=index)
+        _valid_eval_data = []
+        for bd in eval_data:
+            _iou = round(bd.iou, 1)
+            if not (area and bd.area_name == area) or not (
+                iou_threshold and iou_threshold == _iou
+            ):
+                continue
+            _valid_eval_data.append(bd)
+
+        outputs = self._process_curve(
+            _valid_eval_data, metric_name='precision_recall_curve', x='recall', y='precision'
+        )
+        return outputs
+
+    def roc_curve(self, index=0, **kwargs) -> None:
+        return None
+
+    def confusion_matrix(self, index=0, **kwargs) -> None:
+        return None


 def make_handler_by_type(model_type: str) -> _BaseEvalResultHandler:
-  _eval_type = get_eval_type(model_type)
-  if _eval_type == EvalType.CLASSIFICATION:
-    return ClassificationResultHandler
-  elif _eval_type == EvalType.DETECTION:
-    return DetectionResultHandler
-  else:
-    return PlaceholderHandler
+    _eval_type = get_eval_type(model_type)
+    if _eval_type == EvalType.CLASSIFICATION:
+        return ClassificationResultHandler
+    elif _eval_type == EvalType.DETECTION:
+        return DetectionResultHandler
+    else:
+        return PlaceholderHandler
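
For orientation, a minimal sketch of how the handlers in this hunk are typically driven. It is illustrative only: the user/app/model/dataset IDs below are placeholders, the model type string is assumed to be a classifier, and a valid PAT is assumed to be available (e.g. in the CLARIFAI_PAT environment variable).

# Illustrative sketch, not part of the diff; all IDs are placeholders.
from clarifai.client.dataset import Dataset
from clarifai.client.model import Model
from clarifai.utils.evaluation.helpers import make_handler_by_type

model = Model(model_id="my-classifier", user_id="me", app_id="my-app")
dataset = Dataset(dataset_id="test-set", user_id="me", app_id="my-app")

# Pick the handler class from the model type id (e.g. "visual-classifier"),
# then locate an existing evaluation or trigger one and wait for it.
handler = make_handler_by_type("visual-classifier")(model=model)
handler.find_eval_id(datasets=[dataset], attempt_evaluate=True)

# Per-concept and aggregate tables at a 0.5 confidence threshold;
# detailed_summary returns None when no valid metrics exist.
summary = handler.detailed_summary(index=0, confidence_threshold=0.5)
if summary is not None:
    df_concepts, df_total = summary
    print(df_total)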