PyPI - triton-model-analyzer - Versions diffs - 1.48.0__py3-none-any.whl - Mend

triton-model-analyzer 1.48.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (204) hide show

model_analyzer/__init__.py +15 -0
model_analyzer/analyzer.py +448 -0
model_analyzer/cli/__init__.py +15 -0
model_analyzer/cli/cli.py +193 -0
model_analyzer/config/__init__.py +15 -0
model_analyzer/config/generate/__init__.py +15 -0
model_analyzer/config/generate/automatic_model_config_generator.py +164 -0
model_analyzer/config/generate/base_model_config_generator.py +352 -0
model_analyzer/config/generate/brute_plus_binary_parameter_search_run_config_generator.py +164 -0
model_analyzer/config/generate/brute_run_config_generator.py +154 -0
model_analyzer/config/generate/concurrency_sweeper.py +75 -0
model_analyzer/config/generate/config_generator_interface.py +52 -0
model_analyzer/config/generate/coordinate.py +143 -0
model_analyzer/config/generate/coordinate_data.py +86 -0
model_analyzer/config/generate/generator_utils.py +116 -0
model_analyzer/config/generate/manual_model_config_generator.py +187 -0
model_analyzer/config/generate/model_config_generator_factory.py +92 -0
model_analyzer/config/generate/model_profile_spec.py +74 -0
model_analyzer/config/generate/model_run_config_generator.py +154 -0
model_analyzer/config/generate/model_variant_name_manager.py +150 -0
model_analyzer/config/generate/neighborhood.py +536 -0
model_analyzer/config/generate/optuna_plus_concurrency_sweep_run_config_generator.py +141 -0
model_analyzer/config/generate/optuna_run_config_generator.py +838 -0
model_analyzer/config/generate/perf_analyzer_config_generator.py +312 -0
model_analyzer/config/generate/quick_plus_concurrency_sweep_run_config_generator.py +130 -0
model_analyzer/config/generate/quick_run_config_generator.py +753 -0
model_analyzer/config/generate/run_config_generator_factory.py +329 -0
model_analyzer/config/generate/search_config.py +112 -0
model_analyzer/config/generate/search_dimension.py +73 -0
model_analyzer/config/generate/search_dimensions.py +85 -0
model_analyzer/config/generate/search_parameter.py +49 -0
model_analyzer/config/generate/search_parameters.py +388 -0
model_analyzer/config/input/__init__.py +15 -0
model_analyzer/config/input/config_command.py +483 -0
model_analyzer/config/input/config_command_profile.py +1747 -0
model_analyzer/config/input/config_command_report.py +267 -0
model_analyzer/config/input/config_defaults.py +236 -0
model_analyzer/config/input/config_enum.py +83 -0
model_analyzer/config/input/config_field.py +216 -0
model_analyzer/config/input/config_list_generic.py +112 -0
model_analyzer/config/input/config_list_numeric.py +151 -0
model_analyzer/config/input/config_list_string.py +111 -0
model_analyzer/config/input/config_none.py +71 -0
model_analyzer/config/input/config_object.py +129 -0
model_analyzer/config/input/config_primitive.py +81 -0
model_analyzer/config/input/config_status.py +75 -0
model_analyzer/config/input/config_sweep.py +83 -0
model_analyzer/config/input/config_union.py +113 -0
model_analyzer/config/input/config_utils.py +128 -0
model_analyzer/config/input/config_value.py +243 -0
model_analyzer/config/input/objects/__init__.py +15 -0
model_analyzer/config/input/objects/config_model_profile_spec.py +325 -0
model_analyzer/config/input/objects/config_model_report_spec.py +173 -0
model_analyzer/config/input/objects/config_plot.py +198 -0
model_analyzer/config/input/objects/config_protobuf_utils.py +101 -0
model_analyzer/config/input/yaml_config_validator.py +82 -0
model_analyzer/config/run/__init__.py +15 -0
model_analyzer/config/run/model_run_config.py +313 -0
model_analyzer/config/run/run_config.py +168 -0
model_analyzer/constants.py +76 -0
model_analyzer/device/__init__.py +15 -0
model_analyzer/device/device.py +24 -0
model_analyzer/device/gpu_device.py +87 -0
model_analyzer/device/gpu_device_factory.py +248 -0
model_analyzer/entrypoint.py +307 -0
model_analyzer/log_formatter.py +65 -0
model_analyzer/model_analyzer_exceptions.py +24 -0
model_analyzer/model_manager.py +255 -0
model_analyzer/monitor/__init__.py +15 -0
model_analyzer/monitor/cpu_monitor.py +69 -0
model_analyzer/monitor/dcgm/DcgmDiag.py +191 -0
model_analyzer/monitor/dcgm/DcgmFieldGroup.py +83 -0
model_analyzer/monitor/dcgm/DcgmGroup.py +815 -0
model_analyzer/monitor/dcgm/DcgmHandle.py +141 -0
model_analyzer/monitor/dcgm/DcgmJsonReader.py +69 -0
model_analyzer/monitor/dcgm/DcgmReader.py +623 -0
model_analyzer/monitor/dcgm/DcgmStatus.py +57 -0
model_analyzer/monitor/dcgm/DcgmSystem.py +412 -0
model_analyzer/monitor/dcgm/__init__.py +15 -0
model_analyzer/monitor/dcgm/common/__init__.py +13 -0
model_analyzer/monitor/dcgm/common/dcgm_client_cli_parser.py +194 -0
model_analyzer/monitor/dcgm/common/dcgm_client_main.py +86 -0
model_analyzer/monitor/dcgm/dcgm_agent.py +887 -0
model_analyzer/monitor/dcgm/dcgm_collectd_plugin.py +369 -0
model_analyzer/monitor/dcgm/dcgm_errors.py +395 -0
model_analyzer/monitor/dcgm/dcgm_field_helpers.py +546 -0
model_analyzer/monitor/dcgm/dcgm_fields.py +815 -0
model_analyzer/monitor/dcgm/dcgm_fields_collectd.py +671 -0
model_analyzer/monitor/dcgm/dcgm_fields_internal.py +29 -0
model_analyzer/monitor/dcgm/dcgm_fluentd.py +45 -0
model_analyzer/monitor/dcgm/dcgm_monitor.py +138 -0
model_analyzer/monitor/dcgm/dcgm_prometheus.py +326 -0
model_analyzer/monitor/dcgm/dcgm_structs.py +2357 -0
model_analyzer/monitor/dcgm/dcgm_telegraf.py +65 -0
model_analyzer/monitor/dcgm/dcgm_value.py +151 -0
model_analyzer/monitor/dcgm/dcgmvalue.py +155 -0
model_analyzer/monitor/dcgm/denylist_recommendations.py +573 -0
model_analyzer/monitor/dcgm/pydcgm.py +47 -0
model_analyzer/monitor/monitor.py +143 -0
model_analyzer/monitor/remote_monitor.py +137 -0
model_analyzer/output/__init__.py +15 -0
model_analyzer/output/file_writer.py +63 -0
model_analyzer/output/output_writer.py +42 -0
model_analyzer/perf_analyzer/__init__.py +15 -0
model_analyzer/perf_analyzer/genai_perf_config.py +206 -0
model_analyzer/perf_analyzer/perf_analyzer.py +882 -0
model_analyzer/perf_analyzer/perf_config.py +479 -0
model_analyzer/plots/__init__.py +15 -0
model_analyzer/plots/detailed_plot.py +266 -0
model_analyzer/plots/plot_manager.py +224 -0
model_analyzer/plots/simple_plot.py +213 -0
model_analyzer/record/__init__.py +15 -0
model_analyzer/record/gpu_record.py +68 -0
model_analyzer/record/metrics_manager.py +887 -0
model_analyzer/record/record.py +280 -0
model_analyzer/record/record_aggregator.py +256 -0
model_analyzer/record/types/__init__.py +15 -0
model_analyzer/record/types/cpu_available_ram.py +93 -0
model_analyzer/record/types/cpu_used_ram.py +93 -0
model_analyzer/record/types/gpu_free_memory.py +96 -0
model_analyzer/record/types/gpu_power_usage.py +107 -0
model_analyzer/record/types/gpu_total_memory.py +96 -0
model_analyzer/record/types/gpu_used_memory.py +96 -0
model_analyzer/record/types/gpu_utilization.py +108 -0
model_analyzer/record/types/inter_token_latency_avg.py +60 -0
model_analyzer/record/types/inter_token_latency_base.py +74 -0
model_analyzer/record/types/inter_token_latency_max.py +60 -0
model_analyzer/record/types/inter_token_latency_min.py +60 -0
model_analyzer/record/types/inter_token_latency_p25.py +60 -0
model_analyzer/record/types/inter_token_latency_p50.py +60 -0
model_analyzer/record/types/inter_token_latency_p75.py +60 -0
model_analyzer/record/types/inter_token_latency_p90.py +60 -0
model_analyzer/record/types/inter_token_latency_p95.py +60 -0
model_analyzer/record/types/inter_token_latency_p99.py +60 -0
model_analyzer/record/types/output_token_throughput.py +105 -0
model_analyzer/record/types/perf_client_response_wait.py +97 -0
model_analyzer/record/types/perf_client_send_recv.py +97 -0
model_analyzer/record/types/perf_latency.py +111 -0
model_analyzer/record/types/perf_latency_avg.py +60 -0
model_analyzer/record/types/perf_latency_base.py +74 -0
model_analyzer/record/types/perf_latency_p90.py +60 -0
model_analyzer/record/types/perf_latency_p95.py +60 -0
model_analyzer/record/types/perf_latency_p99.py +60 -0
model_analyzer/record/types/perf_server_compute_infer.py +97 -0
model_analyzer/record/types/perf_server_compute_input.py +97 -0
model_analyzer/record/types/perf_server_compute_output.py +97 -0
model_analyzer/record/types/perf_server_queue.py +97 -0
model_analyzer/record/types/perf_throughput.py +105 -0
model_analyzer/record/types/time_to_first_token_avg.py +60 -0
model_analyzer/record/types/time_to_first_token_base.py +74 -0
model_analyzer/record/types/time_to_first_token_max.py +60 -0
model_analyzer/record/types/time_to_first_token_min.py +60 -0
model_analyzer/record/types/time_to_first_token_p25.py +60 -0
model_analyzer/record/types/time_to_first_token_p50.py +60 -0
model_analyzer/record/types/time_to_first_token_p75.py +60 -0
model_analyzer/record/types/time_to_first_token_p90.py +60 -0
model_analyzer/record/types/time_to_first_token_p95.py +60 -0
model_analyzer/record/types/time_to_first_token_p99.py +60 -0
model_analyzer/reports/__init__.py +15 -0
model_analyzer/reports/html_report.py +195 -0
model_analyzer/reports/pdf_report.py +50 -0
model_analyzer/reports/report.py +86 -0
model_analyzer/reports/report_factory.py +62 -0
model_analyzer/reports/report_manager.py +1376 -0
model_analyzer/reports/report_utils.py +42 -0
model_analyzer/result/__init__.py +15 -0
model_analyzer/result/constraint_manager.py +150 -0
model_analyzer/result/model_config_measurement.py +354 -0
model_analyzer/result/model_constraints.py +105 -0
model_analyzer/result/parameter_search.py +246 -0
model_analyzer/result/result_manager.py +430 -0
model_analyzer/result/result_statistics.py +159 -0
model_analyzer/result/result_table.py +217 -0
model_analyzer/result/result_table_manager.py +646 -0
model_analyzer/result/result_utils.py +42 -0
model_analyzer/result/results.py +277 -0
model_analyzer/result/run_config_measurement.py +658 -0
model_analyzer/result/run_config_result.py +210 -0
model_analyzer/result/run_config_result_comparator.py +110 -0
model_analyzer/result/sorted_results.py +151 -0
model_analyzer/state/__init__.py +15 -0
model_analyzer/state/analyzer_state.py +76 -0
model_analyzer/state/analyzer_state_manager.py +215 -0
model_analyzer/triton/__init__.py +15 -0
model_analyzer/triton/client/__init__.py +15 -0
model_analyzer/triton/client/client.py +234 -0
model_analyzer/triton/client/client_factory.py +57 -0
model_analyzer/triton/client/grpc_client.py +104 -0
model_analyzer/triton/client/http_client.py +107 -0
model_analyzer/triton/model/__init__.py +15 -0
model_analyzer/triton/model/model_config.py +556 -0
model_analyzer/triton/model/model_config_variant.py +29 -0
model_analyzer/triton/server/__init__.py +15 -0
model_analyzer/triton/server/server.py +76 -0
model_analyzer/triton/server/server_config.py +269 -0
model_analyzer/triton/server/server_docker.py +229 -0
model_analyzer/triton/server/server_factory.py +306 -0
model_analyzer/triton/server/server_local.py +158 -0
triton_model_analyzer-1.48.0.dist-info/METADATA +52 -0
triton_model_analyzer-1.48.0.dist-info/RECORD +204 -0
triton_model_analyzer-1.48.0.dist-info/WHEEL +5 -0
triton_model_analyzer-1.48.0.dist-info/entry_points.txt +2 -0
triton_model_analyzer-1.48.0.dist-info/licenses/LICENSE +67 -0
triton_model_analyzer-1.48.0.dist-info/top_level.txt +1 -0

model_analyzer/config/generate/neighborhood.py ADDED Viewed

@@ -0,0 +1,536 @@
+#!/usr/bin/env python3
+# Copyright 2022-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import math
+from copy import deepcopy
+from typing import Dict, List, Optional, Tuple, Union
+from model_analyzer.config.generate.coordinate import Coordinate
+from model_analyzer.config.generate.coordinate_data import CoordinateData
+from model_analyzer.config.generate.search_config import NeighborhoodConfig
+from model_analyzer.result.run_config_measurement import RunConfigMeasurement
class Neighborhood:
    """
    Defines and operates on a set of coordinates within a radius around
    a 'home' coordinate

    The set of coordinates is computed once, when the object is created:
    it contains every coordinate whose euclidean distance from the home
    coordinate is at most the configured radius and that lies within the
    min/max index of every search dimension.
    """

    # This defines the bounds of how the vector calculated from
    # measurements is converted to a step vector.
    #
    # For a positive value, the resulting step is one more than the index
    # of the last bound that the value strictly exceeds (0 if it exceeds
    # none). Because the list is ascending, that is simply the number of
    # bounds exceeded. Negative values are handled symmetrically and
    # produce a negative step.
    #
    # For example, 0.2 is greater than the value in index 0 but less than
    # the value in index 1, so the resulting step is 1. 0.5 is greater than
    # the value in index 1 but less than the value in index 2, so the
    # resulting step is 2. -0.5 results in a step of -2.
    #
    TRANSLATION_LIST = [0.09, 0.3, 1.0]

    def __init__(
        self,
        neighborhood_config: NeighborhoodConfig,
        home_coordinate: Coordinate,
        coordinate_data: CoordinateData,
    ):
        """
        Parameters
        ----------
        neighborhood_config:
            NeighborhoodConfig object
        home_coordinate:
            Coordinate object to center the neighborhood around
        coordinate_data:
            CoordinateData object that is queried for the measurements
            of the coordinates in the neighborhood
        """
        # isinstance (instead of an exact type comparison) also accepts
        # subclasses of NeighborhoodConfig
        assert isinstance(neighborhood_config, NeighborhoodConfig)

        self._config = neighborhood_config
        self._home_coordinate = home_coordinate
        self._coordinate_data = coordinate_data
        self._radius = self._config.get_radius()
        self._force_slow_mode = False
        self._neighborhood = self._create_neighborhood()

    @classmethod
    def calc_distance(
        cls,
        coordinate1: Union[Coordinate, List[int]],
        coordinate2: Union[Coordinate, List[int]],
    ) -> float:
        """
        Return the euclidean distance between two coordinates

        Only the indices present in coordinate1 are compared, so
        coordinate2 must have at least as many dimensions as coordinate1.
        """
        distance = 0.0
        for i, _ in enumerate(coordinate1):
            diff = coordinate1[i] - coordinate2[i]
            distance += math.pow(diff, 2)
        return math.sqrt(distance)

    def enough_coordinates_initialized(self) -> bool:
        """
        Returns true if enough coordinates inside of the neighborhood
        have been initialized with valid measurements. Else false

        If the neighborhood is in slow mode, this means all adjacent neighbors
        must be visited. Otherwise the number of coordinates (excluding home)
        with a valid measurement must reach the configured minimum.
        """
        if self._is_slow_mode():
            return self._are_all_adjacent_neighbors_measured()

        min_initialized = self._config.get_min_initialized()
        num_initialized = len(self._get_coordinates_with_valid_measurements())
        return num_initialized >= min_initialized

    def force_slow_mode(self) -> None:
        """
        When called, forces the neighborhood into slow mode
        """
        self._force_slow_mode = True

    def determine_new_home(self) -> Coordinate:
        """
        Based on the measurements in the neighborhood, determine where
        the next location should be.

        If the neighborhood is in slow mode, return the best found measurement
        Otherwise calculate a new coordinate from the measurements

        Returns
        -------
        new_coordinate
            The new coordinate computed based on the neighborhood measurements.

        Raises
        ------
        Exception
            If the neighborhood is not in slow mode and the home coordinate
            has no measurement to step from.
        """
        if self._is_slow_mode():
            return self._get_best_coordinate_found()
        return self._calculate_new_home()

    def _get_best_coordinate_found(self) -> Coordinate:
        """
        Return the coordinate with the highest-sorting measurement among the
        neighbors that pass constraints (and home, if it passes too).

        If no neighbor passes constraints, the home coordinate is returned.
        """
        vectors, measurements = self._get_measurements_passing_constraints()

        if not vectors:
            return self._home_coordinate

        # Home competes with its neighbors, represented by the zero vector
        home_measurement = self._get_home_measurement()
        if home_measurement and home_measurement.is_passing_constraints():
            vectors.append(Coordinate([0] * self._config.get_num_dimensions()))
            measurements.append(home_measurement)

        # Sorting the (measurement, vector) pairs puts the best one last
        _, best_vector = sorted(zip(measurements, vectors))[-1]
        return self._home_coordinate + best_vector

    def _calculate_new_home(self) -> Coordinate:
        """
        Step from home along the translated step vector, then clamp the
        result so that it stays within the bounds of every dimension.
        """
        step_vector = self._get_step_vector()
        step_vector_coordinate = self._translate_step_vector(
            step_vector, Neighborhood.TRANSLATION_LIST
        )
        tmp_new_coordinate = self._home_coordinate + step_vector_coordinate
        return self._clamp_coordinate_to_bounds(tmp_new_coordinate)

    def _translate_step_vector(
        self, step_vector: List[float], translate_list: List[float]
    ) -> Coordinate:
        """
        Convert every component of a float step vector into an integer
        step (see _translate_value) and return them as a Coordinate.
        """
        translated_step_vector = Coordinate([0] * len(step_vector))
        for i, v in enumerate(step_vector):
            translated_step_vector[i] = self._translate_value(v, translate_list)
        return translated_step_vector

    def _translate_value(self, value: float, translation_list: List[float]) -> int:
        """
        Convert a single float into an integer step.

        The magnitude of the step is one more than the index of the last
        bound in translation_list that the value strictly exceeds (0 if
        none is exceeded); the sign of the step follows the sign of value.
        A value of exactly 0 always yields 0.
        """
        ret = 0
        for index, bound in enumerate(translation_list):
            if value > 0 and value > bound:
                ret = index + 1
            if value < 0 and value < -1 * bound:
                ret = -1 * (index + 1)
        return ret

    def pick_coordinate_to_initialize(self) -> Optional[Coordinate]:
        """
        Based on the initialized coordinate values, pick an unvisited
        coordinate to initialize next.

        If the neighborhood is in slow mode, only pick from within the adjacent neighbors
        """
        if self._is_slow_mode():
            return self._pick_slow_mode_coordinate_to_initialize()
        return self._pick_fast_mode_coordinate_to_initialize()

    def _pick_slow_mode_coordinate_to_initialize(self) -> Coordinate:
        """
        Return the first adjacent neighbor that has not been measured yet.

        Raises
        ------
        Exception
            If every adjacent neighbor has already been measured.
        """
        for neighbor in self._get_all_adjacent_neighbors():
            if not self._is_coordinate_measured(neighbor):
                return neighbor

        raise Exception("Picking slow mode coordinate, but none are unvisited")

    def _pick_fast_mode_coordinate_to_initialize(self) -> Optional[Coordinate]:
        """
        Return the unmeasured coordinate of the neighborhood that has the
        most per-dimension values not yet covered by a validly measured
        coordinate. On a tie the earliest coordinate in the neighborhood
        wins. Returns None if every coordinate is already measured.
        """
        covered_values_per_dimension = self._get_covered_values_per_dimension()

        max_num_uncovered = -1
        best_coordinate = None
        for coordinate in self._neighborhood:
            if self._is_coordinate_measured(coordinate):
                continue

            num_uncovered = self._get_num_uncovered_values(
                coordinate, covered_values_per_dimension
            )
            # Strict comparison keeps the first of several equally good picks
            if num_uncovered > max_num_uncovered:
                max_num_uncovered = num_uncovered
                best_coordinate = coordinate

        return best_coordinate

    def get_nearest_neighbor(self, coordinate_in: Coordinate) -> Coordinate:
        """
        Find the nearest coordinate to the `coordinate_in` among the
        coordinates within the current neighborhood.

        On a tie the earliest coordinate in the neighborhood wins. If the
        neighborhood is empty the home coordinate is returned.
        """
        min_distance = float("inf")
        nearest_neighbor = self._home_coordinate

        for coordinate in self._neighborhood:
            distance = Neighborhood.calc_distance(coordinate, coordinate_in)
            if distance < min_distance:
                nearest_neighbor = coordinate
                min_distance = distance

        return nearest_neighbor

    def _create_neighborhood(self) -> List[Coordinate]:
        """
        Create and return a neighborhood of all Coordinates within
        range <_radius> that are also within all bounds
        """
        neighborhood = []
        potential_steps = self._get_potential_steps(
            self._config.get_num_dimensions(), self._radius
        )

        for potential_step in potential_steps:
            # Turn the step (an offset) into an absolute coordinate, in place
            for i, v in enumerate(self._home_coordinate):
                potential_step[i] += v
            if self._is_in_bounds(potential_step):
                neighborhood.append(Coordinate(potential_step))

        return neighborhood

    def _is_in_bounds(self, potential_coordinate: List[int]) -> bool:
        """
        Return True if every value lies within the min/max index of its
        corresponding dimension (both ends inclusive).
        """
        for i, v in enumerate(potential_coordinate):
            dim = self._config.get_dimension(i)
            if v > dim.get_max_idx() or v < dim.get_min_idx():
                return False
        return True

    def _get_potential_steps(
        self, num_coordinates: int, radius: int
    ) -> List[List[int]]:
        """
        Create and return a list of all possible step vectors that are
        within <_radius> distance
        """
        result_list: List[List[int]] = []
        v = [0] * num_coordinates
        self._permute_steps_in_range(v, radius, 0, result_list)
        return result_list

    def _append_combinations_to_results(
        self, curr_val: List[int], index: int, result_list: List[List[int]]
    ) -> None:
        """
        Given a List of integers (a potential step vector), permutate all
        combinations of positive/negative values for the entries from
        <index> onwards and append a copy of each to the result_list

        For example, an input of [1,0,2] with index 0 will append the
        following, in this order:
          [1,0,2], [1,0,-2], [-1,0,-2], [-1,0,2]

        Note that curr_val is modified in place: signs are flipped and not
        restored (the example above leaves it as [-1,0,2]). The values
        passed in may therefore be negative; all sign combinations are
        still produced because every non-zero entry is visited with both
        of its signs.
        """
        if index + 1 == len(curr_val):
            # Last entry: emit the current vector, then its sign-flipped twin
            result_list.append(deepcopy(curr_val))
            if curr_val[index]:
                curr_val[index] = -curr_val[index]
                result_list.append(deepcopy(curr_val))
        else:
            # Emit everything below with the current sign, then with the
            # flipped sign (zero entries have only one "sign")
            self._append_combinations_to_results(curr_val, index + 1, result_list)
            if curr_val[index]:
                curr_val[index] = -curr_val[index]
                self._append_combinations_to_results(curr_val, index + 1, result_list)

    def _permute_steps_in_range(
        self,
        curr_step: List[int],
        radius: int,
        index: int,
        result_list: List[List[int]],
    ) -> None:
        """
        Recursively walk all combinations of steps within the desired radius

        curr_step is used as a scratch buffer and is modified in place.
        """
        base = [0] * len(curr_step)

        for i in range(radius + 1):
            curr_step[index] = i

            # Leaf (rightmost) coordinate index: Add to results if in range
            if index == len(curr_step) - 1:
                d = Neighborhood.calc_distance(base, curr_step)
                if d <= radius:
                    self._append_combinations_to_results(curr_step, 0, result_list)
                else:
                    # Any larger value at this index is even further away
                    return
            # Non-leaf coordinate index: Recurse
            else:
                self._permute_steps_in_range(curr_step, radius, index + 1, result_list)

    def _get_coordinates_with_valid_measurements(self) -> List[Coordinate]:
        """
        Return copies of all coordinates in the neighborhood, other than
        home, for which the coordinate data reports a valid measurement.
        """
        initialized_coordinates = []
        for coordinate in self._neighborhood:
            if (
                coordinate != self._home_coordinate
                and self._coordinate_data.has_valid_measurement(coordinate)
            ):
                initialized_coordinates.append(deepcopy(coordinate))
        return initialized_coordinates

    def _get_step_vector(self) -> List[float]:
        """
        Calculate a vector that indicates a direction to step from the
        home coordinate (current center).

        Constraints are compared when home is failing its constraints,
        otherwise measurements are compared.

        Returns
        -------
        step_vector
            a list of floats (one per dimension) that tells the direction
            to move.
        """
        compare_constraints = not self._is_home_passing_constraints()
        return self._calculate_step_vector_from_measurements(
            compare_constraints=compare_constraints
        )

    def _calculate_step_vector_from_measurements(
        self, compare_constraints: bool
    ) -> List[float]:
        """
        Weigh every measured neighbor against the home measurement and
        combine the weights into a step vector.

        Parameters
        ----------
        compare_constraints:
            If True the weight of a neighbor is the result of home's
            compare_constraints(), otherwise of compare_measurements().
            A falsy weight (e.g. None) is treated as 0.0.

        Raises
        ------
        Exception
            If the home coordinate has no measurement.
        """
        home_measurement = self._get_home_measurement()
        if not home_measurement:
            raise Exception("Can't step from home if it has no measurement")

        vectors, measurements = self._get_all_measurements()

        # This function should only ever be called if all are passing or none are passing
        _, p = self._get_measurements_passing_constraints()
        assert len(p) == 0 or len(p) == len(measurements)

        if not vectors:
            return [0.0] * self._config.get_num_dimensions()

        weights = []
        for m in measurements:
            if compare_constraints:
                weight = home_measurement.compare_constraints(m)
            else:
                weight = home_measurement.compare_measurements(m)
            if not weight:
                weight = 0.0
            weights.append(weight)

        return self._calculate_step_vector_from_vectors_and_weights(vectors, weights)

    def _calculate_step_vector_from_vectors_and_weights(
        self, vectors: List[Coordinate], weights: List[float]
    ) -> List[float]:
        """
        Combine direction vectors and their weights into one step vector.

        Per dimension, the weights of all vectors with a non-zero entry are
        summed (negated where the entry is negative) and the sum is divided
        by the sum of the absolute values of those entries. Dimensions that
        no vector moves along stay at 0.0.
        """
        step_vector = [0.0] * self._config.get_num_dimensions()
        dim_sum_vector = [0.0] * self._config.get_num_dimensions()

        # For each dimension -
        #   if non zero, add weight (inverting if dimension is negative)
        #   divide by sum of coordinate of that dimension
        for vector, weight in zip(vectors, weights):
            for dim, v in enumerate(vector):
                if v:
                    if v > 0:
                        step_vector[dim] += weight
                        dim_sum_vector[dim] += v
                    else:
                        step_vector[dim] -= weight
                        dim_sum_vector[dim] -= v

        for dim, v in enumerate(dim_sum_vector):
            if v:
                step_vector[dim] /= v

        return step_vector

    def _collect_vectors_and_measurements(
        self, passing_only: bool
    ) -> Tuple[List[Coordinate], List[RunConfigMeasurement]]:
        """
        Shared implementation of _get_all_measurements and
        _get_measurements_passing_constraints.

        Parameters
        ----------
        passing_only:
            If True, measurements that do not pass constraints are skipped.

        Returns
        -------
        (vectors, measurements)
            vectors are offsets from the home coordinate; measurements[i]
            belongs to vectors[i].
        """
        vectors = []
        measurements = []
        for coordinate in self._get_coordinates_with_valid_measurements():
            measurement = self._coordinate_data.get_measurement(coordinate)
            if not measurement:
                continue
            if passing_only and not measurement.is_passing_constraints():
                continue
            vectors.append(coordinate - self._home_coordinate)
            measurements.append(measurement)
        return vectors, measurements

    def _get_all_measurements(
        self,
    ) -> Tuple[List[Coordinate], List[RunConfigMeasurement]]:
        """
        Gather all the visited vectors (directions from the home coordinate)
        and their corresponding measurements.

        Returns
        -------
        (vectors, measurements)
            collection of vectors and their measurements.
        """
        return self._collect_vectors_and_measurements(passing_only=False)

    def _get_measurements_passing_constraints(
        self,
    ) -> Tuple[List[Coordinate], List[RunConfigMeasurement]]:
        """
        Gather all the vectors (directions from the home coordinate)
        and their corresponding measurements that are passing constraints.

        Returns
        -------
        (vectors, measurements)
            collection of vectors and their measurements.
        """
        return self._collect_vectors_and_measurements(passing_only=True)

    def _is_coordinate_measured(self, coordinate: Coordinate) -> bool:
        """
        Return whether the coordinate data reports the coordinate as measured.
        """
        return self._coordinate_data.is_measured(coordinate)

    def _clamp_coordinate_to_bounds(self, coordinate: Coordinate) -> Coordinate:
        """
        Return a copy of the coordinate in which every value is limited to
        the min/max index of its dimension. The input is not modified.
        """
        clamped_coordinate = deepcopy(coordinate)

        for i, v in enumerate(coordinate):
            sd = self._config.get_dimension(i)
            v = min(sd.get_max_idx(), v)
            v = max(sd.get_min_idx(), v)
            clamped_coordinate[i] = v
        return clamped_coordinate

    def _get_covered_values_per_dimension(self) -> List[Dict[int, bool]]:
        """
        Returns a list of dicts that indicates which values have been
        covered in each dimension.

        (e.g.)
            covered_values_per_dimension[dimension][value] = bool

        Only values of coordinates with a valid measurement are present,
        and they always map to True.
        """
        measured_coordinates = self._get_coordinates_with_valid_measurements()

        covered_values_per_dimension: List[Dict[int, bool]] = [
            {} for _ in range(self._config.get_num_dimensions())
        ]

        for coordinate in measured_coordinates:
            for i, v in enumerate(coordinate):
                covered_values_per_dimension[i][v] = True

        return covered_values_per_dimension

    def _get_num_uncovered_values(
        self,
        coordinate: Coordinate,
        covered_values_per_dimension: List[Dict[int, bool]],
    ) -> int:
        """
        Determine how many of the coordinate dimensions in the input coordinate have values
        that are not covered in covered_values_per_dimension
        """
        return sum(
            1
            for i, v in enumerate(coordinate)
            if not covered_values_per_dimension[i].get(v, False)
        )

    def _is_slow_mode(self) -> bool:
        """
        Return whether the neighborhood is in slow mode.

        That is the case when slow mode was forced, or when home is
        measured and disagrees with at least one measured neighbor about
        passing constraints (home passes while a neighbor fails, or home
        fails while a neighbor passes). An unmeasured home is never in
        slow mode unless it is forced.
        """
        if self._force_slow_mode:
            return True

        if not self._is_home_measured():
            return False

        passing_vectors, _ = self._get_measurements_passing_constraints()
        all_vectors, _ = self._get_all_measurements()

        any_failing = len(all_vectors) != len(passing_vectors)
        any_passing = len(passing_vectors) != 0
        home_passing = self._is_home_passing_constraints()

        return (home_passing and any_failing) or (not home_passing and any_passing)

    def _are_all_adjacent_neighbors_measured(self) -> bool:
        """
        Return True if every adjacent neighbor of home has been measured.
        """
        return all(
            self._is_coordinate_measured(neighbor)
            for neighbor in self._get_all_adjacent_neighbors()
        )

    def _get_all_adjacent_neighbors(self) -> List[Coordinate]:
        """
        Return the coordinates that differ from home by exactly one step
        (down or up) in exactly one dimension and that are within the
        bounds of that dimension. For each dimension the down neighbor
        comes before the up neighbor.
        """
        adjacent_neighbors = []

        for dim in range(self._config.get_num_dimensions()):
            dimension = self._config.get_dimension(dim)

            down_neighbor = Coordinate(self._home_coordinate)
            down_neighbor[dim] -= 1
            if down_neighbor[dim] >= dimension.get_min_idx():
                adjacent_neighbors.append(down_neighbor)

            up_neighbor = Coordinate(self._home_coordinate)
            up_neighbor[dim] += 1
            if up_neighbor[dim] <= dimension.get_max_idx():
                adjacent_neighbors.append(up_neighbor)

        return adjacent_neighbors

    def _get_home_measurement(self) -> Optional[RunConfigMeasurement]:
        """
        Return the measurement stored for the home coordinate, if any.
        """
        return self._coordinate_data.get_measurement(coordinate=self._home_coordinate)

    def _is_home_measured(self) -> bool:
        """
        Return True if a measurement is stored for the home coordinate.
        """
        return self._get_home_measurement() is not None

    def _is_home_passing_constraints(self) -> bool:
        """
        Return whether the home measurement passes its constraints.

        Raises
        ------
        Exception
            If the home coordinate has no measurement.
        """
        home_measurement = self._get_home_measurement()
        if not home_measurement:
            raise Exception("Can't check home passing if it isn't measured yet")

        return home_measurement.is_passing_constraints()

model_analyzer/config/generate/optuna_plus_concurrency_sweep_run_config_generator.py ADDED Viewed

@@ -0,0 +1,141 @@
+#!/usr/bin/env python3
+# Copyright 2024, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+from copy import deepcopy
+from typing import Dict, Generator, List, Optional
+from model_analyzer.config.generate.concurrency_sweeper import ConcurrencySweeper
+from model_analyzer.config.generate.model_profile_spec import ModelProfileSpec
+from model_analyzer.config.generate.model_variant_name_manager import (
+    ModelVariantNameManager,
+)
+from model_analyzer.config.generate.optuna_run_config_generator import (
+    OptunaRunConfigGenerator,
+)
+from model_analyzer.config.generate.search_parameters import SearchParameters
+from model_analyzer.config.input.config_command_profile import ConfigCommandProfile
+from model_analyzer.config.run.run_config import RunConfig
+from model_analyzer.constants import LOGGER_NAME
+from model_analyzer.result.parameter_search import ParameterSearch
+from model_analyzer.result.result_manager import ResultManager
+from model_analyzer.result.run_config_measurement import RunConfigMeasurement
+from model_analyzer.state.analyzer_state_manager import AnalyzerStateManager
+from .config_generator_interface import ConfigGeneratorInterface
+# Module-level logger, looked up under the name stored in LOGGER_NAME
+logger = logging.getLogger(LOGGER_NAME)
+class OptunaPlusConcurrencySweepRunConfigGenerator(ConfigGeneratorInterface):
+    """
+    First run OptunaConfigGenerator for an Optuna search, then use
+    ParameterSearch for a concurrency sweep + binary search of the default
+    and Top N results
+    """
+    def __init__(
+        self,
+        config: ConfigCommandProfile,
+        state_manager: AnalyzerStateManager,
+        gpu_count: int,
+        models: List[ModelProfileSpec],
+        composing_models: List[ModelProfileSpec],
+        result_manager: ResultManager,
+        model_variant_name_manager: ModelVariantNameManager,
+        search_parameters: Dict[str, SearchParameters],
+        composing_search_parameters: Dict[str, SearchParameters],
+    ):
+        """
+        Parameters
+        ----------
+        config: ConfigCommandProfile
+            Profile configuration information
+        state_manager: AnalyzerStateManager
+            The object that allows control and update of checkpoint state
+        gpu_count: Number of gpus in the system
+        models: List of ModelProfileSpec
+            List of models to profile
+        composing_models: List of ModelProfileSpec
+            List of composing models that exist inside of the supplied models
+        result_manager: ResultManager
+            The object that handles storing and sorting the results from the perf analyzer
+        model_variant_name_manager: ModelVariantNameManager
+            Maps model variants to config names
+        search_parameters: SearchParameters
+            The object that handles the users configuration search parameters
+        composing_search_parameters: SearchParameters
+            The object that handles the users configuration search parameters for composing models
+        """
+        self._config = config
+        self._state_manager = state_manager
+        self._gpu_count = gpu_count
+        self._models = models
+        self._composing_models = composing_models
+        self._result_manager = result_manager
+        self._model_variant_name_manager = model_variant_name_manager
+        self._search_parameters = search_parameters
+        self._composing_search_parameters = composing_search_parameters
+    def set_last_results(
+        self, measurements: List[Optional[RunConfigMeasurement]]
+    ) -> None:
+        self._last_measurement = measurements[-1]
+        self._rcg.set_last_results(measurements)
+    def get_configs(self) -> Generator[RunConfig, None, None]:
+        """
+        Returns
+        -------
+        RunConfig
+            The next RunConfig generated by this class
+        """
+        logger.info("")
+        logger.info("Starting Optuna mode search to find optimal configs")
+        logger.info("")
+        yield from self._execute_optuna_search()
+        logger.info("")
+        if self._config.concurrency_sweep_disable:
+            logger.info("Done with Optuna mode search.")
+        else:
+            logger.info(
+                "Done with Optuna mode search. Gathering concurrency sweep measurements for reports"
+            )
+            logger.info("")
+            yield from ConcurrencySweeper(
+                config=self._config, result_manager=self._result_manager
+            ).get_configs()
+            logger.info("")
+            logger.info("Done gathering concurrency sweep measurements for reports")
+        logger.info("")
+    def _execute_optuna_search(self) -> Generator[RunConfig, None, None]:
+        self._rcg: ConfigGeneratorInterface = self._create_optuna_run_config_generator()
+        yield from self._rcg.get_configs()
+    def _create_optuna_run_config_generator(self) -> OptunaRunConfigGenerator:
+        return OptunaRunConfigGenerator(
+            config=self._config,
+            state_manager=self._state_manager,
+            gpu_count=self._gpu_count,
+            models=self._models,
+            composing_models=self._composing_models,
+            model_variant_name_manager=self._model_variant_name_manager,
+            search_parameters=self._search_parameters,
+            composing_search_parameters=self._composing_search_parameters,
+        )