PyPI - triton-model-analyzer - Versions diffs - 1.48.0__py3-none-any.whl - Mend

triton-model-analyzer 1.48.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (204) hide show

model_analyzer/__init__.py +15 -0
model_analyzer/analyzer.py +448 -0
model_analyzer/cli/__init__.py +15 -0
model_analyzer/cli/cli.py +193 -0
model_analyzer/config/__init__.py +15 -0
model_analyzer/config/generate/__init__.py +15 -0
model_analyzer/config/generate/automatic_model_config_generator.py +164 -0
model_analyzer/config/generate/base_model_config_generator.py +352 -0
model_analyzer/config/generate/brute_plus_binary_parameter_search_run_config_generator.py +164 -0
model_analyzer/config/generate/brute_run_config_generator.py +154 -0
model_analyzer/config/generate/concurrency_sweeper.py +75 -0
model_analyzer/config/generate/config_generator_interface.py +52 -0
model_analyzer/config/generate/coordinate.py +143 -0
model_analyzer/config/generate/coordinate_data.py +86 -0
model_analyzer/config/generate/generator_utils.py +116 -0
model_analyzer/config/generate/manual_model_config_generator.py +187 -0
model_analyzer/config/generate/model_config_generator_factory.py +92 -0
model_analyzer/config/generate/model_profile_spec.py +74 -0
model_analyzer/config/generate/model_run_config_generator.py +154 -0
model_analyzer/config/generate/model_variant_name_manager.py +150 -0
model_analyzer/config/generate/neighborhood.py +536 -0
model_analyzer/config/generate/optuna_plus_concurrency_sweep_run_config_generator.py +141 -0
model_analyzer/config/generate/optuna_run_config_generator.py +838 -0
model_analyzer/config/generate/perf_analyzer_config_generator.py +312 -0
model_analyzer/config/generate/quick_plus_concurrency_sweep_run_config_generator.py +130 -0
model_analyzer/config/generate/quick_run_config_generator.py +753 -0
model_analyzer/config/generate/run_config_generator_factory.py +329 -0
model_analyzer/config/generate/search_config.py +112 -0
model_analyzer/config/generate/search_dimension.py +73 -0
model_analyzer/config/generate/search_dimensions.py +85 -0
model_analyzer/config/generate/search_parameter.py +49 -0
model_analyzer/config/generate/search_parameters.py +388 -0
model_analyzer/config/input/__init__.py +15 -0
model_analyzer/config/input/config_command.py +483 -0
model_analyzer/config/input/config_command_profile.py +1747 -0
model_analyzer/config/input/config_command_report.py +267 -0
model_analyzer/config/input/config_defaults.py +236 -0
model_analyzer/config/input/config_enum.py +83 -0
model_analyzer/config/input/config_field.py +216 -0
model_analyzer/config/input/config_list_generic.py +112 -0
model_analyzer/config/input/config_list_numeric.py +151 -0
model_analyzer/config/input/config_list_string.py +111 -0
model_analyzer/config/input/config_none.py +71 -0
model_analyzer/config/input/config_object.py +129 -0
model_analyzer/config/input/config_primitive.py +81 -0
model_analyzer/config/input/config_status.py +75 -0
model_analyzer/config/input/config_sweep.py +83 -0
model_analyzer/config/input/config_union.py +113 -0
model_analyzer/config/input/config_utils.py +128 -0
model_analyzer/config/input/config_value.py +243 -0
model_analyzer/config/input/objects/__init__.py +15 -0
model_analyzer/config/input/objects/config_model_profile_spec.py +325 -0
model_analyzer/config/input/objects/config_model_report_spec.py +173 -0
model_analyzer/config/input/objects/config_plot.py +198 -0
model_analyzer/config/input/objects/config_protobuf_utils.py +101 -0
model_analyzer/config/input/yaml_config_validator.py +82 -0
model_analyzer/config/run/__init__.py +15 -0
model_analyzer/config/run/model_run_config.py +313 -0
model_analyzer/config/run/run_config.py +168 -0
model_analyzer/constants.py +76 -0
model_analyzer/device/__init__.py +15 -0
model_analyzer/device/device.py +24 -0
model_analyzer/device/gpu_device.py +87 -0
model_analyzer/device/gpu_device_factory.py +248 -0
model_analyzer/entrypoint.py +307 -0
model_analyzer/log_formatter.py +65 -0
model_analyzer/model_analyzer_exceptions.py +24 -0
model_analyzer/model_manager.py +255 -0
model_analyzer/monitor/__init__.py +15 -0
model_analyzer/monitor/cpu_monitor.py +69 -0
model_analyzer/monitor/dcgm/DcgmDiag.py +191 -0
model_analyzer/monitor/dcgm/DcgmFieldGroup.py +83 -0
model_analyzer/monitor/dcgm/DcgmGroup.py +815 -0
model_analyzer/monitor/dcgm/DcgmHandle.py +141 -0
model_analyzer/monitor/dcgm/DcgmJsonReader.py +69 -0
model_analyzer/monitor/dcgm/DcgmReader.py +623 -0
model_analyzer/monitor/dcgm/DcgmStatus.py +57 -0
model_analyzer/monitor/dcgm/DcgmSystem.py +412 -0
model_analyzer/monitor/dcgm/__init__.py +15 -0
model_analyzer/monitor/dcgm/common/__init__.py +13 -0
model_analyzer/monitor/dcgm/common/dcgm_client_cli_parser.py +194 -0
model_analyzer/monitor/dcgm/common/dcgm_client_main.py +86 -0
model_analyzer/monitor/dcgm/dcgm_agent.py +887 -0
model_analyzer/monitor/dcgm/dcgm_collectd_plugin.py +369 -0
model_analyzer/monitor/dcgm/dcgm_errors.py +395 -0
model_analyzer/monitor/dcgm/dcgm_field_helpers.py +546 -0
model_analyzer/monitor/dcgm/dcgm_fields.py +815 -0
model_analyzer/monitor/dcgm/dcgm_fields_collectd.py +671 -0
model_analyzer/monitor/dcgm/dcgm_fields_internal.py +29 -0
model_analyzer/monitor/dcgm/dcgm_fluentd.py +45 -0
model_analyzer/monitor/dcgm/dcgm_monitor.py +138 -0
model_analyzer/monitor/dcgm/dcgm_prometheus.py +326 -0
model_analyzer/monitor/dcgm/dcgm_structs.py +2357 -0
model_analyzer/monitor/dcgm/dcgm_telegraf.py +65 -0
model_analyzer/monitor/dcgm/dcgm_value.py +151 -0
model_analyzer/monitor/dcgm/dcgmvalue.py +155 -0
model_analyzer/monitor/dcgm/denylist_recommendations.py +573 -0
model_analyzer/monitor/dcgm/pydcgm.py +47 -0
model_analyzer/monitor/monitor.py +143 -0
model_analyzer/monitor/remote_monitor.py +137 -0
model_analyzer/output/__init__.py +15 -0
model_analyzer/output/file_writer.py +63 -0
model_analyzer/output/output_writer.py +42 -0
model_analyzer/perf_analyzer/__init__.py +15 -0
model_analyzer/perf_analyzer/genai_perf_config.py +206 -0
model_analyzer/perf_analyzer/perf_analyzer.py +882 -0
model_analyzer/perf_analyzer/perf_config.py +479 -0
model_analyzer/plots/__init__.py +15 -0
model_analyzer/plots/detailed_plot.py +266 -0
model_analyzer/plots/plot_manager.py +224 -0
model_analyzer/plots/simple_plot.py +213 -0
model_analyzer/record/__init__.py +15 -0
model_analyzer/record/gpu_record.py +68 -0
model_analyzer/record/metrics_manager.py +887 -0
model_analyzer/record/record.py +280 -0
model_analyzer/record/record_aggregator.py +256 -0
model_analyzer/record/types/__init__.py +15 -0
model_analyzer/record/types/cpu_available_ram.py +93 -0
model_analyzer/record/types/cpu_used_ram.py +93 -0
model_analyzer/record/types/gpu_free_memory.py +96 -0
model_analyzer/record/types/gpu_power_usage.py +107 -0
model_analyzer/record/types/gpu_total_memory.py +96 -0
model_analyzer/record/types/gpu_used_memory.py +96 -0
model_analyzer/record/types/gpu_utilization.py +108 -0
model_analyzer/record/types/inter_token_latency_avg.py +60 -0
model_analyzer/record/types/inter_token_latency_base.py +74 -0
model_analyzer/record/types/inter_token_latency_max.py +60 -0
model_analyzer/record/types/inter_token_latency_min.py +60 -0
model_analyzer/record/types/inter_token_latency_p25.py +60 -0
model_analyzer/record/types/inter_token_latency_p50.py +60 -0
model_analyzer/record/types/inter_token_latency_p75.py +60 -0
model_analyzer/record/types/inter_token_latency_p90.py +60 -0
model_analyzer/record/types/inter_token_latency_p95.py +60 -0
model_analyzer/record/types/inter_token_latency_p99.py +60 -0
model_analyzer/record/types/output_token_throughput.py +105 -0
model_analyzer/record/types/perf_client_response_wait.py +97 -0
model_analyzer/record/types/perf_client_send_recv.py +97 -0
model_analyzer/record/types/perf_latency.py +111 -0
model_analyzer/record/types/perf_latency_avg.py +60 -0
model_analyzer/record/types/perf_latency_base.py +74 -0
model_analyzer/record/types/perf_latency_p90.py +60 -0
model_analyzer/record/types/perf_latency_p95.py +60 -0
model_analyzer/record/types/perf_latency_p99.py +60 -0
model_analyzer/record/types/perf_server_compute_infer.py +97 -0
model_analyzer/record/types/perf_server_compute_input.py +97 -0
model_analyzer/record/types/perf_server_compute_output.py +97 -0
model_analyzer/record/types/perf_server_queue.py +97 -0
model_analyzer/record/types/perf_throughput.py +105 -0
model_analyzer/record/types/time_to_first_token_avg.py +60 -0
model_analyzer/record/types/time_to_first_token_base.py +74 -0
model_analyzer/record/types/time_to_first_token_max.py +60 -0
model_analyzer/record/types/time_to_first_token_min.py +60 -0
model_analyzer/record/types/time_to_first_token_p25.py +60 -0
model_analyzer/record/types/time_to_first_token_p50.py +60 -0
model_analyzer/record/types/time_to_first_token_p75.py +60 -0
model_analyzer/record/types/time_to_first_token_p90.py +60 -0
model_analyzer/record/types/time_to_first_token_p95.py +60 -0
model_analyzer/record/types/time_to_first_token_p99.py +60 -0
model_analyzer/reports/__init__.py +15 -0
model_analyzer/reports/html_report.py +195 -0
model_analyzer/reports/pdf_report.py +50 -0
model_analyzer/reports/report.py +86 -0
model_analyzer/reports/report_factory.py +62 -0
model_analyzer/reports/report_manager.py +1376 -0
model_analyzer/reports/report_utils.py +42 -0
model_analyzer/result/__init__.py +15 -0
model_analyzer/result/constraint_manager.py +150 -0
model_analyzer/result/model_config_measurement.py +354 -0
model_analyzer/result/model_constraints.py +105 -0
model_analyzer/result/parameter_search.py +246 -0
model_analyzer/result/result_manager.py +430 -0
model_analyzer/result/result_statistics.py +159 -0
model_analyzer/result/result_table.py +217 -0
model_analyzer/result/result_table_manager.py +646 -0
model_analyzer/result/result_utils.py +42 -0
model_analyzer/result/results.py +277 -0
model_analyzer/result/run_config_measurement.py +658 -0
model_analyzer/result/run_config_result.py +210 -0
model_analyzer/result/run_config_result_comparator.py +110 -0
model_analyzer/result/sorted_results.py +151 -0
model_analyzer/state/__init__.py +15 -0
model_analyzer/state/analyzer_state.py +76 -0
model_analyzer/state/analyzer_state_manager.py +215 -0
model_analyzer/triton/__init__.py +15 -0
model_analyzer/triton/client/__init__.py +15 -0
model_analyzer/triton/client/client.py +234 -0
model_analyzer/triton/client/client_factory.py +57 -0
model_analyzer/triton/client/grpc_client.py +104 -0
model_analyzer/triton/client/http_client.py +107 -0
model_analyzer/triton/model/__init__.py +15 -0
model_analyzer/triton/model/model_config.py +556 -0
model_analyzer/triton/model/model_config_variant.py +29 -0
model_analyzer/triton/server/__init__.py +15 -0
model_analyzer/triton/server/server.py +76 -0
model_analyzer/triton/server/server_config.py +269 -0
model_analyzer/triton/server/server_docker.py +229 -0
model_analyzer/triton/server/server_factory.py +306 -0
model_analyzer/triton/server/server_local.py +158 -0
triton_model_analyzer-1.48.0.dist-info/METADATA +52 -0
triton_model_analyzer-1.48.0.dist-info/RECORD +204 -0
triton_model_analyzer-1.48.0.dist-info/WHEEL +5 -0
triton_model_analyzer-1.48.0.dist-info/entry_points.txt +2 -0
triton_model_analyzer-1.48.0.dist-info/licenses/LICENSE +67 -0
triton_model_analyzer-1.48.0.dist-info/top_level.txt +1 -0

model_analyzer/plots/detailed_plot.py ADDED Viewed

@@ -0,0 +1,266 @@
+#!/usr/bin/env python3
+# Copyright 2021-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import logging
+import os
+from collections import defaultdict
+import matplotlib.pyplot as plt
+from matplotlib import patches as mpatches
+from model_analyzer.constants import LOGGER_NAME
+from model_analyzer.record.metrics_manager import MetricsManager
+# Raise the "matplotlib" logger's threshold so only ERROR and above are emitted
+logging.getLogger("matplotlib").setLevel(logging.ERROR)
+# Module logger, looked up by the LOGGER_NAME imported from model_analyzer.constants
+logger = logging.getLogger(LOGGER_NAME)
+class DetailedPlot:
+    """
+    A wrapper class around a matplotlib
+    plot that adapts with the kinds of
+    plots the model analyzer wants to generates
+    Detailed plots detail th
+    """
+    detailed_metrics = [
+        "perf_server_queue",
+        "perf_server_compute_input",
+        "perf_server_compute_infer",
+        "perf_server_compute_output",
+    ]
+    def __init__(self, name, title, bar_width=0.5):
+        """
+        Parameters
+        ----------
+        name: str
+            The name of the file that the plot
+            will be saved as
+        title : str
+            The title of this plot/figure
+        bar_width: float
+            width of the latency breakdown bars
+        """
+        self._name = name
+        self._title = title
+        self._fig, self._ax_latency = plt.subplots()
+        self._ax_latency.set_title(title)
+        self._ax_throughput = self._ax_latency.twinx()
+        latency_axis_label, throughput_axis_label = [
+            metric.header(aggregation_tag="")
+            for metric in MetricsManager.get_metric_types(
+                ["perf_latency_avg", "perf_throughput"]
+            )
+        ]
+        # Okabe-Ito guideline colors for colorblind
+        # https://jfly.uni-koeln.de/color/#select
+        self._bar_colors = {
+            "perf_server_queue": "#e69f00",
+            "perf_server_compute_input": "#56b4e9",
+            "perf_server_compute_infer": "#009e73",
+            "perf_server_compute_output": "#f0e442",
+            "perf_throughput": "#000000",
+        }
+        self._bar_width = bar_width
+        self._legend_x = 0.92
+        self._legend_y = 1.15
+        self._legend_font_size = 10
+        self._fig.set_figheight(8)
+        self._fig.set_figwidth(12)
+        self._ax_latency.set_xlabel("Concurrent Client Requests")
+        self._ax_latency.set_ylabel(latency_axis_label)
+        self._ax_throughput.set_ylabel(throughput_axis_label)
+        self._data = defaultdict(list)
+    def data(self):
+        """
+        Get the data in this plot
+        Returns
+        -------
+        dict
+            keys are line labels
+            and values are lists of floats
+        """
+        return self._data
+    def add_run_config_measurement(self, run_config_measurement):
+        """
+        Adds a measurement to this plot
+        Parameters
+        ----------
+        measurement : Measurement
+            The measurement containing the data to
+            be plotted.
+        """
+        # TODO-TMA-568: This needs to be updated because there will be multiple model configs
+        if (
+            "concurrency-range" in run_config_measurement.model_specific_pa_params()[0]
+            and run_config_measurement.model_specific_pa_params()[0][
+                "concurrency-range"
+            ]
+        ):
+            self._data["concurrency"].append(
+                run_config_measurement.model_specific_pa_params()[0][
+                    "concurrency-range"
+                ]
+            )
+        if (
+            "request-rate-range" in run_config_measurement.model_specific_pa_params()[0]
+            and run_config_measurement.model_specific_pa_params()[0][
+                "request-rate-range"
+            ]
+        ):
+            self._data["request_rate"].append(
+                run_config_measurement.model_specific_pa_params()[0][
+                    "request-rate-range"
+                ]
+            )
+        self._data["perf_throughput"].append(
+            run_config_measurement.get_non_gpu_metric_value(tag="perf_throughput")
+        )
+        for metric in self.detailed_metrics:
+            if MetricsManager.is_gpu_metric(tag=metric):
+                self._data[metric].append(
+                    run_config_measurement.get_gpu_metric_value(tag=metric)
+                )
+            else:
+                self._data[metric].append(
+                    run_config_measurement.get_non_gpu_metric_value(tag=metric)
+                )
+    def plot_data(self):
+        """
+        Calls plotting function
+        on this plot's Axes object
+        """
+        # Need to change the default x-axis plot title for request rates
+        if "request_rate" in self._data and self._data["request_rate"][0]:
+            self._ax_latency.set_xlabel("Client Request Rate")
+        # Sort the data by request rate or concurrency
+        if "request_rate" in self._data and self._data["request_rate"][0]:
+            sort_indices = list(
+                zip(*sorted(enumerate(self._data["request_rate"]), key=lambda x: x[1]))
+            )[0]
+        else:
+            sort_indices = list(
+                zip(*sorted(enumerate(self._data["concurrency"]), key=lambda x: x[1]))
+            )[0]
+        sorted_data = {
+            key: [data_list[i] for i in sort_indices]
+            for key, data_list in self._data.items()
+        }
+        # Plot latency breakdown bars
+        labels = dict(
+            zip(
+                self.detailed_metrics,
+                [
+                    metric.header()
+                    for metric in MetricsManager.get_metric_types(
+                        tags=self.detailed_metrics
+                    )
+                ],
+            )
+        )
+        bottoms = None
+        if "request_rate" in self._data:
+            sorted_data["indices"] = list(map(str, sorted_data["request_rate"]))
+        else:
+            sorted_data["indices"] = list(map(str, sorted_data["concurrency"]))
+        # Plot latency breakdown with concurrency casted as string to make uniform x
+        for metric, label in labels.items():
+            self._ax_latency.bar(
+                sorted_data["indices"],
+                sorted_data[metric],
+                width=self._bar_width,
+                label=label,
+                bottom=bottoms,
+                color=self._bar_colors[metric],
+            )
+            if not bottoms:
+                bottoms = sorted_data[metric]
+            else:
+                bottoms = list(map(lambda x, y: x + y, bottoms, sorted_data[metric]))
+        # Plot the inference line
+        inference_line = self._ax_throughput.plot(
+            sorted_data["indices"],
+            sorted_data["perf_throughput"],
+            label="Inferences/second",
+            marker="o",
+            color=self._bar_colors["perf_throughput"],
+        )
+        # Create legend handles
+        handles = [
+            mpatches.Patch(color=self._bar_colors[m], label=labels[m])
+            for m in self._bar_colors
+            if m != "perf_throughput"
+        ]
+        handles.append(inference_line[0])
+        self._ax_latency.legend(
+            handles=handles,
+            ncol=(len(self._bar_colors) // 2) + 1,
+            bbox_to_anchor=(self._legend_x, self._legend_y),
+            prop=dict(size=self._legend_font_size),
+        )
+        # Annotate inferences
+        for x, y in zip(sorted_data["indices"], sorted_data["perf_throughput"]):
+            self._ax_throughput.annotate(
+                str(round(y, 2)),
+                xy=(x, y),
+                textcoords="offset points",  # how to position the text
+                xytext=(0, 10),  # distance from text to points (x,y)
+                ha="center",
+            )
+        self._ax_latency.grid()
+        self._ax_latency.set_axisbelow(True)
+    def save(self, filepath):
+        """
+        Saves a .png of the plot to disk
+        Parameters
+        ----------
+        filepath : the path to the directory
+            this plot should be saved to
+        """
+        self._fig.savefig(os.path.join(filepath, self._name))

model_analyzer/plots/plot_manager.py ADDED Viewed

@@ -0,0 +1,224 @@
+#!/usr/bin/env python3
+# Copyright 2021-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import os
+from collections import defaultdict
+from typing import DefaultDict, Dict, Union
+from model_analyzer.config.input.config_command_profile import ConfigCommandProfile
+from model_analyzer.config.input.config_command_report import ConfigCommandReport
+from model_analyzer.config.input.config_defaults import DEFAULT_CPU_MEM_PLOT
+from model_analyzer.config.input.objects.config_plot import ConfigPlot
+from model_analyzer.constants import GLOBAL_CONSTRAINTS_KEY, TOP_MODELS_REPORT_KEY
+from model_analyzer.result.constraint_manager import ConstraintManager
+from model_analyzer.result.result_manager import ResultManager
+from .detailed_plot import DetailedPlot
+from .simple_plot import SimplePlot
+class PlotManager:
+    """
+    This class manages the construction and arrangement
+    of plots generated by model analyzer
+    """
+    def __init__(
+        self,
+        config: Union[ConfigCommandProfile, ConfigCommandReport],
+        result_manager: ResultManager,
+        constraint_manager: ConstraintManager,
+    ):
+        """
+        Parameters
+        ----------
+        config : ConfigCommandProfile or ConfigCommandReport
+            The model analyzer's config containing information
+            about the kind of plots to generate
+        result_manager : ResultManager
+            instance that manages the result tables and
+            adding results
+        constraint_manager: ConstraintManager
+            instance that manages constraints
+        """
+        self._config = config
+        self._result_manager = result_manager
+        # Constraints should be plotted as well
+        self._constraints = constraint_manager.get_constraints_for_all_models()
+        # Construct plot output directory
+        self._plot_export_directory = os.path.join(config.export_path, "plots")
+        os.makedirs(self._plot_export_directory, exist_ok=True)
+        # Dict of list of plots
+        self._simple_plots: DefaultDict[str, Dict[str, SimplePlot]] = defaultdict()
+        self._detailed_plots: Dict[str, DetailedPlot] = {}
+    def create_summary_plots(self):
+        """
+        Constructs simple plots based on config specs
+        """
+        model_names = self._result_manager._profile_model_names
+        for plots_key in model_names:
+            self._create_summary_plot_for_model(
+                plots_key=plots_key,
+                model_name=plots_key,
+                num_results=self._config.num_configs_per_model,
+            )
+        if self._config.num_top_model_configs:
+            self._create_summary_plot_for_model(
+                plots_key=TOP_MODELS_REPORT_KEY,
+                model_name=None,
+                num_results=self._config.num_top_model_configs,
+            )
+    def _create_summary_plot_for_model(self, model_name, plots_key, num_results):
+        """
+        helper function that creates the summary plots
+        for a given model
+        """
+        for plot_config in self._config.plots:
+            constraints = self._constraints[GLOBAL_CONSTRAINTS_KEY]
+            if plots_key in self._constraints:
+                constraints = self._constraints[plots_key]
+            for run_config_result in self._result_manager.top_n_results(
+                model_name=model_name, n=num_results, include_default=True
+            ):
+                if run_config_result.run_config().cpu_only():
+                    if plot_config.y_axis() == "gpu_used_memory":
+                        plot_name, plot_config_dict = list(
+                            DEFAULT_CPU_MEM_PLOT.items()
+                        )[0]
+                        plot_config = ConfigPlot(plot_name, **plot_config_dict)
+                self._create_update_simple_plot(
+                    plots_key=plots_key,
+                    plot_config=plot_config,
+                    run_config_measurements=run_config_result.run_config_measurements(),
+                    constraints=constraints,
+                )
+    def _create_update_simple_plot(
+        self, plots_key, plot_config, run_config_measurements, constraints
+    ):
+        """
+        Creates or updates a single simple plot, given a config name,
+        some measurements, and a key to put the plot into the simple plots
+        """
+        if plots_key not in self._simple_plots:
+            self._simple_plots[plots_key] = {}
+        if plot_config.name() not in self._simple_plots[plots_key]:
+            self._simple_plots[plots_key][plot_config.name()] = SimplePlot(
+                name=plot_config.name(),
+                title=plot_config.title(),
+                x_axis=plot_config.x_axis(),
+                y_axis=plot_config.y_axis(),
+                monotonic=plot_config.monotonic(),
+            )
+        for run_config_measurement in run_config_measurements:
+            self._simple_plots[plots_key][
+                plot_config.name()
+            ].add_run_config_measurement(
+                label=run_config_measurement.model_variants_name(),
+                run_config_measurement=run_config_measurement,
+            )
+        # In case this plot already had lines, we want to clear and replot
+        self._simple_plots[plots_key][plot_config.name()].clear()
+        self._simple_plots[plots_key][plot_config.name()].plot_data_and_constraints(
+            constraints=constraints
+        )
+    def create_detailed_plots(self):
+        """
+        Constructs detailed plots based on
+        requested config specs
+        """
+        # Create detailed plots
+        for model in self._config.report_model_configs:
+            model_config_name = model.model_config_name()
+            self._detailed_plots[model_config_name] = DetailedPlot(
+                f"latency_breakdown", "Online Performance"
+            )
+            (
+                model_config,
+                run_config_measurements,
+            ) = self._result_manager.get_model_configs_run_config_measurements(
+                model_config_name
+            )
+            # If model_config_name was present in results
+            if run_config_measurements:
+                for run_config_measurement in run_config_measurements:
+                    self._detailed_plots[model_config_name].add_run_config_measurement(
+                        run_config_measurement
+                    )
+                self._detailed_plots[model_config_name].plot_data()
+            # Create the simple plots for the detailed reports
+            for plot_config in model.plots():
+                if model_config.cpu_only() and (
+                    plot_config.y_axis().startswith("gpu_")
+                    or plot_config.x_axis().startswith("gpu_")
+                ):
+                    continue
+                self._create_update_simple_plot(
+                    plots_key=model_config_name,
+                    plot_config=plot_config,
+                    run_config_measurements=run_config_measurements,
+                    constraints=None,
+                )
+    def export_summary_plots(self):
+        """
+        write the plots to disk
+        """
+        simple_plot_dir = os.path.join(self._plot_export_directory, "simple")
+        for plots_key, plot_dicts in self._simple_plots.items():
+            model_plot_dir = os.path.join(simple_plot_dir, plots_key)
+            os.makedirs(model_plot_dir, exist_ok=True)
+            for plot in plot_dicts.values():
+                plot.save(model_plot_dir)
+    def export_detailed_plots(self):
+        """
+        Write detailed plots to disk
+        """
+        detailed_plot_dir = os.path.join(self._plot_export_directory, "detailed")
+        simple_plot_dir = os.path.join(self._plot_export_directory, "simple")
+        for model_config_name, detailed_plot in self._detailed_plots.items():
+            detailed_model_config_plot_dir = os.path.join(
+                detailed_plot_dir, model_config_name
+            )
+            os.makedirs(detailed_model_config_plot_dir, exist_ok=True)
+            detailed_plot.save(detailed_model_config_plot_dir)
+            simple_model_config_plot_dir = os.path.join(
+                simple_plot_dir, model_config_name
+            )
+            os.makedirs(simple_model_config_plot_dir, exist_ok=True)
+            for simple_plot in self._simple_plots[model_config_name].values():
+                simple_plot.save(simple_model_config_plot_dir)

model_analyzer/plots/simple_plot.py ADDED Viewed

@@ -0,0 +1,213 @@
+#!/usr/bin/env python3
+# Copyright 2021-2023, NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import os
+from collections import defaultdict
+import matplotlib.pyplot as plt
+from model_analyzer.perf_analyzer.perf_config import PerfAnalyzerConfig
+from model_analyzer.record.metrics_manager import MetricsManager
+from model_analyzer.reports.report_utils import truncate_model_config_name
+class SimplePlot:
+    """
+    A wrapper class around a matplotlib
+    plot that adapts to the kinds of
+    plots the model analyzer wants to generate.
+    A single plot holds data for multiple
+    model configs, but only holds one
+    type of plot.
+    """
+    def __init__(self, name, title, x_axis, y_axis, monotonic=False):
+        """
+        Parameters
+        ----------
+        name: str
+            The name of the file that the plot
+            will be saved as
+        title : str
+            The title of this plot/figure
+        x_axis : str
+            The metric tag for the x-axis of this plot
+        y_axis : str
+            The metric tag for the y-axis of this plot
+        monotonic: bool
+            Whether or not to prune decreasing points in this
+            plot
+        """
+        self._name = name
+        self._title = title
+        self._x_axis = x_axis
+        self._y_axis = y_axis
+        self._monotonic = monotonic
+        self._fig, self._ax = plt.subplots()
+        self._data = {}
+    def add_run_config_measurement(self, label, run_config_measurement):
+        """
+        Adds a measurement to this plot
+        Parameters
+        ----------
+        label : str
+            The name of the config(s) this measurement
+            is taken from.
+        run_config_measurement : RunConfigMeasurement
+            The measurement containing the data to
+            be plotted.
+        """
+        if label not in self._data:
+            self._data[label] = defaultdict(list)
+        if self._x_axis.replace("_", "-") in PerfAnalyzerConfig.allowed_keys():
+            self._data[label]["x_data"].append(
+                run_config_measurement.model_specific_pa_params()[0][
+                    self._x_axis.replace("_", "-")
+                ]
+            )
+        else:
+            if MetricsManager.is_gpu_metric(tag=self._x_axis):
+                self._data[label]["x_data"].append(
+                    run_config_measurement.get_gpu_metric_value(tag=self._x_axis)
+                )
+            else:
+                self._data[label]["x_data"].append(
+                    run_config_measurement.get_non_gpu_metric_value(tag=self._x_axis)
+                )
+        if self._y_axis.replace("_", "-") in PerfAnalyzerConfig.allowed_keys():
+            self._data[label]["y_data"].append(
+                run_config_measurement.model_specific_pa_params()[0][
+                    self._y_axis.replace("_", "-")
+                ]
+            )
+        else:
+            if MetricsManager.is_gpu_metric(tag=self._y_axis):
+                self._data[label]["y_data"].append(
+                    run_config_measurement.get_gpu_metric_value(tag=self._y_axis)
+                )
+            else:
+                self._data[label]["y_data"].append(
+                    run_config_measurement.get_non_gpu_metric_value(tag=self._y_axis)
+                )
+    def clear(self):
+        """
+        Clear the contents of the current Axes object
+        """
+        self._ax.clear()
+    def plot_data_and_constraints(self, constraints):
+        """
+        Calls plotting function
+        on this plot's Axes object
+        Parameters
+        ----------
+        constraints: ModelConstraints object
+            The keys are metric tags and values are dicts whose
+            keys are constraint types (min, max) and values are their
+            values
+        """
+        self._ax.set_title(self._title)
+        if self._x_axis.replace("_", "-") in PerfAnalyzerConfig.allowed_keys():
+            self._x_header = self._x_axis.replace("_", " ").title()
+        else:
+            self._x_header = MetricsManager.get_metric_types([self._x_axis])[0].header(
+                aggregation_tag=""
+            )
+        if self._y_axis.replace("_", "-") in PerfAnalyzerConfig.allowed_keys():
+            self._y_header = self._y_axis.replace("_", " ").title()
+        else:
+            self._y_header = MetricsManager.get_metric_types([self._y_axis])[0].header(
+                aggregation_tag=""
+            )
+        self._ax.set_xlabel(self._x_header)
+        self._ax.set_ylabel(self._y_header)
+        for model_config_name, data in self._data.items():
+            # Sort the data by x-axis
+            x_data, y_data = (
+                list(t) for t in zip(*sorted(zip(data["x_data"], data["y_data"])))
+            )
+            model_config_name = truncate_model_config_name(model_config_name)
+            if self._monotonic:
+                filtered_x, filtered_y = [x_data[0]], [y_data[0]]
+                for i in range(1, len(x_data)):
+                    if y_data[i] > filtered_y[-1]:
+                        filtered_x.append(x_data[i])
+                        filtered_y.append(y_data[i])
+                x_data, y_data = filtered_x, filtered_y
+            self._ax.plot(x_data, y_data, marker="o", label=model_config_name)
+        # Plot constraints
+        if constraints:
+            if constraints.has_metric(self._x_axis):
+                for _, constraint_val in constraints[self._x_axis].items():
+                    constraint_label = f"Target {self._x_header.rsplit(' ',1)[0]}"
+                    self._ax.axvline(
+                        x=constraint_val, linestyle="--", label=constraint_label
+                    )
+            if constraints.has_metric(self._y_axis):
+                for _, constraint_val in constraints[self._y_axis].items():
+                    constraint_label = f"Target {self._y_header.rsplit(' ', 1)[0]}"
+                    self._ax.axhline(
+                        y=constraint_val, linestyle="--", label=constraint_label
+                    )
+            # plot h lines
+        self._ax.legend()
+        self._ax.grid()
+    def data(self):
+        """
+        Get the data in this plot
+        Returns
+        -------
+        dict
+            keys are line labels
+            and values are lists of floats
+        """
+        return self._data
+    def save(self, filepath):
+        """
+        Saves a .png of the plot to disk
+        Parameters
+        ----------
+        filepath : the path to the directory
+            this plot should be saved to
+        """
+        self._fig.savefig(os.path.join(filepath, self._name))