PyPI - tt-perf-report - Versions diffs - 1.1.5__tar.gz → 1.1.6__tar.gz - Mend

tt-perf-report 1.1.5.tar.gz → 1.1.6.tar.gz

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of tt-perf-report might be problematic. Click here for more details.

Files changed (14) hide show

{tt_perf_report-1.1.5/src/tt_perf_report.egg-info → tt_perf_report-1.1.6}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: tt-perf-report
-Version: 1.1.5
+Version: 1.1.6
 Summary: This tool analyzes performance traces from TT-Metal operations, providing insights into throughput, bottlenecks, and optimization opportunities.
 License:                                  Apache License
                                    Version 2.0, January 2004

{tt_perf_report-1.1.5 → tt_perf_report-1.1.6}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "tt-perf-report"
-version = "1.1.5"
+version = "1.1.6"
 description = "This tool analyzes performance traces from TT-Metal operations, providing insights into throughput, bottlenecks, and optimization opportunities."
 license = {file = "LICENSE"}
 readme = "README.md"

{tt_perf_report-1.1.5 → tt_perf_report-1.1.6}/src/tt_perf_report/perf_report.py RENAMED Viewed

@@ -866,11 +866,14 @@ def generate_matmul_advice(op_data):
 def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool = False):
+    # Ensure we filter out signpost rows before processing because they aren't useful in the stacked report
+    filtered_rows = [row for row in rows if row["OP TYPE"].raw_value != "signpost"]
     if stack_by_input0_layout:
         visible_headers.append("Input 0 Memory")
     # Create a pandas DataFrame from rows and headers
-    data = {header: [row[header].raw_value for row in rows] for header in visible_headers}
+    data = {header: [row[header].raw_value for row in filtered_rows] for header in visible_headers}
     df = pd.DataFrame(data)
     if (stack_by_input0_layout):
@@ -882,7 +885,7 @@ def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool =
     # Group by the joined OP Code and aggregate the data
     stacked_df = df.groupby("OP Code Joined").agg(
         Device_Time_Sum_us=("Device Time", "sum"),
-        Ops_Count=("Device Time", "count"),
+        Ops_Count=("Device Time", "size"),
         Flops_min=("FLOPs %", "min"),
         Flops_max=("FLOPs %", "max"),
         Flops_mean=("FLOPs %", "mean"),
@@ -897,7 +900,6 @@ def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool =
     else:
         stacked_df["%"] = 0
-    stacked_df["%"] = (stacked_df["Device_Time_Sum_us"] / total_device_time) * 100
     # Reorder columns to move Device_Time_Percentage to be the 3rd column
     cols = stacked_df.columns.tolist()
     cols.insert(0, cols.pop(cols.index("%")))

{tt_perf_report-1.1.5 → tt_perf_report-1.1.6/src/tt_perf_report.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: tt-perf-report
-Version: 1.1.5
+Version: 1.1.6
 Summary: This tool analyzes performance traces from TT-Metal operations, providing insights into throughput, bottlenecks, and optimization opportunities.
 License:                                  Apache License
                                    Version 2.0, January 2004