PyPI - tt-perf-report - Versions diffs - 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl - Mend

tt-perf-report 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of tt-perf-report might be problematic. Click here for more details.

Files changed (9) hide show

tt_perf_report/perf_report.py CHANGED Viewed

@@ -695,7 +695,7 @@ def color_row(op_data, percentage, min_percentage):
     return op_data
-def print_performance_table(rows, headers, col_widths, device_ops, host_ops):
+def print_performance_table(rows, headers, col_widths, device_ops, host_ops, signpost_count):
     print("\n🚀 Performance Report 🚀\n========================\n")
     print("  ".join(pad_string(header, col_widths[i], align="left") for i, header in enumerate(headers)))
@@ -716,7 +716,7 @@ def print_performance_table(rows, headers, col_widths, device_ops, host_ops):
         "ID": Cell(""),
         "Total %": Cell(100.0, unit="%", decimals=1),
         "Bound": Cell(""),
-        "OP Code": Cell(f"{device_ops} device ops, {host_ops} host ops"),
+        "OP Code": Cell(f"{device_ops} device ops, {host_ops} host ops, {signpost_count} signposts"),
         "Device Time": Cell(total_device_time, unit="us", decimals=0),
         "Op-to-Op Gap": Cell(total_visible_gap, unit="us", decimals=0),
     }
@@ -866,11 +866,14 @@ def generate_matmul_advice(op_data):
 def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool = False):
+    # Ensure we filter out signpost rows before processing because they aren't useful in the stacked report
+    filtered_rows = filter_signposts(rows)
     if stack_by_input0_layout:
         visible_headers.append("Input 0 Memory")
     # Create a pandas DataFrame from rows and headers
-    data = {header: [row[header].raw_value for row in rows] for header in visible_headers}
+    data = {header: [row[header].raw_value for row in filtered_rows] for header in visible_headers}
     df = pd.DataFrame(data)
     if (stack_by_input0_layout):
@@ -882,7 +885,7 @@ def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool =
     # Group by the joined OP Code and aggregate the data
     stacked_df = df.groupby("OP Code Joined").agg(
         Device_Time_Sum_us=("Device Time", "sum"),
-        Ops_Count=("Device Time", "count"),
+        Ops_Count=("Device Time", "size"),
         Flops_min=("FLOPs %", "min"),
         Flops_max=("FLOPs %", "max"),
         Flops_mean=("FLOPs %", "mean"),
@@ -897,7 +900,6 @@ def generate_stacked_report(rows, visible_headers, stack_by_input0_layout:bool =
     else:
         stacked_df["%"] = 0
-    stacked_df["%"] = (stacked_df["Device_Time_Sum_us"] / total_device_time) * 100
     # Reorder columns to move Device_Time_Percentage to be the 3rd column
     cols = stacked_df.columns.tolist()
     cols.insert(0, cols.pop(cols.index("%")))
@@ -1054,6 +1056,8 @@ def filter_by_id_range(rows, id_range):
 def filter_host_ops(rows):
     return [row for row in rows if not is_host_op(row)]
+def filter_signposts(rows):
+    return [row for row in rows if not is_signpost_op(row)]
 def main():
     args, id_range = parse_args()
@@ -1137,18 +1141,26 @@ def generate_perf_report(csv_file, signpost, ignore_signposts, min_percentage,
     prev_row = None
     device_ops = 0
     host_ops = 0
+    signpost_count = 0
     for _, row in df.iterrows():
         op_data, current_gap = analyze_op(row, prev_row, csv_format)
         op_data["ID"] = Cell(row["ORIGINAL_ROW"])  # Use the original row number
         op_data["Global Call Count"] = Cell(row["GLOBAL CALL COUNT"])
         if raw_op_codes:
             op_data["Raw OP Code"] = Cell(row["OP CODE"])
+        # OP TYPE column is only present in raw format/df and is not part of the op_data/rows dictionary used later
+        # append " (signpost)" to the OP Code if this row is a signpost to distinguish it
+        if "signpost" in row["OP TYPE"]:
+            op_data["OP Code"].raw_value = f"{row['OP CODE']} (signpost)"
         rows.append(op_data)
         prev_row = row
-        # Count device and host ops
+        # Count device and host ops, ignore signposts
         if is_host_op(op_data):
             host_ops += 1
+        elif is_signpost_op(op_data):
+            signpost_count += 1
         else:
             device_ops += 1
@@ -1216,7 +1228,7 @@ def generate_perf_report(csv_file, signpost, ignore_signposts, min_percentage,
             max(max(visible_length(str(row[header])) for row in rows), visible_length(header))
             for header in visible_headers
         ]
-        print_performance_table(rows, visible_headers, col_widths, device_ops, host_ops)
+        print_performance_table(rows, visible_headers, col_widths, device_ops, host_ops, signpost_count)
         if not no_advice:
             print_advice_section(rows, visible_headers, col_widths)
@@ -1240,6 +1252,8 @@ def generate_perf_report(csv_file, signpost, ignore_signposts, min_percentage,
 def is_host_op(op_data):
     return "(torch)" in op_data["OP Code"].raw_value
+def is_signpost_op(op_data):
+    return  "signpost" in op_data["OP Code"].raw_value
 if __name__ == "__main__":
     main()

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: tt-perf-report
-Version: 1.1.5
+Version: 1.1.7
 Summary: This tool analyzes performance traces from TT-Metal operations, providing insights into throughput, bottlenecks, and optimization opportunities.
 License:                                  Apache License
                                    Version 2.0, January 2004

tt_perf_report-1.1.7.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,9 @@
+tt_perf_report/__init__.py,sha256=-j4iFYebIwgdS8uphk8-M6zasRqGBL3CQGnJH9keRuI,92
+tt_perf_report/perf_report.py,sha256=V1oJ_cyJyFm4UGMzwMBn3XcDgvE1YoYnvdGvMldjLQE,50697
+tt_perf_report-1.1.7.dist-info/licenses/LICENSE,sha256=6dZGjPECz_ULS-sf40FLlt6OmQFcrRvmzG5mJRZCQ5I,11825
+tt_perf_report-1.1.7.dist-info/licenses/LICENSE_understanding.txt,sha256=pymi-yb_RvYM9p2ZA4iSNsImcvhDBBxlGuJCY9dTq7M,233
+tt_perf_report-1.1.7.dist-info/METADATA,sha256=VP1UPkbAKmOXhj6h4KBU1BofDAZ17JKJRLnT3qHI2zY,18393
+tt_perf_report-1.1.7.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+tt_perf_report-1.1.7.dist-info/entry_points.txt,sha256=ReAziglcjbAkPbklqheUISkfoEVI5ptlFrBAJTIk5dI,67
+tt_perf_report-1.1.7.dist-info/top_level.txt,sha256=mEQ-BK3rRbmz9QyWitTCLy2xwmC5rmJno_TY_H9s9CE,15
+tt_perf_report-1.1.7.dist-info/RECORD,,

tt_perf_report-1.1.5.dist-info/RECORD DELETED Viewed

@@ -1,9 +0,0 @@
-tt_perf_report/__init__.py,sha256=-j4iFYebIwgdS8uphk8-M6zasRqGBL3CQGnJH9keRuI,92
-tt_perf_report/perf_report.py,sha256=Ziln0oeY7zQVUcVLaHwkh17taz6CGyR9r32Yd3PhKko,49951
-tt_perf_report-1.1.5.dist-info/licenses/LICENSE,sha256=6dZGjPECz_ULS-sf40FLlt6OmQFcrRvmzG5mJRZCQ5I,11825
-tt_perf_report-1.1.5.dist-info/licenses/LICENSE_understanding.txt,sha256=pymi-yb_RvYM9p2ZA4iSNsImcvhDBBxlGuJCY9dTq7M,233
-tt_perf_report-1.1.5.dist-info/METADATA,sha256=iGf6JsPN_wjHpDlSLC99Pso9J9Ez2x7wZHGK0JY-yR0,18393
-tt_perf_report-1.1.5.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-tt_perf_report-1.1.5.dist-info/entry_points.txt,sha256=ReAziglcjbAkPbklqheUISkfoEVI5ptlFrBAJTIk5dI,67
-tt_perf_report-1.1.5.dist-info/top_level.txt,sha256=mEQ-BK3rRbmz9QyWitTCLy2xwmC5rmJno_TY_H9s9CE,15
-tt_perf_report-1.1.5.dist-info/RECORD,,

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/WHEEL RENAMED Viewed

File without changes

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/licenses/LICENSE_understanding.txt RENAMED Viewed

File without changes

{tt_perf_report-1.1.5.dist-info → tt_perf_report-1.1.7.dist-info}/top_level.txt RENAMED Viewed

File without changes

tt-perf-report 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl

Potentially problematic release.

tt-perf-report 1.1.5__py3-none-any.whl → 1.1.7__py3-none-any.whl