tt-perf-report 1.0.4__py3-none-any.whl → 1.0.5__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of tt-perf-report might be problematic. Click here for more details.
- tt_perf_report/perf_report.py +24 -2
- tt_perf_report-1.0.5.dist-info/LICENSE_understanding.txt +3 -0
- {tt_perf_report-1.0.4.dist-info → tt_perf_report-1.0.5.dist-info}/METADATA +2 -1
- tt_perf_report-1.0.5.dist-info/RECORD +9 -0
- tt_perf_report-1.0.4.dist-info/RECORD +0 -8
- {tt_perf_report-1.0.4.dist-info → tt_perf_report-1.0.5.dist-info}/LICENSE +0 -0
- {tt_perf_report-1.0.4.dist-info → tt_perf_report-1.0.5.dist-info}/WHEEL +0 -0
- {tt_perf_report-1.0.4.dist-info → tt_perf_report-1.0.5.dist-info}/entry_points.txt +0 -0
- {tt_perf_report-1.0.4.dist-info → tt_perf_report-1.0.5.dist-info}/top_level.txt +0 -0
tt_perf_report/perf_report.py
CHANGED
|
@@ -742,8 +742,28 @@ def merge_device_rows(df):
|
|
|
742
742
|
device_ids = sorted(block_by_device.keys())
|
|
743
743
|
merged_blocks = []
|
|
744
744
|
|
|
745
|
-
|
|
746
|
-
|
|
745
|
+
global_index = 0
|
|
746
|
+
while max(len(block_by_device[device_id]) for device_id in device_ids) > 0:
|
|
747
|
+
blocks = []
|
|
748
|
+
op_name = None
|
|
749
|
+
missing_devices = []
|
|
750
|
+
for device_id in device_ids:
|
|
751
|
+
if not len(block_by_device[device_id]):
|
|
752
|
+
print(colored(f"Warning: Device {device_id} is missing operation {op_name} at index {global_index}", "yellow"))
|
|
753
|
+
continue
|
|
754
|
+
if op_name is None:
|
|
755
|
+
op_name = block_by_device[device_id][0][0]
|
|
756
|
+
elif op_name != block_by_device[device_id][0][0]:
|
|
757
|
+
missing_devices.append(device_id)
|
|
758
|
+
continue
|
|
759
|
+
|
|
760
|
+
blocks.append(block_by_device[device_id].pop(0))
|
|
761
|
+
|
|
762
|
+
if missing_devices:
|
|
763
|
+
print(colored(f"Warning: {op_name} at index {global_index} not present in CSV for {len(missing_devices)} devices {missing_devices} - do not trust data for this op or directly subsequent ops with the same name", "yellow"))
|
|
764
|
+
|
|
765
|
+
if not blocks:
|
|
766
|
+
break
|
|
747
767
|
|
|
748
768
|
if "AllGather" in op_name or "ReduceScatter" in op_name:
|
|
749
769
|
# For collective ops, take the row with minimum duration
|
|
@@ -754,6 +774,8 @@ def merge_device_rows(df):
|
|
|
754
774
|
max_duration_block = max(blocks, key=lambda x: x[1]["DEVICE KERNEL DURATION [ns]"])
|
|
755
775
|
merged_blocks.append(max_duration_block[1])
|
|
756
776
|
|
|
777
|
+
global_index += 1
|
|
778
|
+
|
|
757
779
|
return pd.DataFrame(merged_blocks)
|
|
758
780
|
|
|
759
781
|
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.2
|
|
2
2
|
Name: tt-perf-report
|
|
3
|
-
Version: 1.0.4
|
|
3
|
+
Version: 1.0.5
|
|
4
4
|
Summary: This tool analyzes performance traces from TT-Metal operations, providing insights into throughput, bottlenecks, and optimization opportunities.
|
|
5
5
|
License: Apache License
|
|
6
6
|
Version 2.0, January 2004
|
|
@@ -216,6 +216,7 @@ Project-URL: Repository, https://github.com/tenstorrent/tt-perf-report
|
|
|
216
216
|
Keywords: tenstorrent,tt-metal
|
|
217
217
|
Description-Content-Type: text/markdown
|
|
218
218
|
License-File: LICENSE
|
|
219
|
+
License-File: LICENSE_understanding.txt
|
|
219
220
|
Requires-Dist: pandas
|
|
220
221
|
|
|
221
222
|
# Performance Report Analysis Tool
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
tt_perf_report/__init__.py,sha256=-j4iFYebIwgdS8uphk8-M6zasRqGBL3CQGnJH9keRuI,92
|
|
2
|
+
tt_perf_report/perf_report.py,sha256=14gQ3UMfd6pSqgbaVAhEO62u9lZrls_dx_XxlAqfrkQ,37876
|
|
3
|
+
tt_perf_report-1.0.5.dist-info/LICENSE,sha256=6dZGjPECz_ULS-sf40FLlt6OmQFcrRvmzG5mJRZCQ5I,11825
|
|
4
|
+
tt_perf_report-1.0.5.dist-info/LICENSE_understanding.txt,sha256=pymi-yb_RvYM9p2ZA4iSNsImcvhDBBxlGuJCY9dTq7M,233
|
|
5
|
+
tt_perf_report-1.0.5.dist-info/METADATA,sha256=dOYnleQMhtLCVE3W0aDQNNd92fouRnpfcb66nodBtag,18345
|
|
6
|
+
tt_perf_report-1.0.5.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
|
|
7
|
+
tt_perf_report-1.0.5.dist-info/entry_points.txt,sha256=ReAziglcjbAkPbklqheUISkfoEVI5ptlFrBAJTIk5dI,67
|
|
8
|
+
tt_perf_report-1.0.5.dist-info/top_level.txt,sha256=mEQ-BK3rRbmz9QyWitTCLy2xwmC5rmJno_TY_H9s9CE,15
|
|
9
|
+
tt_perf_report-1.0.5.dist-info/RECORD,,
|
|
@@ -1,8 +0,0 @@
|
|
|
1
|
-
tt_perf_report/__init__.py,sha256=-j4iFYebIwgdS8uphk8-M6zasRqGBL3CQGnJH9keRuI,92
|
|
2
|
-
tt_perf_report/perf_report.py,sha256=MJHgosbw7kD7MrJ6-ZtLhdny_iX9bR_UB-ZaHoyjTsE,36952
|
|
3
|
-
tt_perf_report-1.0.4.dist-info/LICENSE,sha256=6dZGjPECz_ULS-sf40FLlt6OmQFcrRvmzG5mJRZCQ5I,11825
|
|
4
|
-
tt_perf_report-1.0.4.dist-info/METADATA,sha256=fZKE2o9edCU0N6v-_tkUqSZ39j8mimeGBU_SIuuFi84,18305
|
|
5
|
-
tt_perf_report-1.0.4.dist-info/WHEEL,sha256=jB7zZ3N9hIM9adW7qlTAyycLYW9npaWKLRzaoVcLKcM,91
|
|
6
|
-
tt_perf_report-1.0.4.dist-info/entry_points.txt,sha256=ReAziglcjbAkPbklqheUISkfoEVI5ptlFrBAJTIk5dI,67
|
|
7
|
-
tt_perf_report-1.0.4.dist-info/top_level.txt,sha256=mEQ-BK3rRbmz9QyWitTCLy2xwmC5rmJno_TY_H9s9CE,15
|
|
8
|
-
tt_perf_report-1.0.4.dist-info/RECORD,,
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|