mindstudio-probe 1.2.2__py3-none-any.whl → 8.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (261):
  1. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/METADATA +4 -3
  2. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/RECORD +243 -191
  3. msprobe/README.md +57 -21
  4. msprobe/core/__init__.py +17 -0
  5. msprobe/core/common/const.py +224 -82
  6. msprobe/core/common/decorator.py +50 -0
  7. msprobe/core/common/exceptions.py +5 -3
  8. msprobe/core/common/file_utils.py +274 -40
  9. msprobe/core/common/framework_adapter.py +169 -0
  10. msprobe/core/common/global_lock.py +86 -0
  11. msprobe/core/common/runtime.py +25 -0
  12. msprobe/core/common/utils.py +148 -72
  13. msprobe/core/common_config.py +7 -0
  14. msprobe/core/compare/acc_compare.py +640 -462
  15. msprobe/core/compare/check.py +36 -107
  16. msprobe/core/compare/compare_cli.py +4 -0
  17. msprobe/core/compare/config.py +72 -0
  18. msprobe/core/compare/highlight.py +217 -215
  19. msprobe/core/compare/layer_mapping/layer_mapping.py +4 -1
  20. msprobe/core/compare/merge_result/merge_result.py +12 -6
  21. msprobe/core/compare/multiprocessing_compute.py +227 -107
  22. msprobe/core/compare/npy_compare.py +32 -16
  23. msprobe/core/compare/utils.py +218 -244
  24. msprobe/{mindspore/runtime.py → core/config_check/__init__.py} +2 -4
  25. msprobe/{pytorch/dump/kernel_dump/kernel_config.py → core/config_check/checkers/__init__.py} +8 -16
  26. msprobe/core/config_check/checkers/base_checker.py +60 -0
  27. msprobe/core/config_check/checkers/dataset_checker.py +138 -0
  28. msprobe/core/config_check/checkers/env_args_checker.py +96 -0
  29. msprobe/core/config_check/checkers/hyperparameter_checker.py +170 -0
  30. msprobe/core/config_check/checkers/pip_checker.py +90 -0
  31. msprobe/core/config_check/checkers/random_checker.py +367 -0
  32. msprobe/core/config_check/checkers/weights_checker.py +147 -0
  33. msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +74 -0
  34. msprobe/core/config_check/ckpt_compare/megatron_loader.py +302 -0
  35. msprobe/core/config_check/ckpt_compare/metrics.py +83 -0
  36. msprobe/core/config_check/ckpt_compare/name_mapping.yaml +12 -0
  37. msprobe/core/config_check/config_check_cli.py +51 -0
  38. msprobe/core/config_check/config_checker.py +100 -0
  39. msprobe/{pytorch/parse.py → core/config_check/resource/dependency.yaml} +7 -4
  40. msprobe/core/config_check/resource/env.yaml +57 -0
  41. msprobe/core/config_check/resource/hyperparameter.yaml +21 -0
  42. msprobe/core/config_check/utils/hyperparameter_parser.py +115 -0
  43. msprobe/core/config_check/utils/utils.py +107 -0
  44. msprobe/core/data_dump/api_registry.py +239 -0
  45. msprobe/core/data_dump/data_collector.py +36 -9
  46. msprobe/core/data_dump/data_processor/base.py +74 -53
  47. msprobe/core/data_dump/data_processor/mindspore_processor.py +119 -78
  48. msprobe/core/data_dump/data_processor/pytorch_processor.py +134 -96
  49. msprobe/core/data_dump/json_writer.py +146 -57
  50. msprobe/core/debugger/precision_debugger.py +143 -0
  51. msprobe/core/grad_probe/constant.py +2 -1
  52. msprobe/core/grad_probe/grad_compare.py +2 -2
  53. msprobe/core/grad_probe/utils.py +1 -1
  54. msprobe/core/hook_manager.py +242 -0
  55. msprobe/core/monitor/anomaly_processor.py +384 -0
  56. msprobe/core/overflow_check/abnormal_scene.py +2 -0
  57. msprobe/core/service.py +356 -0
  58. msprobe/core/single_save/__init__.py +0 -0
  59. msprobe/core/single_save/single_comparator.py +243 -0
  60. msprobe/core/single_save/single_saver.py +157 -0
  61. msprobe/docs/01.installation.md +6 -5
  62. msprobe/docs/02.config_introduction.md +89 -30
  63. msprobe/docs/03.config_examples.md +1 -0
  64. msprobe/docs/04.kernel_dump_PyTorch.md +1 -1
  65. msprobe/docs/05.data_dump_PyTorch.md +184 -50
  66. msprobe/docs/06.data_dump_MindSpore.md +193 -28
  67. msprobe/docs/07.accuracy_checker_PyTorch.md +13 -3
  68. msprobe/docs/08.accuracy_checker_online_PyTorch.md +72 -10
  69. msprobe/docs/09.accuracy_checker_MindSpore.md +19 -7
  70. msprobe/docs/10.accuracy_compare_PyTorch.md +266 -102
  71. msprobe/docs/11.accuracy_compare_MindSpore.md +117 -43
  72. msprobe/docs/12.overflow_check_PyTorch.md +5 -3
  73. msprobe/docs/13.overflow_check_MindSpore.md +6 -4
  74. msprobe/docs/14.data_parse_PyTorch.md +4 -10
  75. msprobe/docs/17.grad_probe.md +2 -1
  76. msprobe/docs/18.online_dispatch.md +3 -3
  77. msprobe/docs/19.monitor.md +211 -103
  78. msprobe/docs/21.visualization_PyTorch.md +100 -28
  79. msprobe/docs/22.visualization_MindSpore.md +103 -31
  80. msprobe/docs/23.generate_operator_PyTorch.md +9 -9
  81. msprobe/docs/25.tool_function_introduction.md +23 -22
  82. msprobe/docs/26.data_dump_PyTorch_baseline.md +14 -3
  83. msprobe/docs/27.dump_json_instruction.md +278 -8
  84. msprobe/docs/28.debugger_save_instruction.md +111 -20
  85. msprobe/docs/28.kernel_dump_MindSpore.md +1 -1
  86. msprobe/docs/29.data_dump_MSAdapter.md +229 -0
  87. msprobe/docs/30.overflow_check_MSAdapter.md +31 -0
  88. msprobe/docs/31.config_check.md +95 -0
  89. msprobe/docs/32.ckpt_compare.md +69 -0
  90. msprobe/docs/33.generate_operator_MindSpore.md +190 -0
  91. msprobe/docs/34.RL_collect.md +92 -0
  92. msprobe/docs/35.nan_analyze.md +72 -0
  93. msprobe/docs/FAQ.md +3 -11
  94. msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +12 -1
  95. msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +3 -1
  96. msprobe/docs/img/compare_result.png +0 -0
  97. msprobe/docs/img/merge_result.png +0 -0
  98. msprobe/docs/img/save_compare_result_sample.png +0 -0
  99. msprobe/docs/img/visualization/proxy.png +0 -0
  100. msprobe/docs/img/visualization/vis_browser_1.png +0 -0
  101. msprobe/docs/img/visualization/vis_match_info.png +0 -0
  102. msprobe/docs/img/visualization/vis_precision_info.png +0 -0
  103. msprobe/docs/img/visualization/vis_search_info.png +0 -0
  104. msprobe/docs/img/visualization/vis_show_info.png +0 -0
  105. msprobe/docs/img/visualization/vis_showcase.png +0 -0
  106. msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
  107. msprobe/mindspore/__init__.py +3 -3
  108. msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +151 -55
  109. msprobe/mindspore/api_accuracy_checker/api_runner.py +25 -11
  110. msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +2 -1
  111. msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +580 -0
  112. msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +41 -0
  113. msprobe/mindspore/api_accuracy_checker/cmd_parser.py +4 -0
  114. msprobe/mindspore/api_accuracy_checker/data_manager.py +4 -3
  115. msprobe/mindspore/api_accuracy_checker/generate_op_script/config_op.json +9 -0
  116. msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +451 -0
  117. msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +2081 -0
  118. msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +11 -1
  119. msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +2 -1
  120. msprobe/mindspore/cell_processor.py +204 -33
  121. msprobe/mindspore/code_mapping/graph_parser.py +4 -21
  122. msprobe/mindspore/common/const.py +73 -2
  123. msprobe/mindspore/common/utils.py +157 -29
  124. msprobe/mindspore/compare/common_dir_compare.py +382 -0
  125. msprobe/mindspore/compare/distributed_compare.py +2 -26
  126. msprobe/mindspore/compare/ms_compare.py +18 -398
  127. msprobe/mindspore/compare/ms_graph_compare.py +20 -10
  128. msprobe/mindspore/compare/utils.py +37 -0
  129. msprobe/mindspore/debugger/debugger_config.py +59 -7
  130. msprobe/mindspore/debugger/precision_debugger.py +83 -90
  131. msprobe/mindspore/dump/cell_dump_process.py +902 -0
  132. msprobe/mindspore/dump/cell_dump_with_insert_gradient.py +889 -0
  133. msprobe/mindspore/dump/dump_tool_factory.py +18 -8
  134. msprobe/mindspore/dump/graph_mode_cell_dump.py +139 -0
  135. msprobe/mindspore/dump/graph_tensor_dump.py +123 -0
  136. msprobe/mindspore/dump/hook_cell/api_register.py +176 -0
  137. msprobe/mindspore/dump/hook_cell/hook_cell.py +22 -12
  138. msprobe/mindspore/dump/hook_cell/ms_hook_manager.py +88 -0
  139. msprobe/mindspore/dump/hook_cell/primitive_hooks.py +8 -2
  140. msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +42 -26
  141. msprobe/mindspore/dump/jit_dump.py +35 -27
  142. msprobe/mindspore/dump/kernel_kbyk_dump.py +6 -3
  143. msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +110 -0
  144. msprobe/mindspore/dym_loader/hook_dynamic_loader.h +15 -16
  145. msprobe/mindspore/free_benchmark/api_pynative_self_check.py +22 -12
  146. msprobe/mindspore/free_benchmark/common/utils.py +1 -1
  147. msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +4 -2
  148. msprobe/mindspore/free_benchmark/self_check_tool_factory.py +6 -3
  149. msprobe/mindspore/grad_probe/global_context.py +9 -2
  150. msprobe/mindspore/grad_probe/grad_analyzer.py +2 -1
  151. msprobe/mindspore/grad_probe/grad_stat_csv.py +3 -2
  152. msprobe/mindspore/grad_probe/hook.py +2 -4
  153. msprobe/mindspore/mindspore_service.py +111 -0
  154. msprobe/mindspore/monitor/common_func.py +52 -0
  155. msprobe/mindspore/monitor/data_writers.py +237 -0
  156. msprobe/mindspore/monitor/distributed/wrap_distributed.py +1 -1
  157. msprobe/mindspore/monitor/features.py +13 -1
  158. msprobe/mindspore/monitor/module_hook.py +568 -444
  159. msprobe/mindspore/monitor/optimizer_collect.py +331 -0
  160. msprobe/mindspore/monitor/utils.py +71 -9
  161. msprobe/mindspore/ms_config.py +16 -15
  162. msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +5 -3
  163. msprobe/mindspore/task_handler_factory.py +5 -2
  164. msprobe/msprobe.py +19 -0
  165. msprobe/nan_analyze/__init__.py +14 -0
  166. msprobe/nan_analyze/analyzer.py +255 -0
  167. msprobe/nan_analyze/graph.py +189 -0
  168. msprobe/nan_analyze/utils.py +211 -0
  169. msprobe/pytorch/api_accuracy_checker/common/config.py +2 -2
  170. msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +3 -6
  171. msprobe/pytorch/api_accuracy_checker/compare/compare.py +36 -34
  172. msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +15 -13
  173. msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +206 -4
  174. msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +9 -9
  175. msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +6 -5
  176. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +31 -9
  177. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +28 -20
  178. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +3 -1
  179. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +29 -13
  180. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +12 -2
  181. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +45 -31
  182. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +154 -0
  183. msprobe/pytorch/attl_manager.py +65 -0
  184. msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +6 -0
  185. msprobe/pytorch/bench_functions/npu_fusion_attention.py +27 -0
  186. msprobe/pytorch/common/utils.py +53 -19
  187. msprobe/pytorch/compare/distributed_compare.py +4 -36
  188. msprobe/pytorch/compare/pt_compare.py +13 -84
  189. msprobe/pytorch/compare/utils.py +47 -0
  190. msprobe/pytorch/debugger/debugger_config.py +34 -17
  191. msprobe/pytorch/debugger/precision_debugger.py +50 -96
  192. msprobe/pytorch/dump/module_dump/hook_wrapper.py +93 -0
  193. msprobe/pytorch/dump/module_dump/module_dump.py +15 -61
  194. msprobe/pytorch/dump/module_dump/module_processer.py +150 -114
  195. msprobe/pytorch/free_benchmark/common/utils.py +1 -1
  196. msprobe/pytorch/free_benchmark/compare/single_benchmark.py +1 -1
  197. msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +3 -3
  198. msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +3 -3
  199. msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +1 -1
  200. msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +1 -1
  201. msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +1 -1
  202. msprobe/pytorch/function_factory.py +1 -1
  203. msprobe/pytorch/grad_probe/grad_monitor.py +2 -2
  204. msprobe/pytorch/grad_probe/grad_stat_csv.py +3 -2
  205. msprobe/pytorch/hook_module/api_register.py +155 -0
  206. msprobe/pytorch/hook_module/hook_module.py +18 -22
  207. msprobe/pytorch/hook_module/jit_script_wrapper.py +33 -0
  208. msprobe/pytorch/hook_module/pt_hook_manager.py +68 -0
  209. msprobe/pytorch/hook_module/register_optimizer_hook.py +2 -1
  210. msprobe/pytorch/hook_module/support_wrap_ops.yaml +193 -75
  211. msprobe/pytorch/hook_module/utils.py +28 -2
  212. msprobe/pytorch/monitor/csv2tb.py +14 -4
  213. msprobe/pytorch/monitor/data_writers.py +259 -0
  214. msprobe/pytorch/monitor/distributed/wrap_distributed.py +8 -2
  215. msprobe/pytorch/monitor/module_hook.py +336 -241
  216. msprobe/pytorch/monitor/module_metric.py +17 -0
  217. msprobe/pytorch/monitor/optimizer_collect.py +244 -224
  218. msprobe/pytorch/monitor/utils.py +84 -4
  219. msprobe/pytorch/online_dispatch/compare.py +0 -2
  220. msprobe/pytorch/online_dispatch/dispatch.py +13 -2
  221. msprobe/pytorch/online_dispatch/dump_compare.py +8 -2
  222. msprobe/pytorch/online_dispatch/utils.py +3 -0
  223. msprobe/pytorch/parse_tool/lib/interactive_cli.py +1 -6
  224. msprobe/pytorch/parse_tool/lib/utils.py +5 -4
  225. msprobe/pytorch/pt_config.py +16 -11
  226. msprobe/pytorch/pytorch_service.py +70 -0
  227. msprobe/visualization/builder/graph_builder.py +69 -10
  228. msprobe/visualization/builder/msprobe_adapter.py +24 -12
  229. msprobe/visualization/compare/graph_comparator.py +63 -51
  230. msprobe/visualization/compare/mode_adapter.py +22 -20
  231. msprobe/visualization/graph/base_node.py +11 -4
  232. msprobe/visualization/graph/distributed_analyzer.py +1 -10
  233. msprobe/visualization/graph/graph.py +2 -13
  234. msprobe/visualization/graph/node_op.py +1 -2
  235. msprobe/visualization/graph_service.py +251 -104
  236. msprobe/visualization/utils.py +26 -44
  237. msprobe/mindspore/dump/hook_cell/api_registry.py +0 -207
  238. msprobe/mindspore/dump/hook_cell/wrap_api.py +0 -212
  239. msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +0 -140
  240. msprobe/mindspore/monitor/anomaly_detect.py +0 -404
  241. msprobe/mindspore/monitor/module_spec_verifier.py +0 -94
  242. msprobe/mindspore/service.py +0 -543
  243. msprobe/pytorch/hook_module/api_registry.py +0 -166
  244. msprobe/pytorch/hook_module/wrap_distributed.py +0 -79
  245. msprobe/pytorch/hook_module/wrap_functional.py +0 -66
  246. msprobe/pytorch/hook_module/wrap_npu_custom.py +0 -85
  247. msprobe/pytorch/hook_module/wrap_tensor.py +0 -69
  248. msprobe/pytorch/hook_module/wrap_torch.py +0 -84
  249. msprobe/pytorch/hook_module/wrap_vf.py +0 -60
  250. msprobe/pytorch/monitor/anomaly_analyse.py +0 -201
  251. msprobe/pytorch/monitor/anomaly_detect.py +0 -410
  252. msprobe/pytorch/monitor/module_spec_verifier.py +0 -95
  253. msprobe/pytorch/monitor/unittest/test_monitor.py +0 -160
  254. msprobe/pytorch/service.py +0 -470
  255. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/LICENSE +0 -0
  256. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/WHEEL +0 -0
  257. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/entry_points.txt +0 -0
  258. {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/top_level.txt +0 -0
  259. /msprobe/{mindspore → core}/compare/ms_to_pt_api.yaml +0 -0
  260. /msprobe/{mindspore/dump → core}/kernel_dump/kernel_config.py +0 -0
  261. /msprobe/{pytorch/monitor/unittest → core/monitor}/__init__.py +0 -0
@@ -149,9 +149,9 @@ tensor:
149
149
  - __bool__
150
150
  - __div__
151
151
  - __eq__
152
+ - __floordiv__
152
153
  - __ge__
153
154
  - __gt__
154
- - __getitem__
155
155
  - __iadd__
156
156
  - __iand__
157
157
  - __idiv__
@@ -160,23 +160,33 @@ tensor:
160
160
  - __imod__
161
161
  - __imul__
162
162
  - __ior__
163
+ - __ipow__
163
164
  - __irshift__
164
165
  - __isub__
165
166
  - __ixor__
167
+ - __le__
166
168
  - __lshift__
169
+ - __lt__
167
170
  - __matmul__
168
171
  - __mod__
169
172
  - __mul__
173
+ - __ne__
170
174
  - __nonzero__
171
175
  - __or__
176
+ - __pow__
172
177
  - __radd__
178
+ - __rdiv__
179
+ - __rmod__
173
180
  - __rmul__
181
+ - __ror__
182
+ - __rpow__
174
183
  - __rshift__
184
+ - __rsub__
185
+ - __rxor__
175
186
  - __setitem__
176
187
  - __sub__
177
188
  - __truediv__
178
189
  - __xor__
179
- - __pow__
180
190
  - abs
181
191
  - abs_
182
192
  - absolute
@@ -199,12 +209,14 @@ tensor:
199
209
  - addmv_
200
210
  - addr
201
211
  - addr_
212
+ - adjoint
202
213
  - align_as
203
214
  - align_to
204
215
  - all
205
216
  - allclose
206
217
  - amax
207
218
  - amin
219
+ - aminmax
208
220
  - angle
209
221
  - any
210
222
  - arccos
@@ -216,12 +228,15 @@ tensor:
216
228
  - arcsinh
217
229
  - arcsinh_
218
230
  - arctan
231
+ - arctan2
232
+ - arctan2_
219
233
  - arctan_
220
234
  - arctanh
221
235
  - arctanh_
222
236
  - argmax
223
237
  - argmin
224
238
  - argsort
239
+ - argwhere
225
240
  - asin
226
241
  - asin_
227
242
  - asinh
@@ -236,39 +251,51 @@ tensor:
236
251
  - baddbmm_
237
252
  - bernoulli
238
253
  - bernoulli_
254
+ - bfloat16
239
255
  - bincount
240
256
  - bitwise_and
241
257
  - bitwise_and_
258
+ - bitwise_left_shift
259
+ - bitwise_left_shift_
242
260
  - bitwise_not
243
261
  - bitwise_not_
244
262
  - bitwise_or
245
263
  - bitwise_or_
264
+ - bitwise_right_shift
265
+ - bitwise_right_shift_
246
266
  - bitwise_xor
247
267
  - bitwise_xor_
248
268
  - bmm
269
+ - bool
249
270
  - broadcast_to
271
+ - byte
250
272
  - cauchy_
251
273
  - ceil
252
274
  - ceil_
275
+ - cfloat
276
+ - char
253
277
  - cholesky
278
+ - cholesky_inverse
279
+ - cholesky_solve
254
280
  - chunk
255
281
  - clamp
256
- - cholesky_solve
257
- - cholesky_inverse
258
282
  - clamp_
259
283
  - clamp_max
260
284
  - clamp_max_
261
- - clip
262
285
  - clamp_min
263
286
  - clamp_min_
287
+ - clip
264
288
  - clip_
289
+ - conj_physical
265
290
  - copysign
266
291
  - copysign_
292
+ - corrcoef
267
293
  - cos
268
294
  - cos_
269
295
  - cosh
270
296
  - cosh_
271
297
  - count_nonzero
298
+ - cov
272
299
  - cummax
273
300
  - cummin
274
301
  - cumprod
@@ -282,20 +309,23 @@ tensor:
282
309
  - diag_embed
283
310
  - diagflat
284
311
  - diagonal
312
+ - diagonal_scatter
285
313
  - diff
286
- - dist
287
314
  - digamma
288
315
  - digamma_
316
+ - dist
289
317
  - div
290
318
  - div_
291
319
  - divide
292
320
  - divide_
293
321
  - dot
322
+ - double
323
+ - dsplit
294
324
  - eig
295
325
  - eq
296
326
  - eq_
297
- - erf
298
327
  - equal
328
+ - erf
299
329
  - erf_
300
330
  - erfc
301
331
  - erfc_
@@ -304,18 +334,21 @@ tensor:
304
334
  - exp
305
335
  - exp2
306
336
  - exp2_
307
- - expm1
308
337
  - exp_
338
+ - expand
339
+ - expand_as
340
+ - expm1
309
341
  - expm1_
310
342
  - exponential_
311
343
  - fill_
312
- - fix
313
344
  - fill_diagonal_
345
+ - fix
314
346
  - fix_
347
+ - flatten
315
348
  - flip
316
349
  - fliplr
317
- - flatten
318
350
  - flipud
351
+ - float
319
352
  - float_power
320
353
  - float_power_
321
354
  - floor
@@ -328,6 +361,7 @@ tensor:
328
361
  - fmod_
329
362
  - frac
330
363
  - frac_
364
+ - frexp
331
365
  - gather
332
366
  - gcd
333
367
  - gcd_
@@ -338,31 +372,37 @@ tensor:
338
372
  - ger
339
373
  - greater
340
374
  - greater_
341
- - gt
342
- - gt_
343
375
  - greater_equal
344
376
  - greater_equal_
377
+ - gt
378
+ - gt_
379
+ - half
345
380
  - hardshrink
346
381
  - heaviside
347
382
  - heaviside_
348
383
  - histc
384
+ - histogram
385
+ - hsplit
349
386
  - hypot
350
387
  - hypot_
388
+ - i0
389
+ - i0_
351
390
  - igamma
352
391
  - igamma_
353
392
  - igammac
354
393
  - igammac_
355
394
  - index_add
356
395
  - index_add_
357
- - inverse
358
396
  - index_copy
359
397
  - index_copy_
360
398
  - index_fill
361
399
  - index_fill_
362
400
  - index_put
363
401
  - index_put_
364
- - inner
365
402
  - index_select
403
+ - inner
404
+ - int
405
+ - inverse
366
406
  - isclose
367
407
  - isfinite
368
408
  - isinf
@@ -380,7 +420,6 @@ tensor:
380
420
  - le_
381
421
  - lerp
382
422
  - lerp_
383
- - where
384
423
  - less
385
424
  - less_
386
425
  - less_equal
@@ -397,43 +436,47 @@ tensor:
397
436
  - log_
398
437
  - log_normal_
399
438
  - log_softmax
400
- - logcumsumexp
401
- - logdet
402
439
  - logaddexp
403
440
  - logaddexp2
441
+ - logcumsumexp
442
+ - logdet
404
443
  - logical_and
405
444
  - logical_and_
406
445
  - logical_not
407
- - logit
408
446
  - logical_not_
409
447
  - logical_or
410
448
  - logical_or_
411
449
  - logical_xor
412
450
  - logical_xor_
451
+ - logit
413
452
  - logit_
414
453
  - logsumexp
454
+ - long
415
455
  - lstsq
416
456
  - lt
417
457
  - lt_
458
+ - lu
418
459
  - lu_solve
419
460
  - map2_
420
461
  - map_
421
462
  - masked_fill
422
- - matmul
423
463
  - masked_fill_
424
464
  - masked_scatter
425
465
  - masked_scatter_
426
466
  - masked_select
467
+ - matmul
427
468
  - matrix_exp
469
+ - matrix_power
428
470
  - max
429
471
  - maximum
430
472
  - mean
431
- - matrix_power
432
473
  - median
433
474
  - min
434
475
  - minimum
435
476
  - mm
436
477
  - mode
478
+ - moveaxis
479
+ - movedim
437
480
  - msort
438
481
  - mul
439
482
  - mul_
@@ -443,6 +486,11 @@ tensor:
443
486
  - mv
444
487
  - mvlgamma
445
488
  - mvlgamma_
489
+ - nan_to_num
490
+ - nan_to_num_
491
+ - nanmean
492
+ - nanmedian
493
+ - nanquantile
446
494
  - nansum
447
495
  - narrow
448
496
  - narrow_copy
@@ -452,20 +500,29 @@ tensor:
452
500
  - neg_
453
501
  - negative
454
502
  - negative_
503
+ - nextafter
504
+ - nextafter_
455
505
  - nonzero
456
506
  - norm
457
507
  - normal_
458
508
  - not_equal
459
509
  - not_equal_
510
+ - numpy
511
+ - orgqr
512
+ - ormqr
513
+ - outer
460
514
  - permute
461
515
  - pinverse
462
516
  - polygamma
517
+ - polygamma_
463
518
  - pow
464
519
  - pow_
465
- - polygamma_
466
520
  - prelu
467
521
  - prod
468
522
  - put_
523
+ - q_zero_point
524
+ - qr
525
+ - quantile
469
526
  - rad2deg
470
527
  - rad2deg_
471
528
  - ravel
@@ -474,15 +531,16 @@ tensor:
474
531
  - relu
475
532
  - relu_
476
533
  - remainder
477
- - repeat_interleave
478
- - reshape
479
534
  - remainder_
480
535
  - renorm
481
536
  - renorm_
482
537
  - repeat
538
+ - repeat_interleave
539
+ - reshape
483
540
  - reshape_as
484
541
  - resize_
485
542
  - resize_as_
543
+ - resolve_neg
486
544
  - roll
487
545
  - rot90
488
546
  - round
@@ -496,6 +554,7 @@ tensor:
496
554
  - select
497
555
  - sgn
498
556
  - sgn_
557
+ - short
499
558
  - sigmoid
500
559
  - sigmoid_
501
560
  - sign
@@ -507,11 +566,13 @@ tensor:
507
566
  - sinc_
508
567
  - sinh
509
568
  - sinh_
569
+ - slice_scatter
510
570
  - slogdet
511
571
  - smm
512
572
  - softmax
513
573
  - solve
514
574
  - sort
575
+ - split
515
576
  - split_with_sizes
516
577
  - sqrt
517
578
  - sqrt_
@@ -521,21 +582,29 @@ tensor:
521
582
  - squeeze_
522
583
  - sspaddmm
523
584
  - std
585
+ - stft
586
+ - stride
524
587
  - sub
525
588
  - sub_
589
+ - subtract
526
590
  - sum
527
591
  - sum_to_size
528
592
  - svd
593
+ - swapaxes
594
+ - swapdims
595
+ - swapdims_
529
596
  - symeig
530
597
  - t
531
598
  - t_
532
599
  - take
600
+ - take_along_dim
533
601
  - tan
534
602
  - tan_
535
603
  - tanh
536
604
  - tanh_
537
605
  - tensor_split
538
606
  - tile
607
+ - to
539
608
  - topk
540
609
  - transpose
541
610
  - transpose_
@@ -543,8 +612,8 @@ tensor:
543
612
  - tril
544
613
  - tril_
545
614
  - triu
546
- - true_divide
547
615
  - triu_
616
+ - true_divide
548
617
  - true_divide_
549
618
  - trunc
550
619
  - trunc_
@@ -552,37 +621,20 @@ tensor:
552
621
  - unbind
553
622
  - unflatten
554
623
  - unfold
624
+ - unique
625
+ - unique_consecutive
555
626
  - unsafe_chunk
556
- - unsqueeze
557
627
  - unsafe_split
558
628
  - unsafe_split_with_sizes
629
+ - unsqueeze
630
+ - unsqueeze_
559
631
  - var
560
632
  - vdot
561
- - unsqueeze_
562
633
  - view_as
634
+ - vsplit
635
+ - where
563
636
  - xlogy
564
637
  - xlogy_
565
- - split
566
- - stft
567
- - nan_to_num
568
- - dsplit
569
- - orgqr
570
- - bitwise_left_shift_
571
- - arctan2
572
- - histogram
573
- - q_zero_point
574
- - adjoint
575
- - ormqr
576
- - bitwise_right_shift_
577
- - nanquantile
578
- - lu
579
- - quantile
580
- - arctan2_
581
- - qr
582
- - diagonal_scatter
583
- - corrcoef
584
- - vsplit
585
- - aminmax
586
638
 
587
639
  torch:
588
640
  - linalg.norm
@@ -624,6 +676,7 @@ torch:
624
676
  - _batch_norm_impl_index
625
677
  - _convolution
626
678
  - _foreach_norm
679
+ - _fused_adamw_
627
680
  - _softmax_backward_data
628
681
  - abs
629
682
  - abs_
@@ -642,13 +695,14 @@ torch:
642
695
  - addmv
643
696
  - addmv_
644
697
  - addr
645
- - amax
646
698
  - affine_grid_generator
647
699
  - align_tensors
648
700
  - all
649
701
  - alpha_dropout
650
- - amin
651
702
  - alpha_dropout_
703
+ - amax
704
+ - amin
705
+ - aminmax
652
706
  - angle
653
707
  - any
654
708
  - arange
@@ -661,12 +715,14 @@ torch:
661
715
  - arcsinh
662
716
  - arcsinh_
663
717
  - arctan
718
+ - arctan2
664
719
  - arctan_
665
720
  - arctanh
666
721
  - arctanh_
667
722
  - argmax
668
723
  - argmin
669
724
  - argsort
725
+ - argwhere
670
726
  - asin
671
727
  - asin_
672
728
  - asinh
@@ -687,13 +743,13 @@ torch:
687
743
  - batch_norm_elemt
688
744
  - batch_norm_gather_stats
689
745
  - batch_norm_gather_stats_with_counts
690
- - bernoulli
691
746
  - batch_norm_stats
692
747
  - batch_norm_update_stats
748
+ - bernoulli
693
749
  - bilinear
750
+ - binary_cross_entropy_with_logits
694
751
  - bincount
695
752
  - binomial
696
- - binary_cross_entropy_with_logits
697
753
  - bitwise_and
698
754
  - bitwise_not
699
755
  - bitwise_or
@@ -739,9 +795,9 @@ torch:
739
795
  - conv_transpose1d
740
796
  - conv_transpose2d
741
797
  - conv_transpose3d
742
- - cos
743
798
  - convolution
744
799
  - copysign
800
+ - cos
745
801
  - cos_
746
802
  - cosh
747
803
  - cosh_
@@ -755,14 +811,16 @@ torch:
755
811
  - cummin
756
812
  - cumprod
757
813
  - cumsum
814
+ - cumulative_trapezoid
758
815
  - deg2rad
759
816
  - deg2rad_
760
817
  - det
761
818
  - diag
762
819
  - diag_embed
763
- - diff
764
820
  - diagflat
765
821
  - diagonal
822
+ - diagonal_scatter
823
+ - diff
766
824
  - digamma
767
825
  - dist
768
826
  - div
@@ -771,12 +829,15 @@ torch:
771
829
  - dropout
772
830
  - dropout_
773
831
  - dsmm
832
+ - dsplit
774
833
  - dstack
775
834
  - eig
776
835
  - einsum
777
836
  - embedding
778
837
  - embedding_bag
779
838
  - embedding_renorm_
839
+ - empty
840
+ - empty_like
780
841
  - eq
781
842
  - equal
782
843
  - erf
@@ -791,12 +852,12 @@ torch:
791
852
  - expm1
792
853
  - expm1_
793
854
  - eye
794
- - feature_dropout
795
855
  - feature_alpha_dropout
796
856
  - feature_alpha_dropout_
857
+ - feature_dropout
797
858
  - feature_dropout_
798
- - fix
799
859
  - fill_
860
+ - fix
800
861
  - fix_
801
862
  - flatten
802
863
  - flip
@@ -811,8 +872,9 @@ torch:
811
872
  - fmod
812
873
  - frac
813
874
  - frac_
814
- - full
875
+ - frexp
815
876
  - frobenius_norm
877
+ - full
816
878
  - full_like
817
879
  - gather
818
880
  - gcd
@@ -824,8 +886,8 @@ torch:
824
886
  - greater_equal
825
887
  - grid_sampler
826
888
  - grid_sampler_2d
827
- - group_norm
828
889
  - grid_sampler_3d
890
+ - group_norm
829
891
  - gru
830
892
  - gru_cell
831
893
  - gt
@@ -835,23 +897,29 @@ torch:
835
897
  - heaviside
836
898
  - hinge_embedding_loss
837
899
  - histc
900
+ - histogram
901
+ - histogramdd
838
902
  - hsmm
903
+ - hsplit
839
904
  - hspmm
840
905
  - hstack
841
906
  - hypot
907
+ - i0
908
+ - i0_
842
909
  - igamma
843
910
  - igammac
844
911
  - index_add
845
912
  - index_copy
846
- - inner
847
913
  - index_fill
848
914
  - index_put
849
915
  - index_put_
850
916
  - index_select
917
+ - inner
851
918
  - instance_norm
852
919
  - inverse
853
920
  - isclose
854
921
  - isfinite
922
+ - isin
855
923
  - isinf
856
924
  - isnan
857
925
  - isneginf
@@ -879,8 +947,8 @@ torch:
879
947
  - log1p_
880
948
  - log2
881
949
  - log2_
882
- - log_softmax
883
950
  - log_
951
+ - log_softmax
884
952
  - logaddexp
885
953
  - logaddexp2
886
954
  - logcumsumexp
@@ -899,18 +967,18 @@ torch:
899
967
  - lt
900
968
  - lu_solve
901
969
  - lu_unpack
902
- - masked_fill
903
970
  - margin_ranking_loss
971
+ - masked_fill
904
972
  - masked_scatter
905
973
  - masked_select
906
- - matrix_exp
907
974
  - matmul
975
+ - matrix_exp
908
976
  - matrix_power
909
977
  - matrix_rank
910
978
  - max
911
979
  - max_pool1d
912
- - max_pool2d
913
980
  - max_pool1d_with_indices
981
+ - max_pool2d
914
982
  - max_pool3d
915
983
  - maximum
916
984
  - mean
@@ -929,18 +997,20 @@ torch:
929
997
  - mvlgamma
930
998
  - nan_to_num
931
999
  - nan_to_num_
1000
+ - nanmean
932
1001
  - nanmedian
1002
+ - nanquantile
933
1003
  - nansum
934
1004
  - narrow
1005
+ - narrow_copy
935
1006
  - native_batch_norm
936
1007
  - native_group_norm
937
- - narrow_copy
938
1008
  - native_layer_norm
939
1009
  - native_norm
940
1010
  - ne
941
1011
  - neg
942
- - negative
943
1012
  - neg_
1013
+ - negative
944
1014
  - negative_
945
1015
  - nextafter
946
1016
  - nonzero
@@ -972,30 +1042,31 @@ torch:
972
1042
  - ravel
973
1043
  - real
974
1044
  - reciprocal
975
- - relu
976
1045
  - reciprocal_
1046
+ - relu
977
1047
  - relu_
978
1048
  - remainder
979
1049
  - renorm
980
1050
  - repeat_interleave
981
1051
  - reshape
982
1052
  - resize_as_
1053
+ - resolve_neg
983
1054
  - roll
984
1055
  - rot90
985
1056
  - round
986
1057
  - round_
1058
+ - row_stack
987
1059
  - rrelu
988
1060
  - rrelu_
989
1061
  - rsqrt
990
- - row_stack
991
1062
  - rsqrt_
992
1063
  - rsub
993
1064
  - saddmm
994
1065
  - scalar_tensor
995
1066
  - scatter
996
- - select
997
1067
  - scatter_add
998
1068
  - searchsorted
1069
+ - select
999
1070
  - selu
1000
1071
  - selu_
1001
1072
  - sgn
@@ -1015,12 +1086,12 @@ torch:
1015
1086
  - solve
1016
1087
  - sort
1017
1088
  - sparse_coo_tensor
1018
- - square
1019
1089
  - split
1020
1090
  - split_with_sizes
1021
1091
  - spmm
1022
1092
  - sqrt
1023
1093
  - sqrt_
1094
+ - square
1024
1095
  - square_
1025
1096
  - squeeze
1026
1097
  - sspaddmm
@@ -1042,8 +1113,8 @@ torch:
1042
1113
  - tan_
1043
1114
  - tanh
1044
1115
  - tanh_
1045
- - tensordot
1046
1116
  - tensor_split
1117
+ - tensordot
1047
1118
  - threshold
1048
1119
  - threshold_
1049
1120
  - tile
@@ -1059,19 +1130,21 @@ torch:
1059
1130
  - true_divide
1060
1131
  - trunc
1061
1132
  - trunc_
1062
- - unique_consecutive
1063
- - xlogy
1064
1133
  - unbind
1134
+ - unflatten
1135
+ - unique_consecutive
1065
1136
  - unsafe_chunk
1066
1137
  - unsafe_split
1067
- - vander
1068
- - var
1069
- - vdot
1070
1138
  - unsafe_split_with_sizes
1071
1139
  - unsqueeze
1140
+ - vander
1141
+ - var
1072
1142
  - var_mean
1143
+ - vdot
1144
+ - vsplit
1073
1145
  - vstack
1074
1146
  - where
1147
+ - xlogy
1075
1148
  - xlogy_
1076
1149
 
1077
1150
  _VF:
@@ -1165,6 +1238,28 @@ torch_npu:
1165
1238
  - npu_moe_finalize_routing
1166
1239
  - npu_moe_gating_top_k_softmax
1167
1240
  - npu_trans_quant_param
1241
+ - npu_gelu
1242
+ - npu_ffn
1243
+ - npu_quant_matmul
1244
+ - npu_format_cast_
1245
+ - npu_dynamic_quant
1246
+ - npu_moe_compute_expert_tokens
1247
+ - npu_weight_quant_batchmatmul
1248
+ - npu_dynamic_quant_asymmetric
1249
+ - npu_grouped_matmul
1250
+ - npu_quant_scatter_
1251
+ - npu_group_quant
1252
+ - npu_fused_infer_attention_score
1253
+ - npu_quantize
1254
+ - npu_fast_gelu
1255
+ - npu_weight_quant_batchmatmul
1256
+ - scatter_update
1257
+ - scatter_update_
1258
+ - npu_moe_init_routing
1259
+ - npu_scatter_nd_update_
1260
+ - npu_scatter_nd_update
1261
+ - npu_prefetch
1262
+ - npu_dynamic_block_quant
1168
1263
 
1169
1264
  aten:
1170
1265
  - signbit
@@ -1912,4 +2007,27 @@ distributed:
1912
2007
  - all_to_all
1913
2008
  - all_gather_into_tensor
1914
2009
  - reduce_scatter_tensor
1915
- - batch_isend_irecv
2010
+ - batch_isend_irecv
2011
+
2012
+ npu_distributed:
2013
+ - isend
2014
+ - irecv
2015
+
2016
+ mindspeed:
2017
+ - dropout_add_layer_norm.npu_dropout_add_layer_norm
2018
+ - npu_rotary_position_embedding.npu_rotary_position_embedding
2019
+ - fusion_attention_v2.npu_fusion_attention
2020
+ - npu_mm_all_reduce_add_rms_norm.npu_mm_all_reduce_add_rms_norm
2021
+ - npu_mm_all_reduce_add_rms_norm_.npu_mm_all_reduce_add_rms_norm_
2022
+ - gmm.npu_gmm
2023
+ - gmm.npu_gmm_v2
2024
+ - npu_grouped_mat_mul_all_reduce.npu_grouped_mat_mul_all_reduce
2025
+ - ffn.npu_ffn
2026
+ - npu_moe_token_permute.npu_moe_token_permute
2027
+ - npu_moe_token_unpermute.npu_moe_token_unpermute
2028
+ - npu_ring_attention_update.npu_ring_attention_update
2029
+ - npu_matmul_add.npu_matmul_add_fp32
2030
+ - npu_groupmatmul_add.npu_groupmatmul_add_fp32
2031
+ - quant_gmm.npu_quant_gmm
2032
+ - quant_gmm.npu_quant_gmm_v2
2033
+ - npu_apply_fused_ema_adamw.npu_apply_fused_ema_adamw