mindstudio-probe 1.2.2__py3-none-any.whl → 8.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/METADATA +4 -3
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/RECORD +243 -191
- msprobe/README.md +57 -21
- msprobe/core/__init__.py +17 -0
- msprobe/core/common/const.py +224 -82
- msprobe/core/common/decorator.py +50 -0
- msprobe/core/common/exceptions.py +5 -3
- msprobe/core/common/file_utils.py +274 -40
- msprobe/core/common/framework_adapter.py +169 -0
- msprobe/core/common/global_lock.py +86 -0
- msprobe/core/common/runtime.py +25 -0
- msprobe/core/common/utils.py +148 -72
- msprobe/core/common_config.py +7 -0
- msprobe/core/compare/acc_compare.py +640 -462
- msprobe/core/compare/check.py +36 -107
- msprobe/core/compare/compare_cli.py +4 -0
- msprobe/core/compare/config.py +72 -0
- msprobe/core/compare/highlight.py +217 -215
- msprobe/core/compare/layer_mapping/layer_mapping.py +4 -1
- msprobe/core/compare/merge_result/merge_result.py +12 -6
- msprobe/core/compare/multiprocessing_compute.py +227 -107
- msprobe/core/compare/npy_compare.py +32 -16
- msprobe/core/compare/utils.py +218 -244
- msprobe/{mindspore/runtime.py → core/config_check/__init__.py} +2 -4
- msprobe/{pytorch/dump/kernel_dump/kernel_config.py → core/config_check/checkers/__init__.py} +8 -16
- msprobe/core/config_check/checkers/base_checker.py +60 -0
- msprobe/core/config_check/checkers/dataset_checker.py +138 -0
- msprobe/core/config_check/checkers/env_args_checker.py +96 -0
- msprobe/core/config_check/checkers/hyperparameter_checker.py +170 -0
- msprobe/core/config_check/checkers/pip_checker.py +90 -0
- msprobe/core/config_check/checkers/random_checker.py +367 -0
- msprobe/core/config_check/checkers/weights_checker.py +147 -0
- msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +74 -0
- msprobe/core/config_check/ckpt_compare/megatron_loader.py +302 -0
- msprobe/core/config_check/ckpt_compare/metrics.py +83 -0
- msprobe/core/config_check/ckpt_compare/name_mapping.yaml +12 -0
- msprobe/core/config_check/config_check_cli.py +51 -0
- msprobe/core/config_check/config_checker.py +100 -0
- msprobe/{pytorch/parse.py → core/config_check/resource/dependency.yaml} +7 -4
- msprobe/core/config_check/resource/env.yaml +57 -0
- msprobe/core/config_check/resource/hyperparameter.yaml +21 -0
- msprobe/core/config_check/utils/hyperparameter_parser.py +115 -0
- msprobe/core/config_check/utils/utils.py +107 -0
- msprobe/core/data_dump/api_registry.py +239 -0
- msprobe/core/data_dump/data_collector.py +36 -9
- msprobe/core/data_dump/data_processor/base.py +74 -53
- msprobe/core/data_dump/data_processor/mindspore_processor.py +119 -78
- msprobe/core/data_dump/data_processor/pytorch_processor.py +134 -96
- msprobe/core/data_dump/json_writer.py +146 -57
- msprobe/core/debugger/precision_debugger.py +143 -0
- msprobe/core/grad_probe/constant.py +2 -1
- msprobe/core/grad_probe/grad_compare.py +2 -2
- msprobe/core/grad_probe/utils.py +1 -1
- msprobe/core/hook_manager.py +242 -0
- msprobe/core/monitor/anomaly_processor.py +384 -0
- msprobe/core/overflow_check/abnormal_scene.py +2 -0
- msprobe/core/service.py +356 -0
- msprobe/core/single_save/__init__.py +0 -0
- msprobe/core/single_save/single_comparator.py +243 -0
- msprobe/core/single_save/single_saver.py +157 -0
- msprobe/docs/01.installation.md +6 -5
- msprobe/docs/02.config_introduction.md +89 -30
- msprobe/docs/03.config_examples.md +1 -0
- msprobe/docs/04.kernel_dump_PyTorch.md +1 -1
- msprobe/docs/05.data_dump_PyTorch.md +184 -50
- msprobe/docs/06.data_dump_MindSpore.md +193 -28
- msprobe/docs/07.accuracy_checker_PyTorch.md +13 -3
- msprobe/docs/08.accuracy_checker_online_PyTorch.md +72 -10
- msprobe/docs/09.accuracy_checker_MindSpore.md +19 -7
- msprobe/docs/10.accuracy_compare_PyTorch.md +266 -102
- msprobe/docs/11.accuracy_compare_MindSpore.md +117 -43
- msprobe/docs/12.overflow_check_PyTorch.md +5 -3
- msprobe/docs/13.overflow_check_MindSpore.md +6 -4
- msprobe/docs/14.data_parse_PyTorch.md +4 -10
- msprobe/docs/17.grad_probe.md +2 -1
- msprobe/docs/18.online_dispatch.md +3 -3
- msprobe/docs/19.monitor.md +211 -103
- msprobe/docs/21.visualization_PyTorch.md +100 -28
- msprobe/docs/22.visualization_MindSpore.md +103 -31
- msprobe/docs/23.generate_operator_PyTorch.md +9 -9
- msprobe/docs/25.tool_function_introduction.md +23 -22
- msprobe/docs/26.data_dump_PyTorch_baseline.md +14 -3
- msprobe/docs/27.dump_json_instruction.md +278 -8
- msprobe/docs/28.debugger_save_instruction.md +111 -20
- msprobe/docs/28.kernel_dump_MindSpore.md +1 -1
- msprobe/docs/29.data_dump_MSAdapter.md +229 -0
- msprobe/docs/30.overflow_check_MSAdapter.md +31 -0
- msprobe/docs/31.config_check.md +95 -0
- msprobe/docs/32.ckpt_compare.md +69 -0
- msprobe/docs/33.generate_operator_MindSpore.md +190 -0
- msprobe/docs/34.RL_collect.md +92 -0
- msprobe/docs/35.nan_analyze.md +72 -0
- msprobe/docs/FAQ.md +3 -11
- msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +12 -1
- msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +3 -1
- msprobe/docs/img/compare_result.png +0 -0
- msprobe/docs/img/merge_result.png +0 -0
- msprobe/docs/img/save_compare_result_sample.png +0 -0
- msprobe/docs/img/visualization/proxy.png +0 -0
- msprobe/docs/img/visualization/vis_browser_1.png +0 -0
- msprobe/docs/img/visualization/vis_match_info.png +0 -0
- msprobe/docs/img/visualization/vis_precision_info.png +0 -0
- msprobe/docs/img/visualization/vis_search_info.png +0 -0
- msprobe/docs/img/visualization/vis_show_info.png +0 -0
- msprobe/docs/img/visualization/vis_showcase.png +0 -0
- msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
- msprobe/mindspore/__init__.py +3 -3
- msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +151 -55
- msprobe/mindspore/api_accuracy_checker/api_runner.py +25 -11
- msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +2 -1
- msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +580 -0
- msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +41 -0
- msprobe/mindspore/api_accuracy_checker/cmd_parser.py +4 -0
- msprobe/mindspore/api_accuracy_checker/data_manager.py +4 -3
- msprobe/mindspore/api_accuracy_checker/generate_op_script/config_op.json +9 -0
- msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +451 -0
- msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +2081 -0
- msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +11 -1
- msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +2 -1
- msprobe/mindspore/cell_processor.py +204 -33
- msprobe/mindspore/code_mapping/graph_parser.py +4 -21
- msprobe/mindspore/common/const.py +73 -2
- msprobe/mindspore/common/utils.py +157 -29
- msprobe/mindspore/compare/common_dir_compare.py +382 -0
- msprobe/mindspore/compare/distributed_compare.py +2 -26
- msprobe/mindspore/compare/ms_compare.py +18 -398
- msprobe/mindspore/compare/ms_graph_compare.py +20 -10
- msprobe/mindspore/compare/utils.py +37 -0
- msprobe/mindspore/debugger/debugger_config.py +59 -7
- msprobe/mindspore/debugger/precision_debugger.py +83 -90
- msprobe/mindspore/dump/cell_dump_process.py +902 -0
- msprobe/mindspore/dump/cell_dump_with_insert_gradient.py +889 -0
- msprobe/mindspore/dump/dump_tool_factory.py +18 -8
- msprobe/mindspore/dump/graph_mode_cell_dump.py +139 -0
- msprobe/mindspore/dump/graph_tensor_dump.py +123 -0
- msprobe/mindspore/dump/hook_cell/api_register.py +176 -0
- msprobe/mindspore/dump/hook_cell/hook_cell.py +22 -12
- msprobe/mindspore/dump/hook_cell/ms_hook_manager.py +88 -0
- msprobe/mindspore/dump/hook_cell/primitive_hooks.py +8 -2
- msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +42 -26
- msprobe/mindspore/dump/jit_dump.py +35 -27
- msprobe/mindspore/dump/kernel_kbyk_dump.py +6 -3
- msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +110 -0
- msprobe/mindspore/dym_loader/hook_dynamic_loader.h +15 -16
- msprobe/mindspore/free_benchmark/api_pynative_self_check.py +22 -12
- msprobe/mindspore/free_benchmark/common/utils.py +1 -1
- msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +4 -2
- msprobe/mindspore/free_benchmark/self_check_tool_factory.py +6 -3
- msprobe/mindspore/grad_probe/global_context.py +9 -2
- msprobe/mindspore/grad_probe/grad_analyzer.py +2 -1
- msprobe/mindspore/grad_probe/grad_stat_csv.py +3 -2
- msprobe/mindspore/grad_probe/hook.py +2 -4
- msprobe/mindspore/mindspore_service.py +111 -0
- msprobe/mindspore/monitor/common_func.py +52 -0
- msprobe/mindspore/monitor/data_writers.py +237 -0
- msprobe/mindspore/monitor/distributed/wrap_distributed.py +1 -1
- msprobe/mindspore/monitor/features.py +13 -1
- msprobe/mindspore/monitor/module_hook.py +568 -444
- msprobe/mindspore/monitor/optimizer_collect.py +331 -0
- msprobe/mindspore/monitor/utils.py +71 -9
- msprobe/mindspore/ms_config.py +16 -15
- msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +5 -3
- msprobe/mindspore/task_handler_factory.py +5 -2
- msprobe/msprobe.py +19 -0
- msprobe/nan_analyze/__init__.py +14 -0
- msprobe/nan_analyze/analyzer.py +255 -0
- msprobe/nan_analyze/graph.py +189 -0
- msprobe/nan_analyze/utils.py +211 -0
- msprobe/pytorch/api_accuracy_checker/common/config.py +2 -2
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +3 -6
- msprobe/pytorch/api_accuracy_checker/compare/compare.py +36 -34
- msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +15 -13
- msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +206 -4
- msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +9 -9
- msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +6 -5
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +31 -9
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +28 -20
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +3 -1
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +29 -13
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +12 -2
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +45 -31
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +154 -0
- msprobe/pytorch/attl_manager.py +65 -0
- msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +6 -0
- msprobe/pytorch/bench_functions/npu_fusion_attention.py +27 -0
- msprobe/pytorch/common/utils.py +53 -19
- msprobe/pytorch/compare/distributed_compare.py +4 -36
- msprobe/pytorch/compare/pt_compare.py +13 -84
- msprobe/pytorch/compare/utils.py +47 -0
- msprobe/pytorch/debugger/debugger_config.py +34 -17
- msprobe/pytorch/debugger/precision_debugger.py +50 -96
- msprobe/pytorch/dump/module_dump/hook_wrapper.py +93 -0
- msprobe/pytorch/dump/module_dump/module_dump.py +15 -61
- msprobe/pytorch/dump/module_dump/module_processer.py +150 -114
- msprobe/pytorch/free_benchmark/common/utils.py +1 -1
- msprobe/pytorch/free_benchmark/compare/single_benchmark.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +3 -3
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +3 -3
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +1 -1
- msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +1 -1
- msprobe/pytorch/function_factory.py +1 -1
- msprobe/pytorch/grad_probe/grad_monitor.py +2 -2
- msprobe/pytorch/grad_probe/grad_stat_csv.py +3 -2
- msprobe/pytorch/hook_module/api_register.py +155 -0
- msprobe/pytorch/hook_module/hook_module.py +18 -22
- msprobe/pytorch/hook_module/jit_script_wrapper.py +33 -0
- msprobe/pytorch/hook_module/pt_hook_manager.py +68 -0
- msprobe/pytorch/hook_module/register_optimizer_hook.py +2 -1
- msprobe/pytorch/hook_module/support_wrap_ops.yaml +193 -75
- msprobe/pytorch/hook_module/utils.py +28 -2
- msprobe/pytorch/monitor/csv2tb.py +14 -4
- msprobe/pytorch/monitor/data_writers.py +259 -0
- msprobe/pytorch/monitor/distributed/wrap_distributed.py +8 -2
- msprobe/pytorch/monitor/module_hook.py +336 -241
- msprobe/pytorch/monitor/module_metric.py +17 -0
- msprobe/pytorch/monitor/optimizer_collect.py +244 -224
- msprobe/pytorch/monitor/utils.py +84 -4
- msprobe/pytorch/online_dispatch/compare.py +0 -2
- msprobe/pytorch/online_dispatch/dispatch.py +13 -2
- msprobe/pytorch/online_dispatch/dump_compare.py +8 -2
- msprobe/pytorch/online_dispatch/utils.py +3 -0
- msprobe/pytorch/parse_tool/lib/interactive_cli.py +1 -6
- msprobe/pytorch/parse_tool/lib/utils.py +5 -4
- msprobe/pytorch/pt_config.py +16 -11
- msprobe/pytorch/pytorch_service.py +70 -0
- msprobe/visualization/builder/graph_builder.py +69 -10
- msprobe/visualization/builder/msprobe_adapter.py +24 -12
- msprobe/visualization/compare/graph_comparator.py +63 -51
- msprobe/visualization/compare/mode_adapter.py +22 -20
- msprobe/visualization/graph/base_node.py +11 -4
- msprobe/visualization/graph/distributed_analyzer.py +1 -10
- msprobe/visualization/graph/graph.py +2 -13
- msprobe/visualization/graph/node_op.py +1 -2
- msprobe/visualization/graph_service.py +251 -104
- msprobe/visualization/utils.py +26 -44
- msprobe/mindspore/dump/hook_cell/api_registry.py +0 -207
- msprobe/mindspore/dump/hook_cell/wrap_api.py +0 -212
- msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +0 -140
- msprobe/mindspore/monitor/anomaly_detect.py +0 -404
- msprobe/mindspore/monitor/module_spec_verifier.py +0 -94
- msprobe/mindspore/service.py +0 -543
- msprobe/pytorch/hook_module/api_registry.py +0 -166
- msprobe/pytorch/hook_module/wrap_distributed.py +0 -79
- msprobe/pytorch/hook_module/wrap_functional.py +0 -66
- msprobe/pytorch/hook_module/wrap_npu_custom.py +0 -85
- msprobe/pytorch/hook_module/wrap_tensor.py +0 -69
- msprobe/pytorch/hook_module/wrap_torch.py +0 -84
- msprobe/pytorch/hook_module/wrap_vf.py +0 -60
- msprobe/pytorch/monitor/anomaly_analyse.py +0 -201
- msprobe/pytorch/monitor/anomaly_detect.py +0 -410
- msprobe/pytorch/monitor/module_spec_verifier.py +0 -95
- msprobe/pytorch/monitor/unittest/test_monitor.py +0 -160
- msprobe/pytorch/service.py +0 -470
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/LICENSE +0 -0
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/WHEEL +0 -0
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/entry_points.txt +0 -0
- {mindstudio_probe-1.2.2.dist-info → mindstudio_probe-8.1.0.dist-info}/top_level.txt +0 -0
- /msprobe/{mindspore → core}/compare/ms_to_pt_api.yaml +0 -0
- /msprobe/{mindspore/dump → core}/kernel_dump/kernel_config.py +0 -0
- /msprobe/{pytorch/monitor/unittest → core/monitor}/__init__.py +0 -0
|
@@ -149,9 +149,9 @@ tensor:
|
|
|
149
149
|
- __bool__
|
|
150
150
|
- __div__
|
|
151
151
|
- __eq__
|
|
152
|
+
- __floordiv__
|
|
152
153
|
- __ge__
|
|
153
154
|
- __gt__
|
|
154
|
-
- __getitem__
|
|
155
155
|
- __iadd__
|
|
156
156
|
- __iand__
|
|
157
157
|
- __idiv__
|
|
@@ -160,23 +160,33 @@ tensor:
|
|
|
160
160
|
- __imod__
|
|
161
161
|
- __imul__
|
|
162
162
|
- __ior__
|
|
163
|
+
- __ipow__
|
|
163
164
|
- __irshift__
|
|
164
165
|
- __isub__
|
|
165
166
|
- __ixor__
|
|
167
|
+
- __le__
|
|
166
168
|
- __lshift__
|
|
169
|
+
- __lt__
|
|
167
170
|
- __matmul__
|
|
168
171
|
- __mod__
|
|
169
172
|
- __mul__
|
|
173
|
+
- __ne__
|
|
170
174
|
- __nonzero__
|
|
171
175
|
- __or__
|
|
176
|
+
- __pow__
|
|
172
177
|
- __radd__
|
|
178
|
+
- __rdiv__
|
|
179
|
+
- __rmod__
|
|
173
180
|
- __rmul__
|
|
181
|
+
- __ror__
|
|
182
|
+
- __rpow__
|
|
174
183
|
- __rshift__
|
|
184
|
+
- __rsub__
|
|
185
|
+
- __rxor__
|
|
175
186
|
- __setitem__
|
|
176
187
|
- __sub__
|
|
177
188
|
- __truediv__
|
|
178
189
|
- __xor__
|
|
179
|
-
- __pow__
|
|
180
190
|
- abs
|
|
181
191
|
- abs_
|
|
182
192
|
- absolute
|
|
@@ -199,12 +209,14 @@ tensor:
|
|
|
199
209
|
- addmv_
|
|
200
210
|
- addr
|
|
201
211
|
- addr_
|
|
212
|
+
- adjoint
|
|
202
213
|
- align_as
|
|
203
214
|
- align_to
|
|
204
215
|
- all
|
|
205
216
|
- allclose
|
|
206
217
|
- amax
|
|
207
218
|
- amin
|
|
219
|
+
- aminmax
|
|
208
220
|
- angle
|
|
209
221
|
- any
|
|
210
222
|
- arccos
|
|
@@ -216,12 +228,15 @@ tensor:
|
|
|
216
228
|
- arcsinh
|
|
217
229
|
- arcsinh_
|
|
218
230
|
- arctan
|
|
231
|
+
- arctan2
|
|
232
|
+
- arctan2_
|
|
219
233
|
- arctan_
|
|
220
234
|
- arctanh
|
|
221
235
|
- arctanh_
|
|
222
236
|
- argmax
|
|
223
237
|
- argmin
|
|
224
238
|
- argsort
|
|
239
|
+
- argwhere
|
|
225
240
|
- asin
|
|
226
241
|
- asin_
|
|
227
242
|
- asinh
|
|
@@ -236,39 +251,51 @@ tensor:
|
|
|
236
251
|
- baddbmm_
|
|
237
252
|
- bernoulli
|
|
238
253
|
- bernoulli_
|
|
254
|
+
- bfloat16
|
|
239
255
|
- bincount
|
|
240
256
|
- bitwise_and
|
|
241
257
|
- bitwise_and_
|
|
258
|
+
- bitwise_left_shift
|
|
259
|
+
- bitwise_left_shift_
|
|
242
260
|
- bitwise_not
|
|
243
261
|
- bitwise_not_
|
|
244
262
|
- bitwise_or
|
|
245
263
|
- bitwise_or_
|
|
264
|
+
- bitwise_right_shift
|
|
265
|
+
- bitwise_right_shift_
|
|
246
266
|
- bitwise_xor
|
|
247
267
|
- bitwise_xor_
|
|
248
268
|
- bmm
|
|
269
|
+
- bool
|
|
249
270
|
- broadcast_to
|
|
271
|
+
- byte
|
|
250
272
|
- cauchy_
|
|
251
273
|
- ceil
|
|
252
274
|
- ceil_
|
|
275
|
+
- cfloat
|
|
276
|
+
- char
|
|
253
277
|
- cholesky
|
|
278
|
+
- cholesky_inverse
|
|
279
|
+
- cholesky_solve
|
|
254
280
|
- chunk
|
|
255
281
|
- clamp
|
|
256
|
-
- cholesky_solve
|
|
257
|
-
- cholesky_inverse
|
|
258
282
|
- clamp_
|
|
259
283
|
- clamp_max
|
|
260
284
|
- clamp_max_
|
|
261
|
-
- clip
|
|
262
285
|
- clamp_min
|
|
263
286
|
- clamp_min_
|
|
287
|
+
- clip
|
|
264
288
|
- clip_
|
|
289
|
+
- conj_physical
|
|
265
290
|
- copysign
|
|
266
291
|
- copysign_
|
|
292
|
+
- corrcoef
|
|
267
293
|
- cos
|
|
268
294
|
- cos_
|
|
269
295
|
- cosh
|
|
270
296
|
- cosh_
|
|
271
297
|
- count_nonzero
|
|
298
|
+
- cov
|
|
272
299
|
- cummax
|
|
273
300
|
- cummin
|
|
274
301
|
- cumprod
|
|
@@ -282,20 +309,23 @@ tensor:
|
|
|
282
309
|
- diag_embed
|
|
283
310
|
- diagflat
|
|
284
311
|
- diagonal
|
|
312
|
+
- diagonal_scatter
|
|
285
313
|
- diff
|
|
286
|
-
- dist
|
|
287
314
|
- digamma
|
|
288
315
|
- digamma_
|
|
316
|
+
- dist
|
|
289
317
|
- div
|
|
290
318
|
- div_
|
|
291
319
|
- divide
|
|
292
320
|
- divide_
|
|
293
321
|
- dot
|
|
322
|
+
- double
|
|
323
|
+
- dsplit
|
|
294
324
|
- eig
|
|
295
325
|
- eq
|
|
296
326
|
- eq_
|
|
297
|
-
- erf
|
|
298
327
|
- equal
|
|
328
|
+
- erf
|
|
299
329
|
- erf_
|
|
300
330
|
- erfc
|
|
301
331
|
- erfc_
|
|
@@ -304,18 +334,21 @@ tensor:
|
|
|
304
334
|
- exp
|
|
305
335
|
- exp2
|
|
306
336
|
- exp2_
|
|
307
|
-
- expm1
|
|
308
337
|
- exp_
|
|
338
|
+
- expand
|
|
339
|
+
- expand_as
|
|
340
|
+
- expm1
|
|
309
341
|
- expm1_
|
|
310
342
|
- exponential_
|
|
311
343
|
- fill_
|
|
312
|
-
- fix
|
|
313
344
|
- fill_diagonal_
|
|
345
|
+
- fix
|
|
314
346
|
- fix_
|
|
347
|
+
- flatten
|
|
315
348
|
- flip
|
|
316
349
|
- fliplr
|
|
317
|
-
- flatten
|
|
318
350
|
- flipud
|
|
351
|
+
- float
|
|
319
352
|
- float_power
|
|
320
353
|
- float_power_
|
|
321
354
|
- floor
|
|
@@ -328,6 +361,7 @@ tensor:
|
|
|
328
361
|
- fmod_
|
|
329
362
|
- frac
|
|
330
363
|
- frac_
|
|
364
|
+
- frexp
|
|
331
365
|
- gather
|
|
332
366
|
- gcd
|
|
333
367
|
- gcd_
|
|
@@ -338,31 +372,37 @@ tensor:
|
|
|
338
372
|
- ger
|
|
339
373
|
- greater
|
|
340
374
|
- greater_
|
|
341
|
-
- gt
|
|
342
|
-
- gt_
|
|
343
375
|
- greater_equal
|
|
344
376
|
- greater_equal_
|
|
377
|
+
- gt
|
|
378
|
+
- gt_
|
|
379
|
+
- half
|
|
345
380
|
- hardshrink
|
|
346
381
|
- heaviside
|
|
347
382
|
- heaviside_
|
|
348
383
|
- histc
|
|
384
|
+
- histogram
|
|
385
|
+
- hsplit
|
|
349
386
|
- hypot
|
|
350
387
|
- hypot_
|
|
388
|
+
- i0
|
|
389
|
+
- i0_
|
|
351
390
|
- igamma
|
|
352
391
|
- igamma_
|
|
353
392
|
- igammac
|
|
354
393
|
- igammac_
|
|
355
394
|
- index_add
|
|
356
395
|
- index_add_
|
|
357
|
-
- inverse
|
|
358
396
|
- index_copy
|
|
359
397
|
- index_copy_
|
|
360
398
|
- index_fill
|
|
361
399
|
- index_fill_
|
|
362
400
|
- index_put
|
|
363
401
|
- index_put_
|
|
364
|
-
- inner
|
|
365
402
|
- index_select
|
|
403
|
+
- inner
|
|
404
|
+
- int
|
|
405
|
+
- inverse
|
|
366
406
|
- isclose
|
|
367
407
|
- isfinite
|
|
368
408
|
- isinf
|
|
@@ -380,7 +420,6 @@ tensor:
|
|
|
380
420
|
- le_
|
|
381
421
|
- lerp
|
|
382
422
|
- lerp_
|
|
383
|
-
- where
|
|
384
423
|
- less
|
|
385
424
|
- less_
|
|
386
425
|
- less_equal
|
|
@@ -397,43 +436,47 @@ tensor:
|
|
|
397
436
|
- log_
|
|
398
437
|
- log_normal_
|
|
399
438
|
- log_softmax
|
|
400
|
-
- logcumsumexp
|
|
401
|
-
- logdet
|
|
402
439
|
- logaddexp
|
|
403
440
|
- logaddexp2
|
|
441
|
+
- logcumsumexp
|
|
442
|
+
- logdet
|
|
404
443
|
- logical_and
|
|
405
444
|
- logical_and_
|
|
406
445
|
- logical_not
|
|
407
|
-
- logit
|
|
408
446
|
- logical_not_
|
|
409
447
|
- logical_or
|
|
410
448
|
- logical_or_
|
|
411
449
|
- logical_xor
|
|
412
450
|
- logical_xor_
|
|
451
|
+
- logit
|
|
413
452
|
- logit_
|
|
414
453
|
- logsumexp
|
|
454
|
+
- long
|
|
415
455
|
- lstsq
|
|
416
456
|
- lt
|
|
417
457
|
- lt_
|
|
458
|
+
- lu
|
|
418
459
|
- lu_solve
|
|
419
460
|
- map2_
|
|
420
461
|
- map_
|
|
421
462
|
- masked_fill
|
|
422
|
-
- matmul
|
|
423
463
|
- masked_fill_
|
|
424
464
|
- masked_scatter
|
|
425
465
|
- masked_scatter_
|
|
426
466
|
- masked_select
|
|
467
|
+
- matmul
|
|
427
468
|
- matrix_exp
|
|
469
|
+
- matrix_power
|
|
428
470
|
- max
|
|
429
471
|
- maximum
|
|
430
472
|
- mean
|
|
431
|
-
- matrix_power
|
|
432
473
|
- median
|
|
433
474
|
- min
|
|
434
475
|
- minimum
|
|
435
476
|
- mm
|
|
436
477
|
- mode
|
|
478
|
+
- moveaxis
|
|
479
|
+
- movedim
|
|
437
480
|
- msort
|
|
438
481
|
- mul
|
|
439
482
|
- mul_
|
|
@@ -443,6 +486,11 @@ tensor:
|
|
|
443
486
|
- mv
|
|
444
487
|
- mvlgamma
|
|
445
488
|
- mvlgamma_
|
|
489
|
+
- nan_to_num
|
|
490
|
+
- nan_to_num_
|
|
491
|
+
- nanmean
|
|
492
|
+
- nanmedian
|
|
493
|
+
- nanquantile
|
|
446
494
|
- nansum
|
|
447
495
|
- narrow
|
|
448
496
|
- narrow_copy
|
|
@@ -452,20 +500,29 @@ tensor:
|
|
|
452
500
|
- neg_
|
|
453
501
|
- negative
|
|
454
502
|
- negative_
|
|
503
|
+
- nextafter
|
|
504
|
+
- nextafter_
|
|
455
505
|
- nonzero
|
|
456
506
|
- norm
|
|
457
507
|
- normal_
|
|
458
508
|
- not_equal
|
|
459
509
|
- not_equal_
|
|
510
|
+
- numpy
|
|
511
|
+
- orgqr
|
|
512
|
+
- ormqr
|
|
513
|
+
- outer
|
|
460
514
|
- permute
|
|
461
515
|
- pinverse
|
|
462
516
|
- polygamma
|
|
517
|
+
- polygamma_
|
|
463
518
|
- pow
|
|
464
519
|
- pow_
|
|
465
|
-
- polygamma_
|
|
466
520
|
- prelu
|
|
467
521
|
- prod
|
|
468
522
|
- put_
|
|
523
|
+
- q_zero_point
|
|
524
|
+
- qr
|
|
525
|
+
- quantile
|
|
469
526
|
- rad2deg
|
|
470
527
|
- rad2deg_
|
|
471
528
|
- ravel
|
|
@@ -474,15 +531,16 @@ tensor:
|
|
|
474
531
|
- relu
|
|
475
532
|
- relu_
|
|
476
533
|
- remainder
|
|
477
|
-
- repeat_interleave
|
|
478
|
-
- reshape
|
|
479
534
|
- remainder_
|
|
480
535
|
- renorm
|
|
481
536
|
- renorm_
|
|
482
537
|
- repeat
|
|
538
|
+
- repeat_interleave
|
|
539
|
+
- reshape
|
|
483
540
|
- reshape_as
|
|
484
541
|
- resize_
|
|
485
542
|
- resize_as_
|
|
543
|
+
- resolve_neg
|
|
486
544
|
- roll
|
|
487
545
|
- rot90
|
|
488
546
|
- round
|
|
@@ -496,6 +554,7 @@ tensor:
|
|
|
496
554
|
- select
|
|
497
555
|
- sgn
|
|
498
556
|
- sgn_
|
|
557
|
+
- short
|
|
499
558
|
- sigmoid
|
|
500
559
|
- sigmoid_
|
|
501
560
|
- sign
|
|
@@ -507,11 +566,13 @@ tensor:
|
|
|
507
566
|
- sinc_
|
|
508
567
|
- sinh
|
|
509
568
|
- sinh_
|
|
569
|
+
- slice_scatter
|
|
510
570
|
- slogdet
|
|
511
571
|
- smm
|
|
512
572
|
- softmax
|
|
513
573
|
- solve
|
|
514
574
|
- sort
|
|
575
|
+
- split
|
|
515
576
|
- split_with_sizes
|
|
516
577
|
- sqrt
|
|
517
578
|
- sqrt_
|
|
@@ -521,21 +582,29 @@ tensor:
|
|
|
521
582
|
- squeeze_
|
|
522
583
|
- sspaddmm
|
|
523
584
|
- std
|
|
585
|
+
- stft
|
|
586
|
+
- stride
|
|
524
587
|
- sub
|
|
525
588
|
- sub_
|
|
589
|
+
- subtract
|
|
526
590
|
- sum
|
|
527
591
|
- sum_to_size
|
|
528
592
|
- svd
|
|
593
|
+
- swapaxes
|
|
594
|
+
- swapdims
|
|
595
|
+
- swapdims_
|
|
529
596
|
- symeig
|
|
530
597
|
- t
|
|
531
598
|
- t_
|
|
532
599
|
- take
|
|
600
|
+
- take_along_dim
|
|
533
601
|
- tan
|
|
534
602
|
- tan_
|
|
535
603
|
- tanh
|
|
536
604
|
- tanh_
|
|
537
605
|
- tensor_split
|
|
538
606
|
- tile
|
|
607
|
+
- to
|
|
539
608
|
- topk
|
|
540
609
|
- transpose
|
|
541
610
|
- transpose_
|
|
@@ -543,8 +612,8 @@ tensor:
|
|
|
543
612
|
- tril
|
|
544
613
|
- tril_
|
|
545
614
|
- triu
|
|
546
|
-
- true_divide
|
|
547
615
|
- triu_
|
|
616
|
+
- true_divide
|
|
548
617
|
- true_divide_
|
|
549
618
|
- trunc
|
|
550
619
|
- trunc_
|
|
@@ -552,37 +621,20 @@ tensor:
|
|
|
552
621
|
- unbind
|
|
553
622
|
- unflatten
|
|
554
623
|
- unfold
|
|
624
|
+
- unique
|
|
625
|
+
- unique_consecutive
|
|
555
626
|
- unsafe_chunk
|
|
556
|
-
- unsqueeze
|
|
557
627
|
- unsafe_split
|
|
558
628
|
- unsafe_split_with_sizes
|
|
629
|
+
- unsqueeze
|
|
630
|
+
- unsqueeze_
|
|
559
631
|
- var
|
|
560
632
|
- vdot
|
|
561
|
-
- unsqueeze_
|
|
562
633
|
- view_as
|
|
634
|
+
- vsplit
|
|
635
|
+
- where
|
|
563
636
|
- xlogy
|
|
564
637
|
- xlogy_
|
|
565
|
-
- split
|
|
566
|
-
- stft
|
|
567
|
-
- nan_to_num
|
|
568
|
-
- dsplit
|
|
569
|
-
- orgqr
|
|
570
|
-
- bitwise_left_shift_
|
|
571
|
-
- arctan2
|
|
572
|
-
- histogram
|
|
573
|
-
- q_zero_point
|
|
574
|
-
- adjoint
|
|
575
|
-
- ormqr
|
|
576
|
-
- bitwise_right_shift_
|
|
577
|
-
- nanquantile
|
|
578
|
-
- lu
|
|
579
|
-
- quantile
|
|
580
|
-
- arctan2_
|
|
581
|
-
- qr
|
|
582
|
-
- diagonal_scatter
|
|
583
|
-
- corrcoef
|
|
584
|
-
- vsplit
|
|
585
|
-
- aminmax
|
|
586
638
|
|
|
587
639
|
torch:
|
|
588
640
|
- linalg.norm
|
|
@@ -624,6 +676,7 @@ torch:
|
|
|
624
676
|
- _batch_norm_impl_index
|
|
625
677
|
- _convolution
|
|
626
678
|
- _foreach_norm
|
|
679
|
+
- _fused_adamw_
|
|
627
680
|
- _softmax_backward_data
|
|
628
681
|
- abs
|
|
629
682
|
- abs_
|
|
@@ -642,13 +695,14 @@ torch:
|
|
|
642
695
|
- addmv
|
|
643
696
|
- addmv_
|
|
644
697
|
- addr
|
|
645
|
-
- amax
|
|
646
698
|
- affine_grid_generator
|
|
647
699
|
- align_tensors
|
|
648
700
|
- all
|
|
649
701
|
- alpha_dropout
|
|
650
|
-
- amin
|
|
651
702
|
- alpha_dropout_
|
|
703
|
+
- amax
|
|
704
|
+
- amin
|
|
705
|
+
- aminmax
|
|
652
706
|
- angle
|
|
653
707
|
- any
|
|
654
708
|
- arange
|
|
@@ -661,12 +715,14 @@ torch:
|
|
|
661
715
|
- arcsinh
|
|
662
716
|
- arcsinh_
|
|
663
717
|
- arctan
|
|
718
|
+
- arctan2
|
|
664
719
|
- arctan_
|
|
665
720
|
- arctanh
|
|
666
721
|
- arctanh_
|
|
667
722
|
- argmax
|
|
668
723
|
- argmin
|
|
669
724
|
- argsort
|
|
725
|
+
- argwhere
|
|
670
726
|
- asin
|
|
671
727
|
- asin_
|
|
672
728
|
- asinh
|
|
@@ -687,13 +743,13 @@ torch:
|
|
|
687
743
|
- batch_norm_elemt
|
|
688
744
|
- batch_norm_gather_stats
|
|
689
745
|
- batch_norm_gather_stats_with_counts
|
|
690
|
-
- bernoulli
|
|
691
746
|
- batch_norm_stats
|
|
692
747
|
- batch_norm_update_stats
|
|
748
|
+
- bernoulli
|
|
693
749
|
- bilinear
|
|
750
|
+
- binary_cross_entropy_with_logits
|
|
694
751
|
- bincount
|
|
695
752
|
- binomial
|
|
696
|
-
- binary_cross_entropy_with_logits
|
|
697
753
|
- bitwise_and
|
|
698
754
|
- bitwise_not
|
|
699
755
|
- bitwise_or
|
|
@@ -739,9 +795,9 @@ torch:
|
|
|
739
795
|
- conv_transpose1d
|
|
740
796
|
- conv_transpose2d
|
|
741
797
|
- conv_transpose3d
|
|
742
|
-
- cos
|
|
743
798
|
- convolution
|
|
744
799
|
- copysign
|
|
800
|
+
- cos
|
|
745
801
|
- cos_
|
|
746
802
|
- cosh
|
|
747
803
|
- cosh_
|
|
@@ -755,14 +811,16 @@ torch:
|
|
|
755
811
|
- cummin
|
|
756
812
|
- cumprod
|
|
757
813
|
- cumsum
|
|
814
|
+
- cumulative_trapezoid
|
|
758
815
|
- deg2rad
|
|
759
816
|
- deg2rad_
|
|
760
817
|
- det
|
|
761
818
|
- diag
|
|
762
819
|
- diag_embed
|
|
763
|
-
- diff
|
|
764
820
|
- diagflat
|
|
765
821
|
- diagonal
|
|
822
|
+
- diagonal_scatter
|
|
823
|
+
- diff
|
|
766
824
|
- digamma
|
|
767
825
|
- dist
|
|
768
826
|
- div
|
|
@@ -771,12 +829,15 @@ torch:
|
|
|
771
829
|
- dropout
|
|
772
830
|
- dropout_
|
|
773
831
|
- dsmm
|
|
832
|
+
- dsplit
|
|
774
833
|
- dstack
|
|
775
834
|
- eig
|
|
776
835
|
- einsum
|
|
777
836
|
- embedding
|
|
778
837
|
- embedding_bag
|
|
779
838
|
- embedding_renorm_
|
|
839
|
+
- empty
|
|
840
|
+
- empty_like
|
|
780
841
|
- eq
|
|
781
842
|
- equal
|
|
782
843
|
- erf
|
|
@@ -791,12 +852,12 @@ torch:
|
|
|
791
852
|
- expm1
|
|
792
853
|
- expm1_
|
|
793
854
|
- eye
|
|
794
|
-
- feature_dropout
|
|
795
855
|
- feature_alpha_dropout
|
|
796
856
|
- feature_alpha_dropout_
|
|
857
|
+
- feature_dropout
|
|
797
858
|
- feature_dropout_
|
|
798
|
-
- fix
|
|
799
859
|
- fill_
|
|
860
|
+
- fix
|
|
800
861
|
- fix_
|
|
801
862
|
- flatten
|
|
802
863
|
- flip
|
|
@@ -811,8 +872,9 @@ torch:
|
|
|
811
872
|
- fmod
|
|
812
873
|
- frac
|
|
813
874
|
- frac_
|
|
814
|
-
-
|
|
875
|
+
- frexp
|
|
815
876
|
- frobenius_norm
|
|
877
|
+
- full
|
|
816
878
|
- full_like
|
|
817
879
|
- gather
|
|
818
880
|
- gcd
|
|
@@ -824,8 +886,8 @@ torch:
|
|
|
824
886
|
- greater_equal
|
|
825
887
|
- grid_sampler
|
|
826
888
|
- grid_sampler_2d
|
|
827
|
-
- group_norm
|
|
828
889
|
- grid_sampler_3d
|
|
890
|
+
- group_norm
|
|
829
891
|
- gru
|
|
830
892
|
- gru_cell
|
|
831
893
|
- gt
|
|
@@ -835,23 +897,29 @@ torch:
|
|
|
835
897
|
- heaviside
|
|
836
898
|
- hinge_embedding_loss
|
|
837
899
|
- histc
|
|
900
|
+
- histogram
|
|
901
|
+
- histogramdd
|
|
838
902
|
- hsmm
|
|
903
|
+
- hsplit
|
|
839
904
|
- hspmm
|
|
840
905
|
- hstack
|
|
841
906
|
- hypot
|
|
907
|
+
- i0
|
|
908
|
+
- i0_
|
|
842
909
|
- igamma
|
|
843
910
|
- igammac
|
|
844
911
|
- index_add
|
|
845
912
|
- index_copy
|
|
846
|
-
- inner
|
|
847
913
|
- index_fill
|
|
848
914
|
- index_put
|
|
849
915
|
- index_put_
|
|
850
916
|
- index_select
|
|
917
|
+
- inner
|
|
851
918
|
- instance_norm
|
|
852
919
|
- inverse
|
|
853
920
|
- isclose
|
|
854
921
|
- isfinite
|
|
922
|
+
- isin
|
|
855
923
|
- isinf
|
|
856
924
|
- isnan
|
|
857
925
|
- isneginf
|
|
@@ -879,8 +947,8 @@ torch:
|
|
|
879
947
|
- log1p_
|
|
880
948
|
- log2
|
|
881
949
|
- log2_
|
|
882
|
-
- log_softmax
|
|
883
950
|
- log_
|
|
951
|
+
- log_softmax
|
|
884
952
|
- logaddexp
|
|
885
953
|
- logaddexp2
|
|
886
954
|
- logcumsumexp
|
|
@@ -899,18 +967,18 @@ torch:
|
|
|
899
967
|
- lt
|
|
900
968
|
- lu_solve
|
|
901
969
|
- lu_unpack
|
|
902
|
-
- masked_fill
|
|
903
970
|
- margin_ranking_loss
|
|
971
|
+
- masked_fill
|
|
904
972
|
- masked_scatter
|
|
905
973
|
- masked_select
|
|
906
|
-
- matrix_exp
|
|
907
974
|
- matmul
|
|
975
|
+
- matrix_exp
|
|
908
976
|
- matrix_power
|
|
909
977
|
- matrix_rank
|
|
910
978
|
- max
|
|
911
979
|
- max_pool1d
|
|
912
|
-
- max_pool2d
|
|
913
980
|
- max_pool1d_with_indices
|
|
981
|
+
- max_pool2d
|
|
914
982
|
- max_pool3d
|
|
915
983
|
- maximum
|
|
916
984
|
- mean
|
|
@@ -929,18 +997,20 @@ torch:
|
|
|
929
997
|
- mvlgamma
|
|
930
998
|
- nan_to_num
|
|
931
999
|
- nan_to_num_
|
|
1000
|
+
- nanmean
|
|
932
1001
|
- nanmedian
|
|
1002
|
+
- nanquantile
|
|
933
1003
|
- nansum
|
|
934
1004
|
- narrow
|
|
1005
|
+
- narrow_copy
|
|
935
1006
|
- native_batch_norm
|
|
936
1007
|
- native_group_norm
|
|
937
|
-
- narrow_copy
|
|
938
1008
|
- native_layer_norm
|
|
939
1009
|
- native_norm
|
|
940
1010
|
- ne
|
|
941
1011
|
- neg
|
|
942
|
-
- negative
|
|
943
1012
|
- neg_
|
|
1013
|
+
- negative
|
|
944
1014
|
- negative_
|
|
945
1015
|
- nextafter
|
|
946
1016
|
- nonzero
|
|
@@ -972,30 +1042,31 @@ torch:
|
|
|
972
1042
|
- ravel
|
|
973
1043
|
- real
|
|
974
1044
|
- reciprocal
|
|
975
|
-
- relu
|
|
976
1045
|
- reciprocal_
|
|
1046
|
+
- relu
|
|
977
1047
|
- relu_
|
|
978
1048
|
- remainder
|
|
979
1049
|
- renorm
|
|
980
1050
|
- repeat_interleave
|
|
981
1051
|
- reshape
|
|
982
1052
|
- resize_as_
|
|
1053
|
+
- resolve_neg
|
|
983
1054
|
- roll
|
|
984
1055
|
- rot90
|
|
985
1056
|
- round
|
|
986
1057
|
- round_
|
|
1058
|
+
- row_stack
|
|
987
1059
|
- rrelu
|
|
988
1060
|
- rrelu_
|
|
989
1061
|
- rsqrt
|
|
990
|
-
- row_stack
|
|
991
1062
|
- rsqrt_
|
|
992
1063
|
- rsub
|
|
993
1064
|
- saddmm
|
|
994
1065
|
- scalar_tensor
|
|
995
1066
|
- scatter
|
|
996
|
-
- select
|
|
997
1067
|
- scatter_add
|
|
998
1068
|
- searchsorted
|
|
1069
|
+
- select
|
|
999
1070
|
- selu
|
|
1000
1071
|
- selu_
|
|
1001
1072
|
- sgn
|
|
@@ -1015,12 +1086,12 @@ torch:
|
|
|
1015
1086
|
- solve
|
|
1016
1087
|
- sort
|
|
1017
1088
|
- sparse_coo_tensor
|
|
1018
|
-
- square
|
|
1019
1089
|
- split
|
|
1020
1090
|
- split_with_sizes
|
|
1021
1091
|
- spmm
|
|
1022
1092
|
- sqrt
|
|
1023
1093
|
- sqrt_
|
|
1094
|
+
- square
|
|
1024
1095
|
- square_
|
|
1025
1096
|
- squeeze
|
|
1026
1097
|
- sspaddmm
|
|
@@ -1042,8 +1113,8 @@ torch:
|
|
|
1042
1113
|
- tan_
|
|
1043
1114
|
- tanh
|
|
1044
1115
|
- tanh_
|
|
1045
|
-
- tensordot
|
|
1046
1116
|
- tensor_split
|
|
1117
|
+
- tensordot
|
|
1047
1118
|
- threshold
|
|
1048
1119
|
- threshold_
|
|
1049
1120
|
- tile
|
|
@@ -1059,19 +1130,21 @@ torch:
|
|
|
1059
1130
|
- true_divide
|
|
1060
1131
|
- trunc
|
|
1061
1132
|
- trunc_
|
|
1062
|
-
- unique_consecutive
|
|
1063
|
-
- xlogy
|
|
1064
1133
|
- unbind
|
|
1134
|
+
- unflatten
|
|
1135
|
+
- unique_consecutive
|
|
1065
1136
|
- unsafe_chunk
|
|
1066
1137
|
- unsafe_split
|
|
1067
|
-
- vander
|
|
1068
|
-
- var
|
|
1069
|
-
- vdot
|
|
1070
1138
|
- unsafe_split_with_sizes
|
|
1071
1139
|
- unsqueeze
|
|
1140
|
+
- vander
|
|
1141
|
+
- var
|
|
1072
1142
|
- var_mean
|
|
1143
|
+
- vdot
|
|
1144
|
+
- vsplit
|
|
1073
1145
|
- vstack
|
|
1074
1146
|
- where
|
|
1147
|
+
- xlogy
|
|
1075
1148
|
- xlogy_
|
|
1076
1149
|
|
|
1077
1150
|
_VF:
|
|
@@ -1165,6 +1238,28 @@ torch_npu:
|
|
|
1165
1238
|
- npu_moe_finalize_routing
|
|
1166
1239
|
- npu_moe_gating_top_k_softmax
|
|
1167
1240
|
- npu_trans_quant_param
|
|
1241
|
+
- npu_gelu
|
|
1242
|
+
- npu_ffn
|
|
1243
|
+
- npu_quant_matmul
|
|
1244
|
+
- npu_format_cast_
|
|
1245
|
+
- npu_dynamic_quant
|
|
1246
|
+
- npu_moe_compute_expert_tokens
|
|
1247
|
+
- npu_weight_quant_batchmatmul
|
|
1248
|
+
- npu_dynamic_quant_asymmetric
|
|
1249
|
+
- npu_grouped_matmul
|
|
1250
|
+
- npu_quant_scatter_
|
|
1251
|
+
- npu_group_quant
|
|
1252
|
+
- npu_fused_infer_attention_score
|
|
1253
|
+
- npu_quantize
|
|
1254
|
+
- npu_fast_gelu
|
|
1255
|
+
- npu_weight_quant_batchmatmul
|
|
1256
|
+
- scatter_update
|
|
1257
|
+
- scatter_update_
|
|
1258
|
+
- npu_moe_init_routing
|
|
1259
|
+
- npu_scatter_nd_update_
|
|
1260
|
+
- npu_scatter_nd_update
|
|
1261
|
+
- npu_prefetch
|
|
1262
|
+
- npu_dynamic_block_quant
|
|
1168
1263
|
|
|
1169
1264
|
aten:
|
|
1170
1265
|
- signbit
|
|
@@ -1912,4 +2007,27 @@ distributed:
|
|
|
1912
2007
|
- all_to_all
|
|
1913
2008
|
- all_gather_into_tensor
|
|
1914
2009
|
- reduce_scatter_tensor
|
|
1915
|
-
- batch_isend_irecv
|
|
2010
|
+
- batch_isend_irecv
|
|
2011
|
+
|
|
2012
|
+
npu_distributed:
|
|
2013
|
+
- isend
|
|
2014
|
+
- irecv
|
|
2015
|
+
|
|
2016
|
+
mindspeed:
|
|
2017
|
+
- dropout_add_layer_norm.npu_dropout_add_layer_norm
|
|
2018
|
+
- npu_rotary_position_embedding.npu_rotary_position_embedding
|
|
2019
|
+
- fusion_attention_v2.npu_fusion_attention
|
|
2020
|
+
- npu_mm_all_reduce_add_rms_norm.npu_mm_all_reduce_add_rms_norm
|
|
2021
|
+
- npu_mm_all_reduce_add_rms_norm_.npu_mm_all_reduce_add_rms_norm_
|
|
2022
|
+
- gmm.npu_gmm
|
|
2023
|
+
- gmm.npu_gmm_v2
|
|
2024
|
+
- npu_grouped_mat_mul_all_reduce.npu_grouped_mat_mul_all_reduce
|
|
2025
|
+
- ffn.npu_ffn
|
|
2026
|
+
- npu_moe_token_permute.npu_moe_token_permute
|
|
2027
|
+
- npu_moe_token_unpermute.npu_moe_token_unpermute
|
|
2028
|
+
- npu_ring_attention_update.npu_ring_attention_update
|
|
2029
|
+
- npu_matmul_add.npu_matmul_add_fp32
|
|
2030
|
+
- npu_groupmatmul_add.npu_groupmatmul_add_fp32
|
|
2031
|
+
- quant_gmm.npu_quant_gmm
|
|
2032
|
+
- quant_gmm.npu_quant_gmm_v2
|
|
2033
|
+
- npu_apply_fused_ema_adamw.npu_apply_fused_ema_adamw
|