PyPI - mindspore - Versions diffs - 2.2.0__cp38-cp38-manylinux1_x86_64.whl → 2.2.10__cp38-cp38-manylinux1_x86_64.whl - Mend

mindspore 2.2.0__cp38-cp38-manylinux1_x86_64.whl → 2.2.10__cp38-cp38-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mindspore might be problematic. Click here for more details.

Files changed (149) hide show

mindspore/.commit_id +1 -1
mindspore/_akg/akg/composite/build_module.py +9 -15
mindspore/_akg/akg/utils/ascend_profilier/__init__.py +0 -0
mindspore/_akg/akg/utils/ascend_profilier/cann_file_parser.py +76 -0
mindspore/_akg/akg/utils/ascend_profilier/file_manager.py +56 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_bean.py +23 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_headers.py +8 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_parser.py +42 -0
mindspore/_akg/akg/utils/ascend_profilier/path_manager.py +65 -0
mindspore/_akg/akg/utils/kernel_exec.py +41 -15
mindspore/_akg/akg/utils/tbe_codegen_utils.py +27 -6
mindspore/_akg/akg/utils/util.py +38 -0
mindspore/_c_dataengine.cpython-38-x86_64-linux-gnu.so +0 -0
mindspore/_c_expression.cpython-38-x86_64-linux-gnu.so +0 -0
mindspore/_checkparam.py +3 -3
mindspore/_extends/graph_kernel/model/graph_split.py +84 -76
mindspore/_extends/graph_kernel/splitter.py +3 -2
mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +83 -66
mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +4 -4
mindspore/_extends/parallel_compile/akg_compiler/util.py +10 -7
mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +2 -1
mindspore/_extends/parse/standard_method.py +2 -9
mindspore/_extends/remote/kernel_build_server.py +2 -1
mindspore/_mindspore_offline_debug.cpython-38-x86_64-linux-gnu.so +0 -0
mindspore/bin/cache_admin +0 -0
mindspore/bin/cache_server +0 -0
mindspore/common/api.py +1 -1
mindspore/common/auto_dynamic_shape.py +81 -85
mindspore/common/dump.py +1 -1
mindspore/common/tensor.py +3 -20
mindspore/config/op_info.config +1 -1
mindspore/context.py +11 -4
mindspore/dataset/engine/datasets_standard_format.py +5 -0
mindspore/dataset/vision/transforms.py +21 -21
mindspore/experimental/optim/adam.py +1 -1
mindspore/gen_ops.py +1 -1
mindspore/include/api/model.h +17 -0
mindspore/include/api/status.h +8 -3
mindspore/lib/libdnnl.so.2 +0 -0
mindspore/lib/libmindspore.so +0 -0
mindspore/lib/libmindspore_backend.so +0 -0
mindspore/lib/libmindspore_common.so +0 -0
mindspore/lib/libmindspore_core.so +0 -0
mindspore/lib/libmindspore_glog.so.0 +0 -0
mindspore/lib/libmindspore_gpr.so.15 +0 -0
mindspore/lib/libmindspore_grpc++.so.1 +0 -0
mindspore/lib/libmindspore_grpc.so.15 +0 -0
mindspore/lib/libmindspore_shared_lib.so +0 -0
mindspore/lib/libnnacl.so +0 -0
mindspore/lib/libopencv_core.so.4.5 +0 -0
mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310/aic-ascend310-ops-info.json +123 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json +123 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json +158 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json +37 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_proto/libop_proto.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_aicpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/config/cust_aicpu_kernel.json +8 -80
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
mindspore/lib/plugin/ascend/libakg.so +0 -0
mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
mindspore/lib/plugin/ascend/libmindspore_aicpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
mindspore/lib/plugin/cpu/libakg.so +0 -0
mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
mindspore/lib/plugin/gpu10.1/libakg.so +0 -0
mindspore/lib/plugin/gpu10.1/libnccl.so.2 +0 -0
mindspore/lib/plugin/gpu11.1/libakg.so +0 -0
mindspore/lib/plugin/gpu11.1/libnccl.so.2 +0 -0
mindspore/lib/plugin/gpu11.6/libakg.so +0 -0
mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
mindspore/lib/plugin/libmindspore_ascend.so.1 +0 -0
mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
mindspore/nn/cell.py +0 -3
mindspore/nn/layer/activation.py +4 -5
mindspore/nn/layer/conv.py +39 -23
mindspore/nn/layer/flash_attention.py +90 -78
mindspore/nn/layer/math.py +3 -7
mindspore/nn/layer/rnn_cells.py +5 -5
mindspore/nn/wrap/cell_wrapper.py +6 -0
mindspore/numpy/utils_const.py +5 -5
mindspore/ops/_grad_experimental/grad_array_ops.py +1 -1
mindspore/ops/_grad_experimental/grad_implementations.py +2 -2
mindspore/ops/_grad_experimental/grad_math_ops.py +19 -18
mindspore/ops/_grad_experimental/grad_sparse_ops.py +3 -3
mindspore/ops/_op_impl/aicpu/add.py +3 -3
mindspore/ops/_utils/utils.py +2 -0
mindspore/ops/composite/multitype_ops/_compile_utils.py +2 -1
mindspore/ops/composite/multitype_ops/getitem_impl.py +2 -2
mindspore/ops/function/array_func.py +10 -7
mindspore/ops/function/grad/grad_func.py +0 -1
mindspore/ops/function/nn_func.py +98 -9
mindspore/ops/function/random_func.py +2 -1
mindspore/ops/op_info_register.py +24 -21
mindspore/ops/operations/__init__.py +3 -2
mindspore/ops/operations/_grad_ops.py +24 -4
mindspore/ops/operations/_inner_ops.py +155 -23
mindspore/ops/operations/array_ops.py +9 -7
mindspore/ops/operations/comm_ops.py +2 -2
mindspore/ops/operations/custom_ops.py +85 -68
mindspore/ops/operations/inner_ops.py +26 -3
mindspore/ops/operations/math_ops.py +4 -3
mindspore/ops/operations/nn_ops.py +109 -28
mindspore/parallel/_parallel_serialization.py +10 -3
mindspore/parallel/_tensor.py +4 -1
mindspore/parallel/checkpoint_transform.py +13 -2
mindspore/parallel/shard.py +17 -10
mindspore/profiler/common/util.py +1 -0
mindspore/profiler/parser/ascend_hccl_generator.py +232 -0
mindspore/profiler/parser/ascend_msprof_exporter.py +86 -43
mindspore/profiler/parser/ascend_msprof_generator.py +196 -9
mindspore/profiler/parser/ascend_op_generator.py +1 -1
mindspore/profiler/parser/ascend_timeline_generator.py +6 -182
mindspore/profiler/parser/base_timeline_generator.py +1 -1
mindspore/profiler/parser/cpu_gpu_timeline_generator.py +2 -2
mindspore/profiler/parser/framework_parser.py +1 -1
mindspore/profiler/parser/profiler_info.py +19 -0
mindspore/profiler/profiling.py +46 -24
mindspore/rewrite/api/pattern_engine.py +1 -1
mindspore/rewrite/parsers/for_parser.py +1 -1
mindspore/rewrite/symbol_tree.py +1 -4
mindspore/run_check/_check_version.py +5 -3
mindspore/safeguard/rewrite_obfuscation.py +52 -28
mindspore/train/callback/_summary_collector.py +1 -1
mindspore/train/dataset_helper.py +1 -0
mindspore/train/model.py +2 -2
mindspore/train/serialization.py +97 -11
mindspore/train/summary/_summary_adapter.py +1 -1
mindspore/train/summary/summary_record.py +23 -7
mindspore/version.py +1 -1
{mindspore-2.2.0.dist-info → mindspore-2.2.10.dist-info}/METADATA +1 -1
{mindspore-2.2.0.dist-info → mindspore-2.2.10.dist-info}/RECORD +149 -129
{mindspore-2.2.0.dist-info → mindspore-2.2.10.dist-info}/WHEEL +0 -0
{mindspore-2.2.0.dist-info → mindspore-2.2.10.dist-info}/entry_points.txt +0 -0
{mindspore-2.2.0.dist-info → mindspore-2.2.10.dist-info}/top_level.txt +0 -0

mindspore/include/api/model.h CHANGED Viewed

@@ -136,6 +136,13 @@ class MS_API Model {
   /// \return Status.
   Status UpdateWeights(const std::vector<MSTensor> &new_weights);
+  /// \brief Change the size and/or content of weight tensors.
+  ///
+  /// \param[in] new_weights A vector where model constants are arranged in sequence.
+  ///
+  /// \return Status.
+  Status UpdateWeights(const std::vector<std::vector<MSTensor>> &new_weights);
   /// \brief Inference model API. If use this API in train mode, it's equal to RunStep API.
   ///
   /// \param[in] inputs A vector where model inputs are arranged in sequence.
@@ -358,6 +365,13 @@ class MS_API Model {
   const std::shared_ptr<ModelImpl> impl() const { return impl_; }
+  /// \brief Get model info by key
+  ///
+  /// \param[in] key The key of model info key-value pair
+  ///
+  /// \return The value of the model info associated with the given key.
+  inline std::string GetModelInfo(const std::string &key);
  private:
   friend class Serialization;
   // api without std::string
@@ -374,6 +388,7 @@ class MS_API Model {
                const std::vector<char> &cropto_lib_path);
   Status Build(const std::vector<char> &model_path, ModelType model_type, const std::shared_ptr<Context> &model_context,
                const Key &dec_key, const std::vector<char> &dec_mode, const std::vector<char> &cropto_lib_path);
+  std::vector<char> GetModelInfo(const std::vector<char> &key);
   std::shared_ptr<ModelImpl> impl_;
 };
@@ -416,5 +431,7 @@ Status Model::Build(const std::string &model_path, ModelType model_type,
                     const std::shared_ptr<Context> &model_context) {
   return Build(StringToChar(model_path), model_type, model_context);
 }
+inline std::string Model::GetModelInfo(const std::string &key) { return CharToString(GetModelInfo(StringToChar(key))); }  // std::string wrapper: converts key with StringToChar, calls the std::vector<char> overload, converts the result back with CharToString
 }  // namespace mindspore
 #endif  // MINDSPORE_INCLUDE_API_MODEL_H

mindspore/include/api/status.h CHANGED Viewed

@@ -83,9 +83,14 @@ enum StatusCode : uint32_t {
   kLiteModelRebuild = kLite | (0x0FFFFFFF & -12),    /**< Model has been built. */
   // Executor error code, range: [-100,-200)
-  kLiteOutOfTensorRange = kLite | (0x0FFFFFFF & -100), /**< Failed to check range. */
-  kLiteInputTensorError = kLite | (0x0FFFFFFF & -101), /**< Failed to check input tensor. */
-  kLiteReentrantError = kLite | (0x0FFFFFFF & -102),   /**< Exist executor running. */
+  kLiteOutOfTensorRange = kLite | (0x0FFFFFFF & -100),           /**< Failed to check range. */
+  kLiteInputTensorError = kLite | (0x0FFFFFFF & -101),           /**< Failed to check input tensor. */
+  kLiteReentrantError = kLite | (0x0FFFFFFF & -102),             /**< Exist executor running. */
+  kLiteLLMWaitProcessTimeOut = kLite | (0x0FFFFFFF & -103),      /**< Wait to be processed time out. */
+  kLiteLLMKVCacheNotExist = kLite | (0x0FFFFFFF & -104),         /**< KV Cache not exist. */
+  kLiteLLMRepeatRequest = kLite | (0x0FFFFFFF & -105),           /**< repeat request. */
+  kLiteLLMRequestAlreadyCompleted = kLite | (0x0FFFFFFF & -106), /**< Request already completed. */
+  kLiteLLMEngineFinalized = kLite | (0x0FFFFFFF & -107),         /**< llm engine finalized. */
   // Graph error code, range: [-200,-300)
   kLiteGraphFileError = kLite | (0x0FFFFFFF & -200), /**< Failed to verify graph file. */

mindspore/lib/libdnnl.so.2 CHANGED Viewed

Binary file

mindspore/lib/libmindspore.so CHANGED Viewed

Binary file

mindspore/lib/libmindspore_backend.so CHANGED Viewed

Binary file

mindspore/lib/libmindspore_common.so CHANGED Viewed

Binary file

mindspore/lib/libmindspore_core.so CHANGED Viewed

Binary file

mindspore/lib/libmindspore_glog.so.0 CHANGED Viewed

Binary file

mindspore/lib/libmindspore_gpr.so.15 CHANGED Viewed

Binary file

mindspore/lib/libmindspore_grpc++.so.1 CHANGED Viewed

Binary file

mindspore/lib/libmindspore_grpc.so.15 CHANGED Viewed

Binary file

mindspore/lib/libmindspore_shared_lib.so CHANGED Viewed

Binary file

mindspore/lib/libnnacl.so CHANGED Viewed

Binary file

mindspore/lib/libopencv_core.so.4.5 CHANGED Viewed

Binary file

mindspore/lib/libopencv_imgcodecs.so.4.5 CHANGED Viewed

Binary file

mindspore/lib/libopencv_imgproc.so.4.5 CHANGED Viewed

Binary file

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310/aic-ascend310-ops-info.json ADDED Viewed

@@ -0,0 +1,123 @@
+{
+    "AddDSL":{
+        "input0":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_dsl"
+        },
+        "opInterface":{
+            "value":"add_dsl"
+        },
+        "output0":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "AddTik":{
+        "input0":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_tik"
+        },
+        "opInterface":{
+            "value":"add_tik"
+        },
+        "output0":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "FlashAttention":{
+        "input0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"q",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"k",
+            "paramType":"required"
+        },
+        "input2":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"v",
+            "paramType":"required"
+        },
+        "input3":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"attention_mask",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"flash_attention"
+        },
+        "opInterface":{
+            "value":"flash_attention"
+        },
+        "output0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "MatmulTik":{
+        "input0":{
+            "dtype":"int8,uint8,float16",
+            "format":"ND,ND,ND",
+            "name":"x1",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "input1":{
+            "dtype":"int8,int8,float16",
+            "format":"ND,ND,ND",
+            "name":"x2",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "opFile":{
+            "value":"matmul_tik"
+        },
+        "opInterface":{
+            "value":"matmul_tik"
+        },
+        "output0":{
+            "dtype":"int32,int32,float",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required",
+            "shape":"all"
+        }
+    }
+}

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json ADDED Viewed

@@ -0,0 +1,123 @@
+{
+    "AddDSL":{
+        "input0":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_dsl"
+        },
+        "opInterface":{
+            "value":"add_dsl"
+        },
+        "output0":{
+            "dtype":"float16",
+            "format":"NCHW",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "AddTik":{
+        "input0":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_tik"
+        },
+        "opInterface":{
+            "value":"add_tik"
+        },
+        "output0":{
+            "dtype":"float16",
+            "format":"ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "FlashAttention":{
+        "input0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"q",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"k",
+            "paramType":"required"
+        },
+        "input2":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"v",
+            "paramType":"required"
+        },
+        "input3":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"attention_mask",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"flash_attention"
+        },
+        "opInterface":{
+            "value":"flash_attention"
+        },
+        "output0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "MatmulTik":{
+        "input0":{
+            "dtype":"int8,uint8,float16",
+            "format":"ND,ND,ND",
+            "name":"x1",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "input1":{
+            "dtype":"int8,int8,float16",
+            "format":"ND,ND,ND",
+            "name":"x2",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "opFile":{
+            "value":"matmul_tik"
+        },
+        "opInterface":{
+            "value":"matmul_tik"
+        },
+        "output0":{
+            "dtype":"int32,int32,float",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required",
+            "shape":"all"
+        }
+    }
+}

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json ADDED Viewed

@@ -0,0 +1,158 @@
+{
+    "AddDSL":{
+        "input0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_dsl"
+        },
+        "opInterface":{
+            "value":"add_dsl"
+        },
+        "output0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "AddTik":{
+        "input0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"x1",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"x2",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"add_tik"
+        },
+        "opInterface":{
+            "value":"add_tik"
+        },
+        "output0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "FlashAttention":{
+        "input0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"q",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"k",
+            "paramType":"required"
+        },
+        "input2":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"v",
+            "paramType":"required"
+        },
+        "input3":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"attention_mask",
+            "paramType":"required"
+        },
+        "opFile":{
+            "value":"flash_attention"
+        },
+        "opInterface":{
+            "value":"flash_attention"
+        },
+        "output0":{
+            "dtype":"float16,float32,int32",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required"
+        }
+    },
+    "KVCacheMgr":{
+        "input0":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"past",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"cur",
+            "paramType":"required"
+        },
+        "input2":{
+            "dtype":"int32,int32,int32,int32,int32,int32,int32,int32",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"index",
+            "paramType":"required"
+        },
+        "needCheckSupport":{
+            "flag":"true"
+        },
+        "opFile":{
+            "value":"kv_cache_mgr"
+        },
+        "opInterface":{
+            "value":"kv_cache_mgr"
+        },
+        "output0":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"past",
+            "paramType":"required"
+        }
+    },
+    "MatmulTik":{
+        "input0":{
+            "dtype":"int8,uint8,float16",
+            "format":"ND,ND,ND",
+            "name":"x1",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "input1":{
+            "dtype":"int8,int8,float16",
+            "format":"ND,ND,ND",
+            "name":"x2",
+            "needCompile":"false",
+            "paramType":"required",
+            "shape":"all"
+        },
+        "opFile":{
+            "value":"matmul_tik"
+        },
+        "opInterface":{
+            "value":"matmul_tik"
+        },
+        "output0":{
+            "dtype":"int32,int32,float",
+            "format":"ND,ND,ND",
+            "name":"y",
+            "paramType":"required",
+            "shape":"all"
+        }
+    }
+}

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json ADDED Viewed

@@ -0,0 +1,37 @@
+{
+    "KVCacheMgr":{
+        "input0":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"past",
+            "paramType":"required"
+        },
+        "input1":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"cur",
+            "paramType":"required"
+        },
+        "input2":{
+            "dtype":"int32,int32,int32,int32,int32,int32,int32,int32",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"index",
+            "paramType":"required"
+        },
+        "needCheckSupport":{
+            "flag":"true"
+        },
+        "opFile":{
+            "value":"kv_cache_mgr"
+        },
+        "opInterface":{
+            "value":"kv_cache_mgr"
+        },
+        "output0":{
+            "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
+            "format":"ND,ND,ND,ND,ND,ND,ND,ND",
+            "name":"past",
+            "paramType":"required"
+        }
+    }
+}

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_dsl.py ADDED Viewed

@@ -0,0 +1,46 @@
+# Copyright 2022 Huawei Technologies Co., Ltd
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ============================================================================
+"""ascend custom op: add by dsl"""
+import tbe.dsl as tbe
+from tbe import tvm
+from tbe.common.register import register_op_compute
+from tbe.common.utils import para_check
+@register_op_compute("add_dsl")  # presumably registers this function as the compute for op "add_dsl" -- TODO confirm
+def add_dsl_compute(x1, x2, y, kernel_name="add_dsl"):  # compute step: returns tbe.vadd(x1, x2); y and kernel_name are accepted but not read here
+    res = tbe.vadd(x1, x2)  # presumably an element-wise add from tbe.dsl -- TODO confirm against the TBE docs
+    return res
+@para_check.check_op_params(para_check.REQUIRED_INPUT, para_check.REQUIRED_INPUT,  # presumably one checker per parameter, in order:
+                            para_check.REQUIRED_OUTPUT, para_check.KERNEL_NAME)  # x1, x2, y, kernel_name -- TODO confirm
+def add_dsl(x1, x2, y, kernel_name="add_dsl"):  # entry point: builds the add kernel via the tbe DSL; has no return statement
+    """add dsl impl function"""
+    data_x1 = tvm.placeholder(  # placeholder built from x1's "shape" and "dtype" entries (x1 is read with .get)
+        x1.get("shape"), dtype=x1.get("dtype"), name="data_x1")
+    data_x2 = tvm.placeholder(  # same for x2
+        x2.get("shape"), dtype=x2.get("dtype"), name="data_x2")
+    res = add_dsl_compute(data_x1, data_x2, y, kernel_name)  # y and kernel_name are forwarded, but add_dsl_compute does not read them
+    # auto schedule: the schedule for res is obtained inside the tvm.target.cce() context
+    with tvm.target.cce():
+        schedule = tbe.auto_schedule(res)
+    # operator build: config carries the kernel name and the tensor list (two inputs followed by the result)
+    config = {"name": kernel_name,
+              "tensor_list": [data_x1, data_x2, res]}
+    tbe.build(schedule, config)  # last statement; nothing is returned to the caller

mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_tik.py ADDED Viewed

@@ -0,0 +1,51 @@
+# Copyright 2022 Huawei Technologies Co., Ltd
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ============================================================================
+"""ascend custom op: add by tik"""
+from tbe.common.register import register_op_compute
+from tbe.common.utils import para_check
+from tbe import tik
+@register_op_compute("AddTik")  # NOTE(review): registered as "AddTik", whereas kernel_name defaults to "add_tik"
+@para_check.check_op_params(para_check.REQUIRED_INPUT, para_check.REQUIRED_INPUT,  # presumably one checker per parameter, in order:
+                            para_check.REQUIRED_OUTPUT, para_check.KERNEL_NAME)  # x1, x2, y, kernel_name -- TODO confirm
+def add_tik(x1, x2, y, kernel_name="add_tik"):  # builds an add kernel with the tik API and returns the tik instance
+    """add dsl impl function"""  # NOTE(review): says "dsl", but this is add_tik and it uses the tik API
+    tik_instance = tik.Tik()
+    x1_shape = x1.get("shape")  # only "shape" is read from x1, x2 and y; their "dtype" is never consulted
+    x2_shape = x2.get("shape")
+    y_shape = y.get("shape")
+    data_a = tik_instance.Tensor(  # x1 / x2 / y tensors are declared with tik.scope_gm (presumably global memory -- TODO confirm)
+        "float16", x1_shape, name="x1", scope=tik.scope_gm)  # dtype is hard-coded to "float16" for every tensor below as well
+    data_b = tik_instance.Tensor(
+        "float16", x2_shape, name="x2", scope=tik.scope_gm)
+    data_c = tik_instance.Tensor(
+        "float16", y_shape, name="y", scope=tik.scope_gm)
+    data_a_ub = tik_instance.Tensor(  # *_ub tensors reuse the same shapes but use tik.scope_ubuf (presumably the on-chip unified buffer)
+        "float16", x1_shape, name="data_A_ub", scope=tik.scope_ubuf)
+    data_b_ub = tik_instance.Tensor(
+        "float16", x2_shape, name="data_B_ub", scope=tik.scope_ubuf)
+    data_c_ub = tik_instance.Tensor(
+        "float16", y_shape, name="data_C_ub", scope=tik.scope_ubuf)
+    tik_instance.data_move(data_a_ub, data_a, 0, 1, 128 // 16, 0, 0)  # presumably copies data_a into data_a_ub; 128 // 16 is a constant 8, independent of the shapes
+    tik_instance.data_move(data_b_ub, data_b, 0, 1, 128 // 16, 0, 0)  # same transfer for the second operand
+    tik_instance.vec_add(  # presumably data_c_ub = data_a_ub + data_b_ub -- TODO confirm operand order
+        128, data_c_ub[0], data_a_ub[0], data_b_ub[0], 1, 8, 8, 8)  # 128 matches the constant used in the copies; meaning of 1, 8, 8, 8 is not visible here
+    tik_instance.data_move(data_c, data_c_ub, 0, 1, 128 // 16, 0, 0)  # presumably copies the result from data_c_ub back to data_c
+    tik_instance.BuildCCE(kernel_name=kernel_name, inputs=[data_a, data_b], outputs=[data_c])  # data_a and data_b are the kernel inputs, data_c the output
+    return tik_instance