mindspore 2.2.0__cp38-cp38-manylinux1_x86_64.whl → 2.2.11__cp38-cp38-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. More details are available via the link on the original diff page.

Files changed (170):
  1. mindspore/.commit_id +1 -1
  2. mindspore/_akg/akg/composite/build_module.py +104 -20
  3. mindspore/_akg/akg/utils/ascend_profilier/cann_file_parser.py +76 -0
  4. mindspore/_akg/akg/utils/ascend_profilier/file_manager.py +56 -0
  5. mindspore/_akg/akg/utils/ascend_profilier/op_summary_bean.py +23 -0
  6. mindspore/_akg/akg/utils/ascend_profilier/op_summary_headers.py +8 -0
  7. mindspore/_akg/akg/utils/ascend_profilier/op_summary_parser.py +42 -0
  8. mindspore/_akg/akg/utils/ascend_profilier/path_manager.py +65 -0
  9. mindspore/_akg/akg/utils/composite_op_helper.py +7 -2
  10. mindspore/_akg/akg/utils/dump_ascend_meta.py +22 -3
  11. mindspore/_akg/akg/utils/kernel_exec.py +41 -15
  12. mindspore/_akg/akg/utils/tbe_codegen_utils.py +27 -6
  13. mindspore/_akg/akg/utils/util.py +56 -1
  14. mindspore/_c_dataengine.cpython-38-x86_64-linux-gnu.so +0 -0
  15. mindspore/_c_expression.cpython-38-x86_64-linux-gnu.so +0 -0
  16. mindspore/_checkparam.py +3 -3
  17. mindspore/_extends/graph_kernel/model/graph_split.py +84 -76
  18. mindspore/_extends/graph_kernel/splitter.py +3 -2
  19. mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +83 -66
  20. mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +4 -4
  21. mindspore/_extends/parallel_compile/akg_compiler/util.py +10 -7
  22. mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +2 -1
  23. mindspore/_extends/parse/__init__.py +3 -2
  24. mindspore/_extends/parse/parser.py +6 -1
  25. mindspore/_extends/parse/standard_method.py +14 -11
  26. mindspore/_extends/remote/kernel_build_server.py +2 -1
  27. mindspore/_mindspore_offline_debug.cpython-38-x86_64-linux-gnu.so +0 -0
  28. mindspore/bin/cache_admin +0 -0
  29. mindspore/bin/cache_server +0 -0
  30. mindspore/common/_utils.py +16 -0
  31. mindspore/common/api.py +1 -1
  32. mindspore/common/auto_dynamic_shape.py +81 -85
  33. mindspore/common/dump.py +1 -1
  34. mindspore/common/tensor.py +3 -20
  35. mindspore/config/op_info.config +1 -1
  36. mindspore/context.py +11 -4
  37. mindspore/dataset/engine/cache_client.py +8 -5
  38. mindspore/dataset/engine/datasets_standard_format.py +5 -0
  39. mindspore/dataset/vision/transforms.py +21 -21
  40. mindspore/experimental/optim/adam.py +1 -1
  41. mindspore/gen_ops.py +1 -1
  42. mindspore/include/api/model.h +17 -0
  43. mindspore/include/api/status.h +8 -3
  44. mindspore/lib/libdnnl.so.2 +0 -0
  45. mindspore/lib/libmindspore.so +0 -0
  46. mindspore/lib/libmindspore_backend.so +0 -0
  47. mindspore/lib/libmindspore_common.so +0 -0
  48. mindspore/lib/libmindspore_core.so +0 -0
  49. mindspore/lib/libmindspore_glog.so.0 +0 -0
  50. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  51. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  52. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  53. mindspore/lib/libmindspore_shared_lib.so +0 -0
  54. mindspore/lib/libnnacl.so +0 -0
  55. mindspore/lib/libopencv_core.so.4.5 +0 -0
  56. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  57. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  58. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310/aic-ascend310-ops-info.json +123 -0
  59. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json +123 -0
  60. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json +158 -0
  61. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json +37 -0
  62. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
  63. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
  64. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
  65. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
  66. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
  67. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
  68. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
  69. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
  70. mindspore/lib/plugin/ascend/custom_aicore_ops/op_proto/libop_proto.so +0 -0
  71. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_aicpu_kernels.so +0 -0
  72. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  73. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/config/cust_aicpu_kernel.json +78 -80
  74. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  75. mindspore/lib/plugin/ascend/libakg.so +0 -0
  76. mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
  77. mindspore/lib/plugin/ascend/libmindspore_aicpu_kernels.so +0 -0
  78. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  79. mindspore/lib/plugin/cpu/libakg.so +0 -0
  80. mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
  81. mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
  82. mindspore/lib/plugin/gpu10.1/libakg.so +0 -0
  83. mindspore/lib/plugin/gpu11.1/libakg.so +0 -0
  84. mindspore/lib/plugin/gpu11.1/libnccl.so.2 +0 -0
  85. mindspore/lib/plugin/gpu11.6/libakg.so +0 -0
  86. mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
  87. mindspore/lib/plugin/libmindspore_ascend.so.1 +0 -0
  88. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  89. mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
  90. mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
  91. mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
  92. mindspore/nn/cell.py +0 -3
  93. mindspore/nn/layer/activation.py +4 -5
  94. mindspore/nn/layer/conv.py +39 -23
  95. mindspore/nn/layer/flash_attention.py +54 -129
  96. mindspore/nn/layer/math.py +3 -7
  97. mindspore/nn/layer/rnn_cells.py +5 -5
  98. mindspore/nn/wrap/__init__.py +4 -2
  99. mindspore/nn/wrap/cell_wrapper.py +12 -3
  100. mindspore/numpy/utils_const.py +5 -5
  101. mindspore/ops/_grad_experimental/grad_array_ops.py +1 -1
  102. mindspore/ops/_grad_experimental/grad_implementations.py +2 -2
  103. mindspore/ops/_grad_experimental/grad_math_ops.py +19 -18
  104. mindspore/ops/_grad_experimental/grad_sparse_ops.py +3 -3
  105. mindspore/ops/_op_impl/aicpu/add.py +3 -3
  106. mindspore/ops/_op_impl/aicpu/linear_sum_assignment.py +21 -2
  107. mindspore/ops/_utils/utils.py +2 -0
  108. mindspore/ops/composite/multitype_ops/_compile_utils.py +2 -1
  109. mindspore/ops/composite/multitype_ops/getitem_impl.py +2 -2
  110. mindspore/ops/function/array_func.py +10 -7
  111. mindspore/ops/function/grad/grad_func.py +0 -1
  112. mindspore/ops/function/nn_func.py +98 -9
  113. mindspore/ops/function/random_func.py +2 -1
  114. mindspore/ops/op_info_register.py +24 -21
  115. mindspore/ops/operations/__init__.py +6 -2
  116. mindspore/ops/operations/_grad_ops.py +25 -6
  117. mindspore/ops/operations/_inner_ops.py +155 -23
  118. mindspore/ops/operations/array_ops.py +9 -7
  119. mindspore/ops/operations/comm_ops.py +2 -2
  120. mindspore/ops/operations/custom_ops.py +85 -68
  121. mindspore/ops/operations/inner_ops.py +26 -3
  122. mindspore/ops/operations/math_ops.py +7 -6
  123. mindspore/ops/operations/nn_ops.py +193 -49
  124. mindspore/parallel/_parallel_serialization.py +10 -3
  125. mindspore/parallel/_tensor.py +4 -1
  126. mindspore/parallel/checkpoint_transform.py +13 -2
  127. mindspore/parallel/shard.py +17 -10
  128. mindspore/profiler/common/util.py +1 -0
  129. mindspore/profiler/parser/ascend_hccl_generator.py +232 -0
  130. mindspore/profiler/parser/ascend_msprof_exporter.py +86 -43
  131. mindspore/profiler/parser/ascend_msprof_generator.py +196 -9
  132. mindspore/profiler/parser/ascend_op_generator.py +1 -1
  133. mindspore/profiler/parser/ascend_timeline_generator.py +6 -182
  134. mindspore/profiler/parser/base_timeline_generator.py +1 -1
  135. mindspore/profiler/parser/cpu_gpu_timeline_generator.py +2 -2
  136. mindspore/profiler/parser/framework_parser.py +1 -1
  137. mindspore/profiler/parser/profiler_info.py +19 -0
  138. mindspore/profiler/profiling.py +46 -24
  139. mindspore/rewrite/api/pattern_engine.py +1 -1
  140. mindspore/rewrite/parsers/for_parser.py +7 -7
  141. mindspore/rewrite/parsers/module_parser.py +4 -4
  142. mindspore/rewrite/symbol_tree.py +1 -4
  143. mindspore/run_check/_check_version.py +5 -3
  144. mindspore/safeguard/rewrite_obfuscation.py +52 -28
  145. mindspore/scipy/ops.py +55 -5
  146. mindspore/scipy/optimize/__init__.py +3 -2
  147. mindspore/scipy/optimize/linear_sum_assignment.py +38 -33
  148. mindspore/train/callback/_summary_collector.py +1 -1
  149. mindspore/train/dataset_helper.py +1 -0
  150. mindspore/train/model.py +2 -2
  151. mindspore/train/serialization.py +97 -11
  152. mindspore/train/summary/_summary_adapter.py +1 -1
  153. mindspore/train/summary/summary_record.py +23 -7
  154. mindspore/version.py +1 -1
  155. {mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/METADATA +3 -2
  156. {mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/RECORD +160 -151
  157. mindspore/ops/_op_impl/_custom_op/flash_attention/attention.py +0 -406
  158. mindspore/ops/_op_impl/_custom_op/flash_attention/constants.py +0 -41
  159. mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_bwd.py +0 -467
  160. mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_fwd.py +0 -563
  161. mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_impl.py +0 -193
  162. mindspore/ops/_op_impl/_custom_op/flash_attention/tik_ops_utils.py +0 -435
  163. mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/__init__.py +0 -0
  164. mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/sparse_tiling.py +0 -45
  165. mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/strategy.py +0 -67
  166. mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/wukong_tiling.py +0 -62
  167. /mindspore/{ops/_op_impl/_custom_op/flash_attention → _akg/akg/utils/ascend_profilier}/__init__.py +0 -0
  168. {mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/WHEEL +0 -0
  169. {mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/entry_points.txt +0 -0
  170. {mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/top_level.txt +0 -0
@@ -144,14 +144,14 @@ class AdjustBrightness(ImageTensorOperation, PyTensorOperation):
144
144
 
145
145
  Args:
146
146
  device_target (str, optional): The operator will be executed on this device. Currently supports
147
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
147
+ ``CPU`` . Default: ``CPU`` .
148
148
 
149
149
  Raises:
150
150
  TypeError: If `device_target` is not of type str.
151
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
151
+ ValueError: If `device_target` is not ``CPU`` .
152
152
 
153
153
  Supported Platforms:
154
- ``CPU`` ``Ascend``
154
+ ``CPU``
155
155
 
156
156
  Examples:
157
157
  >>> import mindspore.dataset as ds
@@ -227,14 +227,14 @@ class AdjustContrast(ImageTensorOperation, PyTensorOperation):
227
227
 
228
228
  Args:
229
229
  device_target (str, optional): The operator will be executed on this device. Currently supports
230
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
230
+ ``CPU`` . Default: ``CPU`` .
231
231
 
232
232
  Raises:
233
233
  TypeError: If `device_target` is not of type str.
234
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
234
+ ValueError: If `device_target` is not ``CPU`` .
235
235
 
236
236
  Supported Platforms:
237
- ``CPU`` ``Ascend``
237
+ ``CPU``
238
238
 
239
239
  Examples:
240
240
  >>> import mindspore.dataset as ds
@@ -373,14 +373,14 @@ class AdjustHue(ImageTensorOperation, PyTensorOperation):
373
373
 
374
374
  Args:
375
375
  device_target (str, optional): The operator will be executed on this device. Currently supports
376
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
376
+ ``CPU`` . Default: ``CPU`` .
377
377
 
378
378
  Raises:
379
379
  TypeError: If `device_target` is not of type str.
380
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
380
+ ValueError: If `device_target` is not ``CPU`` .
381
381
 
382
382
  Supported Platforms:
383
- ``CPU`` ``Ascend``
383
+ ``CPU``
384
384
 
385
385
  Examples:
386
386
  >>> import mindspore.dataset as ds
@@ -457,14 +457,14 @@ class AdjustSaturation(ImageTensorOperation, PyTensorOperation):
457
457
 
458
458
  Args:
459
459
  device_target (str, optional): The operator will be executed on this device. Currently supports
460
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
460
+ ``CPU`` . Default: ``CPU`` .
461
461
 
462
462
  Raises:
463
463
  TypeError: If `device_target` is not of type str.
464
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
464
+ ValueError: If `device_target` is not ``CPU`` .
465
465
 
466
466
  Supported Platforms:
467
- ``CPU`` ``Ascend``
467
+ ``CPU``
468
468
 
469
469
  Examples:
470
470
  >>> import mindspore.dataset as ds
@@ -1159,14 +1159,14 @@ class Decode(ImageTensorOperation, PyTensorOperation):
1159
1159
 
1160
1160
  Args:
1161
1161
  device_target (str, optional): The operator will be executed on this device. Currently supports
1162
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
1162
+ ``CPU`` . Default: ``CPU`` .
1163
1163
 
1164
1164
  Raises:
1165
1165
  TypeError: If `device_target` is not of type str.
1166
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
1166
+ ValueError: If `device_target` is not ``CPU`` .
1167
1167
 
1168
1168
  Supported Platforms:
1169
- ``CPU`` ``Ascend``
1169
+ ``CPU``
1170
1170
 
1171
1171
  Examples:
1172
1172
  >>> import mindspore.dataset as ds
@@ -1908,14 +1908,14 @@ class Normalize(ImageTensorOperation):
1908
1908
 
1909
1909
  Args:
1910
1910
  device_target (str, optional): The operator will be executed on this device. Currently supports
1911
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
1911
+ ``CPU`` . Default: ``CPU`` .
1912
1912
 
1913
1913
  Raises:
1914
1914
  TypeError: If `device_target` is not of type str.
1915
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
1915
+ ValueError: If `device_target` is not ``CPU`` .
1916
1916
 
1917
1917
  Supported Platforms:
1918
- ``CPU`` ``Ascend``
1918
+ ``CPU``
1919
1919
 
1920
1920
  Examples:
1921
1921
  >>> import mindspore.dataset as ds
@@ -4182,14 +4182,14 @@ class Resize(ImageTensorOperation, PyTensorOperation):
4182
4182
 
4183
4183
  Args:
4184
4184
  device_target (str, optional): The operator will be executed on this device. Currently supports
4185
- ``CPU`` and ``Ascend`` , where ``Ascend`` refers to Ascend910B device. Default: ``CPU`` .
4185
+ ``CPU`` . Default: ``CPU`` .
4186
4186
 
4187
4187
  Raises:
4188
4188
  TypeError: If `device_target` is not of type str.
4189
- ValueError: If `device_target` is not within the valid set of ['CPU', 'Ascend'].
4189
+ ValueError: If `device_target` is not ``CPU`` .
4190
4190
 
4191
4191
  Supported Platforms:
4192
- ``CPU`` ``Ascend``
4192
+ ``CPU``
4193
4193
 
4194
4194
  Examples:
4195
4195
  >>> import mindspore.dataset as ds
@@ -43,7 +43,7 @@ def _run_adam_with_amsgrad_opt(opt, beta1_power, beta2_power, lr, gradient, para
43
43
 
44
44
  class Adam(Optimizer):
45
45
  r"""
46
- Implements Adam algorithm..
46
+ Implements Adam algorithm.
47
47
 
48
48
  The updating formulas are as follows:
49
49
 
mindspore/gen_ops.py CHANGED
@@ -120,7 +120,7 @@ def generate_py_primitive(yaml_data):
120
120
  assign_str += arg_name
121
121
  args_assign.append(assign_str)
122
122
 
123
- args_assign = '\n'.join(assign for assign in args_assign)
123
+ args_assign = '\n'.join([assign for assign in args_assign])
124
124
  primitive_code = f"""
125
125
  class {class_name}(Primitive):
126
126
  def __init__(self, {', '.join(init_args_with_default)}):
@@ -136,6 +136,13 @@ class MS_API Model {
136
136
  /// \return Status.
137
137
  Status UpdateWeights(const std::vector<MSTensor> &new_weights);
138
138
 
139
+ /// \brief Change the size and or content of weight tensors
140
+ ///
141
+ /// \param[in] A vector where model constant are arranged in sequence
142
+ ///
143
+ /// \return Status.
144
+ Status UpdateWeights(const std::vector<std::vector<MSTensor>> &new_weights);
145
+
139
146
  /// \brief Inference model API. If use this API in train mode, it's equal to RunStep API.
140
147
  ///
141
148
  /// \param[in] inputs A vector where model inputs are arranged in sequence.
@@ -358,6 +365,13 @@ class MS_API Model {
358
365
 
359
366
  const std::shared_ptr<ModelImpl> impl() const { return impl_; }
360
367
 
368
+ /// \brief Get model info by key
369
+ ///
370
+ /// \param[in] key The key of model info key-value pair
371
+ ///
372
+ /// \return The value of the model info associated with the given key.
373
+ inline std::string GetModelInfo(const std::string &key);
374
+
361
375
  private:
362
376
  friend class Serialization;
363
377
  // api without std::string
@@ -374,6 +388,7 @@ class MS_API Model {
374
388
  const std::vector<char> &cropto_lib_path);
375
389
  Status Build(const std::vector<char> &model_path, ModelType model_type, const std::shared_ptr<Context> &model_context,
376
390
  const Key &dec_key, const std::vector<char> &dec_mode, const std::vector<char> &cropto_lib_path);
391
+ std::vector<char> GetModelInfo(const std::vector<char> &key);
377
392
  std::shared_ptr<ModelImpl> impl_;
378
393
  };
379
394
 
@@ -416,5 +431,7 @@ Status Model::Build(const std::string &model_path, ModelType model_type,
416
431
  const std::shared_ptr<Context> &model_context) {
417
432
  return Build(StringToChar(model_path), model_type, model_context);
418
433
  }
434
+
435
+ inline std::string Model::GetModelInfo(const std::string &key) { return CharToString(GetModelInfo(StringToChar(key))); }
419
436
  } // namespace mindspore
420
437
  #endif // MINDSPORE_INCLUDE_API_MODEL_H
@@ -83,9 +83,14 @@ enum StatusCode : uint32_t {
83
83
  kLiteModelRebuild = kLite | (0x0FFFFFFF & -12), /**< Model has been built. */
84
84
 
85
85
  // Executor error code, range: [-100,-200)
86
- kLiteOutOfTensorRange = kLite | (0x0FFFFFFF & -100), /**< Failed to check range. */
87
- kLiteInputTensorError = kLite | (0x0FFFFFFF & -101), /**< Failed to check input tensor. */
88
- kLiteReentrantError = kLite | (0x0FFFFFFF & -102), /**< Exist executor running. */
86
+ kLiteOutOfTensorRange = kLite | (0x0FFFFFFF & -100), /**< Failed to check range. */
87
+ kLiteInputTensorError = kLite | (0x0FFFFFFF & -101), /**< Failed to check input tensor. */
88
+ kLiteReentrantError = kLite | (0x0FFFFFFF & -102), /**< Exist executor running. */
89
+ kLiteLLMWaitProcessTimeOut = kLite | (0x0FFFFFFF & -103), /**< Wait to be processed time out. */
90
+ kLiteLLMKVCacheNotExist = kLite | (0x0FFFFFFF & -104), /**< KV Cache not exist. */
91
+ kLiteLLMRepeatRequest = kLite | (0x0FFFFFFF & -105), /**< repeat request. */
92
+ kLiteLLMRequestAlreadyCompleted = kLite | (0x0FFFFFFF & -106), /**< request already complete!. */
93
+ kLiteLLMEngineFinalized = kLite | (0x0FFFFFFF & -107), /**< llm engine finalized. */
89
94
 
90
95
  // Graph error code, range: [-200,-300)
91
96
  kLiteGraphFileError = kLite | (0x0FFFFFFF & -200), /**< Failed to verify graph file. */
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
Binary file
mindspore/lib/libnnacl.so CHANGED
Binary file
Binary file
Binary file
Binary file
@@ -0,0 +1,123 @@
1
+ {
2
+ "AddDSL":{
3
+ "input0":{
4
+ "dtype":"float16",
5
+ "format":"NCHW",
6
+ "name":"x1",
7
+ "paramType":"required"
8
+ },
9
+ "input1":{
10
+ "dtype":"float16",
11
+ "format":"NCHW",
12
+ "name":"x2",
13
+ "paramType":"required"
14
+ },
15
+ "opFile":{
16
+ "value":"add_dsl"
17
+ },
18
+ "opInterface":{
19
+ "value":"add_dsl"
20
+ },
21
+ "output0":{
22
+ "dtype":"float16",
23
+ "format":"NCHW",
24
+ "name":"y",
25
+ "paramType":"required"
26
+ }
27
+ },
28
+ "AddTik":{
29
+ "input0":{
30
+ "dtype":"float16",
31
+ "format":"ND",
32
+ "name":"x1",
33
+ "paramType":"required"
34
+ },
35
+ "input1":{
36
+ "dtype":"float16",
37
+ "format":"ND",
38
+ "name":"x2",
39
+ "paramType":"required"
40
+ },
41
+ "opFile":{
42
+ "value":"add_tik"
43
+ },
44
+ "opInterface":{
45
+ "value":"add_tik"
46
+ },
47
+ "output0":{
48
+ "dtype":"float16",
49
+ "format":"ND",
50
+ "name":"y",
51
+ "paramType":"required"
52
+ }
53
+ },
54
+ "FlashAttention":{
55
+ "input0":{
56
+ "dtype":"float16,float32,int32",
57
+ "format":"ND,ND,ND",
58
+ "name":"q",
59
+ "paramType":"required"
60
+ },
61
+ "input1":{
62
+ "dtype":"float16,float32,int32",
63
+ "format":"ND,ND,ND",
64
+ "name":"k",
65
+ "paramType":"required"
66
+ },
67
+ "input2":{
68
+ "dtype":"float16,float32,int32",
69
+ "format":"ND,ND,ND",
70
+ "name":"v",
71
+ "paramType":"required"
72
+ },
73
+ "input3":{
74
+ "dtype":"float16,float32,int32",
75
+ "format":"ND,ND,ND",
76
+ "name":"attention_mask",
77
+ "paramType":"required"
78
+ },
79
+ "opFile":{
80
+ "value":"flash_attention"
81
+ },
82
+ "opInterface":{
83
+ "value":"flash_attention"
84
+ },
85
+ "output0":{
86
+ "dtype":"float16,float32,int32",
87
+ "format":"ND,ND,ND",
88
+ "name":"y",
89
+ "paramType":"required"
90
+ }
91
+ },
92
+ "MatmulTik":{
93
+ "input0":{
94
+ "dtype":"int8,uint8,float16",
95
+ "format":"ND,ND,ND",
96
+ "name":"x1",
97
+ "needCompile":"false",
98
+ "paramType":"required",
99
+ "shape":"all"
100
+ },
101
+ "input1":{
102
+ "dtype":"int8,int8,float16",
103
+ "format":"ND,ND,ND",
104
+ "name":"x2",
105
+ "needCompile":"false",
106
+ "paramType":"required",
107
+ "shape":"all"
108
+ },
109
+ "opFile":{
110
+ "value":"matmul_tik"
111
+ },
112
+ "opInterface":{
113
+ "value":"matmul_tik"
114
+ },
115
+ "output0":{
116
+ "dtype":"int32,int32,float",
117
+ "format":"ND,ND,ND",
118
+ "name":"y",
119
+ "paramType":"required",
120
+ "shape":"all"
121
+ }
122
+ }
123
+ }
@@ -0,0 +1,123 @@
1
+ {
2
+ "AddDSL":{
3
+ "input0":{
4
+ "dtype":"float16",
5
+ "format":"NCHW",
6
+ "name":"x1",
7
+ "paramType":"required"
8
+ },
9
+ "input1":{
10
+ "dtype":"float16",
11
+ "format":"NCHW",
12
+ "name":"x2",
13
+ "paramType":"required"
14
+ },
15
+ "opFile":{
16
+ "value":"add_dsl"
17
+ },
18
+ "opInterface":{
19
+ "value":"add_dsl"
20
+ },
21
+ "output0":{
22
+ "dtype":"float16",
23
+ "format":"NCHW",
24
+ "name":"y",
25
+ "paramType":"required"
26
+ }
27
+ },
28
+ "AddTik":{
29
+ "input0":{
30
+ "dtype":"float16",
31
+ "format":"ND",
32
+ "name":"x1",
33
+ "paramType":"required"
34
+ },
35
+ "input1":{
36
+ "dtype":"float16",
37
+ "format":"ND",
38
+ "name":"x2",
39
+ "paramType":"required"
40
+ },
41
+ "opFile":{
42
+ "value":"add_tik"
43
+ },
44
+ "opInterface":{
45
+ "value":"add_tik"
46
+ },
47
+ "output0":{
48
+ "dtype":"float16",
49
+ "format":"ND",
50
+ "name":"y",
51
+ "paramType":"required"
52
+ }
53
+ },
54
+ "FlashAttention":{
55
+ "input0":{
56
+ "dtype":"float16,float32,int32",
57
+ "format":"ND,ND,ND",
58
+ "name":"q",
59
+ "paramType":"required"
60
+ },
61
+ "input1":{
62
+ "dtype":"float16,float32,int32",
63
+ "format":"ND,ND,ND",
64
+ "name":"k",
65
+ "paramType":"required"
66
+ },
67
+ "input2":{
68
+ "dtype":"float16,float32,int32",
69
+ "format":"ND,ND,ND",
70
+ "name":"v",
71
+ "paramType":"required"
72
+ },
73
+ "input3":{
74
+ "dtype":"float16,float32,int32",
75
+ "format":"ND,ND,ND",
76
+ "name":"attention_mask",
77
+ "paramType":"required"
78
+ },
79
+ "opFile":{
80
+ "value":"flash_attention"
81
+ },
82
+ "opInterface":{
83
+ "value":"flash_attention"
84
+ },
85
+ "output0":{
86
+ "dtype":"float16,float32,int32",
87
+ "format":"ND,ND,ND",
88
+ "name":"y",
89
+ "paramType":"required"
90
+ }
91
+ },
92
+ "MatmulTik":{
93
+ "input0":{
94
+ "dtype":"int8,uint8,float16",
95
+ "format":"ND,ND,ND",
96
+ "name":"x1",
97
+ "needCompile":"false",
98
+ "paramType":"required",
99
+ "shape":"all"
100
+ },
101
+ "input1":{
102
+ "dtype":"int8,int8,float16",
103
+ "format":"ND,ND,ND",
104
+ "name":"x2",
105
+ "needCompile":"false",
106
+ "paramType":"required",
107
+ "shape":"all"
108
+ },
109
+ "opFile":{
110
+ "value":"matmul_tik"
111
+ },
112
+ "opInterface":{
113
+ "value":"matmul_tik"
114
+ },
115
+ "output0":{
116
+ "dtype":"int32,int32,float",
117
+ "format":"ND,ND,ND",
118
+ "name":"y",
119
+ "paramType":"required",
120
+ "shape":"all"
121
+ }
122
+ }
123
+ }
@@ -0,0 +1,158 @@
1
+ {
2
+ "AddDSL":{
3
+ "input0":{
4
+ "dtype":"float16,float32,int32",
5
+ "format":"ND,ND,ND",
6
+ "name":"x1",
7
+ "paramType":"required"
8
+ },
9
+ "input1":{
10
+ "dtype":"float16,float32,int32",
11
+ "format":"ND,ND,ND",
12
+ "name":"x2",
13
+ "paramType":"required"
14
+ },
15
+ "opFile":{
16
+ "value":"add_dsl"
17
+ },
18
+ "opInterface":{
19
+ "value":"add_dsl"
20
+ },
21
+ "output0":{
22
+ "dtype":"float16,float32,int32",
23
+ "format":"ND,ND,ND",
24
+ "name":"y",
25
+ "paramType":"required"
26
+ }
27
+ },
28
+ "AddTik":{
29
+ "input0":{
30
+ "dtype":"float16,float32,int32",
31
+ "format":"ND,ND,ND",
32
+ "name":"x1",
33
+ "paramType":"required"
34
+ },
35
+ "input1":{
36
+ "dtype":"float16,float32,int32",
37
+ "format":"ND,ND,ND",
38
+ "name":"x2",
39
+ "paramType":"required"
40
+ },
41
+ "opFile":{
42
+ "value":"add_tik"
43
+ },
44
+ "opInterface":{
45
+ "value":"add_tik"
46
+ },
47
+ "output0":{
48
+ "dtype":"float16,float32,int32",
49
+ "format":"ND,ND,ND",
50
+ "name":"y",
51
+ "paramType":"required"
52
+ }
53
+ },
54
+ "FlashAttention":{
55
+ "input0":{
56
+ "dtype":"float16,float32,int32",
57
+ "format":"ND,ND,ND",
58
+ "name":"q",
59
+ "paramType":"required"
60
+ },
61
+ "input1":{
62
+ "dtype":"float16,float32,int32",
63
+ "format":"ND,ND,ND",
64
+ "name":"k",
65
+ "paramType":"required"
66
+ },
67
+ "input2":{
68
+ "dtype":"float16,float32,int32",
69
+ "format":"ND,ND,ND",
70
+ "name":"v",
71
+ "paramType":"required"
72
+ },
73
+ "input3":{
74
+ "dtype":"float16,float32,int32",
75
+ "format":"ND,ND,ND",
76
+ "name":"attention_mask",
77
+ "paramType":"required"
78
+ },
79
+ "opFile":{
80
+ "value":"flash_attention"
81
+ },
82
+ "opInterface":{
83
+ "value":"flash_attention"
84
+ },
85
+ "output0":{
86
+ "dtype":"float16,float32,int32",
87
+ "format":"ND,ND,ND",
88
+ "name":"y",
89
+ "paramType":"required"
90
+ }
91
+ },
92
+ "KVCacheMgr":{
93
+ "input0":{
94
+ "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
95
+ "format":"ND,ND,ND,ND,ND,ND,ND,ND",
96
+ "name":"past",
97
+ "paramType":"required"
98
+ },
99
+ "input1":{
100
+ "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
101
+ "format":"ND,ND,ND,ND,ND,ND,ND,ND",
102
+ "name":"cur",
103
+ "paramType":"required"
104
+ },
105
+ "input2":{
106
+ "dtype":"int32,int32,int32,int32,int32,int32,int32,int32",
107
+ "format":"ND,ND,ND,ND,ND,ND,ND,ND",
108
+ "name":"index",
109
+ "paramType":"required"
110
+ },
111
+ "needCheckSupport":{
112
+ "flag":"true"
113
+ },
114
+ "opFile":{
115
+ "value":"kv_cache_mgr"
116
+ },
117
+ "opInterface":{
118
+ "value":"kv_cache_mgr"
119
+ },
120
+ "output0":{
121
+ "dtype":"float32, int32, uint32, float16, int16, uint16, int8, uint8",
122
+ "format":"ND,ND,ND,ND,ND,ND,ND,ND",
123
+ "name":"past",
124
+ "paramType":"required"
125
+ }
126
+ },
127
+ "MatmulTik":{
128
+ "input0":{
129
+ "dtype":"int8,uint8,float16",
130
+ "format":"ND,ND,ND",
131
+ "name":"x1",
132
+ "needCompile":"false",
133
+ "paramType":"required",
134
+ "shape":"all"
135
+ },
136
+ "input1":{
137
+ "dtype":"int8,int8,float16",
138
+ "format":"ND,ND,ND",
139
+ "name":"x2",
140
+ "needCompile":"false",
141
+ "paramType":"required",
142
+ "shape":"all"
143
+ },
144
+ "opFile":{
145
+ "value":"matmul_tik"
146
+ },
147
+ "opInterface":{
148
+ "value":"matmul_tik"
149
+ },
150
+ "output0":{
151
+ "dtype":"int32,int32,float",
152
+ "format":"ND,ND,ND",
153
+ "name":"y",
154
+ "paramType":"required",
155
+ "shape":"all"
156
+ }
157
+ }
158
+ }