nvidia-cudnn-cu12 8.9.7.29__py3-none-win_amd64.whl → 9.1.0.70__py3-none-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (56) hide show
  1. nvidia/cudnn/bin/cudnn64_9.dll +0 -0
  2. nvidia/cudnn/bin/{cudnn_adv_infer64_8.dll → cudnn_adv64_9.dll} +0 -0
  3. nvidia/cudnn/bin/cudnn_cnn64_9.dll +0 -0
  4. nvidia/cudnn/bin/{cudnn_cnn_infer64_8.dll → cudnn_engines_precompiled64_9.dll} +0 -0
  5. nvidia/cudnn/bin/cudnn_engines_runtime_compiled64_9.dll +0 -0
  6. nvidia/cudnn/bin/cudnn_graph64_9.dll +0 -0
  7. nvidia/cudnn/bin/{cudnn_ops_infer64_8.dll → cudnn_heuristic64_9.dll} +0 -0
  8. nvidia/cudnn/bin/{cudnn_adv_train64_8.dll → cudnn_ops64_9.dll} +0 -0
  9. nvidia/cudnn/include/cudnn.h +8 -18
  10. nvidia/cudnn/include/{cudnn_adv_infer.h → cudnn_adv.h} +265 -252
  11. nvidia/cudnn/include/cudnn_backend.h +3 -558
  12. nvidia/cudnn/include/{cudnn_cnn_infer.h → cudnn_cnn.h} +187 -65
  13. nvidia/cudnn/include/cudnn_graph.h +909 -0
  14. nvidia/cudnn/include/{cudnn_ops_infer.h → cudnn_ops.h} +469 -336
  15. nvidia/cudnn/include/cudnn_version.h +4 -43
  16. nvidia/cudnn/lib/x64/cudnn.lib +0 -0
  17. nvidia/cudnn/lib/x64/cudnn64_9.lib +0 -0
  18. nvidia/cudnn/lib/x64/cudnn_adv.lib +0 -0
  19. nvidia/cudnn/lib/x64/cudnn_adv64_9.lib +0 -0
  20. nvidia/cudnn/lib/x64/cudnn_cnn.lib +0 -0
  21. nvidia/cudnn/lib/x64/cudnn_cnn64_9.lib +0 -0
  22. nvidia/cudnn/lib/x64/cudnn_engines_precompiled.lib +0 -0
  23. nvidia/cudnn/lib/x64/cudnn_engines_precompiled64_9.lib +0 -0
  24. nvidia/cudnn/lib/x64/cudnn_engines_runtime_compiled.lib +0 -0
  25. nvidia/cudnn/lib/x64/cudnn_engines_runtime_compiled64_9.lib +0 -0
  26. nvidia/cudnn/lib/x64/cudnn_graph.lib +0 -0
  27. nvidia/cudnn/lib/x64/cudnn_graph64_9.lib +0 -0
  28. nvidia/cudnn/lib/x64/cudnn_heuristic.lib +0 -0
  29. nvidia/cudnn/lib/x64/cudnn_heuristic64_9.lib +0 -0
  30. nvidia/cudnn/lib/x64/cudnn_ops.lib +0 -0
  31. nvidia/cudnn/lib/x64/cudnn_ops64_9.lib +0 -0
  32. {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/METADATA +1 -1
  33. nvidia_cudnn_cu12-9.1.0.70.dist-info/RECORD +41 -0
  34. nvidia/cudnn/bin/cudnn64_8.dll +0 -0
  35. nvidia/cudnn/bin/cudnn_cnn_train64_8.dll +0 -0
  36. nvidia/cudnn/bin/cudnn_ops_train64_8.dll +0 -0
  37. nvidia/cudnn/include/cudnn_adv_train.h +0 -540
  38. nvidia/cudnn/include/cudnn_cnn_train.h +0 -219
  39. nvidia/cudnn/include/cudnn_ops_train.h +0 -501
  40. nvidia/cudnn/lib/x64/cudnn64_8.lib +0 -0
  41. nvidia/cudnn/lib/x64/cudnn_adv_infer.lib +0 -0
  42. nvidia/cudnn/lib/x64/cudnn_adv_infer64_8.lib +0 -0
  43. nvidia/cudnn/lib/x64/cudnn_adv_train.lib +0 -0
  44. nvidia/cudnn/lib/x64/cudnn_adv_train64_8.lib +0 -0
  45. nvidia/cudnn/lib/x64/cudnn_cnn_infer.lib +0 -0
  46. nvidia/cudnn/lib/x64/cudnn_cnn_infer64_8.lib +0 -0
  47. nvidia/cudnn/lib/x64/cudnn_cnn_train.lib +0 -0
  48. nvidia/cudnn/lib/x64/cudnn_cnn_train64_8.lib +0 -0
  49. nvidia/cudnn/lib/x64/cudnn_ops_infer.lib +0 -0
  50. nvidia/cudnn/lib/x64/cudnn_ops_infer64_8.lib +0 -0
  51. nvidia/cudnn/lib/x64/cudnn_ops_train.lib +0 -0
  52. nvidia/cudnn/lib/x64/cudnn_ops_train64_8.lib +0 -0
  53. nvidia_cudnn_cu12-8.9.7.29.dist-info/RECORD +0 -40
  54. {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/License.txt +0 -0
  55. {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/WHEEL +0 -0
  56. {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/top_level.txt +0 -0
@@ -48,26 +48,24 @@
48
48
  */
49
49
 
50
50
  /*
51
- * cudnn_cnn_infer : cuDNN's basic definitions and inference CNN functions.
51
+ * cudnn_cnn : cuDNN's basic definitions and CNN functions.
52
52
  */
53
53
 
54
- #if !defined(CUDNN_CNN_INFER_H_)
55
- #define CUDNN_CNN_INFER_H_
54
+ #if !defined(CUDNN_CNN_H_)
55
+ #define CUDNN_CNN_H_
56
56
 
57
57
  #pragma once
58
- #include <cuda_runtime.h>
59
58
  #include <stdint.h>
60
59
 
61
60
  #include "cudnn_version.h"
62
- #include "cudnn_ops_infer.h"
61
+ #include "cudnn_ops.h"
63
62
 
64
63
  /* These version numbers are autogenerated, do not edit manually. */
65
- #define CUDNN_CNN_INFER_MAJOR 8
66
- #define CUDNN_CNN_INFER_MINOR 9
67
- #define CUDNN_CNN_INFER_PATCH 7
64
+ #define CUDNN_CNN_MAJOR 9
65
+ #define CUDNN_CNN_MINOR 1
66
+ #define CUDNN_CNN_PATCH 0
68
67
 
69
- #if (CUDNN_CNN_INFER_MAJOR != CUDNN_MAJOR) || (CUDNN_CNN_INFER_MINOR != CUDNN_MINOR) || \
70
- (CUDNN_CNN_INFER_PATCH != CUDNN_PATCHLEVEL)
68
+ #if (CUDNN_CNN_MAJOR != CUDNN_MAJOR) || (CUDNN_CNN_MINOR != CUDNN_MINOR) || (CUDNN_CNN_PATCH != CUDNN_PATCHLEVEL)
71
69
  #error Version mismatch in cuDNN CNN INFER!!!
72
70
  #endif
73
71
 
@@ -75,20 +73,7 @@
75
73
  extern "C" {
76
74
  #endif
77
75
 
78
- typedef struct cudnnConvolutionStruct *cudnnConvolutionDescriptor_t;
79
-
80
- /*
81
- * convolution mode
82
- */
83
- typedef enum { CUDNN_CONVOLUTION = 0, CUDNN_CROSS_CORRELATION = 1 } cudnnConvolutionMode_t;
84
-
85
- /*
86
- * CUDNN Reorder
87
- */
88
- typedef enum {
89
- CUDNN_DEFAULT_REORDER = 0,
90
- CUDNN_NO_REORDER = 1,
91
- } cudnnReorderType_t;
76
+ typedef struct cudnnConvolutionStruct *cudnnConvolutionDescriptor_t CUDNN_DEPRECATED;
92
77
 
93
78
  typedef struct cudnnConvolutionFwdAlgoPerfStruct {
94
79
  cudnnConvolutionFwdAlgo_t algo;
@@ -98,35 +83,35 @@ typedef struct cudnnConvolutionFwdAlgoPerfStruct {
98
83
  cudnnDeterminism_t determinism;
99
84
  cudnnMathType_t mathType;
100
85
  int reserved[3];
101
- } cudnnConvolutionFwdAlgoPerf_t;
86
+ } cudnnConvolutionFwdAlgoPerf_t CUDNN_DEPRECATED;
102
87
 
103
88
  /* Create an instance of convolution descriptor */
104
- cudnnStatus_t CUDNNWINAPI
89
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
105
90
  cudnnCreateConvolutionDescriptor(cudnnConvolutionDescriptor_t *convDesc);
106
91
 
107
92
  /* Destroy an instance of convolution descriptor */
108
- cudnnStatus_t CUDNNWINAPI
93
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
109
94
  cudnnDestroyConvolutionDescriptor(cudnnConvolutionDescriptor_t convDesc);
110
95
 
111
- cudnnStatus_t CUDNNWINAPI
96
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
112
97
  cudnnSetConvolutionMathType(cudnnConvolutionDescriptor_t convDesc, cudnnMathType_t mathType);
113
98
 
114
- cudnnStatus_t CUDNNWINAPI
99
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
115
100
  cudnnGetConvolutionMathType(cudnnConvolutionDescriptor_t convDesc, cudnnMathType_t *mathType);
116
101
 
117
- cudnnStatus_t CUDNNWINAPI
102
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
118
103
  cudnnSetConvolutionGroupCount(cudnnConvolutionDescriptor_t convDesc, int groupCount);
119
104
 
120
- cudnnStatus_t CUDNNWINAPI
105
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
121
106
  cudnnGetConvolutionGroupCount(cudnnConvolutionDescriptor_t convDesc, int *groupCount);
122
107
 
123
- cudnnStatus_t CUDNNWINAPI
108
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
124
109
  cudnnSetConvolutionReorderType(cudnnConvolutionDescriptor_t convDesc, cudnnReorderType_t reorderType);
125
110
 
126
- cudnnStatus_t CUDNNWINAPI
111
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
127
112
  cudnnGetConvolutionReorderType(cudnnConvolutionDescriptor_t convDesc, cudnnReorderType_t *reorderType);
128
113
 
129
- cudnnStatus_t CUDNNWINAPI
114
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
130
115
  cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor_t convDesc,
131
116
  int pad_h, /* zero-padding height */
132
117
  int pad_w, /* zero-padding width */
@@ -137,7 +122,7 @@ cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor_t convDesc,
137
122
  cudnnConvolutionMode_t mode,
138
123
  cudnnDataType_t computeType);
139
124
 
140
- cudnnStatus_t CUDNNWINAPI
125
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
141
126
  cudnnGetConvolution2dDescriptor(const cudnnConvolutionDescriptor_t convDesc,
142
127
  int *pad_h, /* zero-padding height */
143
128
  int *pad_w, /* zero-padding width */
@@ -148,7 +133,7 @@ cudnnGetConvolution2dDescriptor(const cudnnConvolutionDescriptor_t convDesc,
148
133
  cudnnConvolutionMode_t *mode,
149
134
  cudnnDataType_t *computeType);
150
135
 
151
- cudnnStatus_t CUDNNWINAPI
136
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
152
137
  cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor_t convDesc,
153
138
  int arrayLength, /* nbDims-2 size */
154
139
  const int padA[],
@@ -158,7 +143,7 @@ cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor_t convDesc,
158
143
  cudnnDataType_t computeType); /* convolution data type */
159
144
 
160
145
  /* Helper function to return the dimensions of the output tensor given a convolution descriptor */
161
- cudnnStatus_t CUDNNWINAPI
146
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
162
147
  cudnnGetConvolutionNdDescriptor(const cudnnConvolutionDescriptor_t convDesc,
163
148
  int arrayLengthRequested,
164
149
  int *arrayLength,
@@ -168,7 +153,7 @@ cudnnGetConvolutionNdDescriptor(const cudnnConvolutionDescriptor_t convDesc,
168
153
  cudnnConvolutionMode_t *mode,
169
154
  cudnnDataType_t *computeType); /* convolution data type */
170
155
 
171
- cudnnStatus_t CUDNNWINAPI
156
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
172
157
  cudnnGetConvolution2dForwardOutputDim(const cudnnConvolutionDescriptor_t convDesc,
173
158
  const cudnnTensorDescriptor_t inputTensorDesc,
174
159
  const cudnnFilterDescriptor_t filterDesc,
@@ -178,7 +163,7 @@ cudnnGetConvolution2dForwardOutputDim(const cudnnConvolutionDescriptor_t convDes
178
163
  int *w);
179
164
 
180
165
  /* Helper function to return the dimensions of the output tensor given a convolution descriptor */
181
- cudnnStatus_t CUDNNWINAPI
166
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
182
167
  cudnnGetConvolutionNdForwardOutputDim(const cudnnConvolutionDescriptor_t convDesc,
183
168
  const cudnnTensorDescriptor_t inputTensorDesc,
184
169
  const cudnnFilterDescriptor_t filterDesc,
@@ -186,10 +171,10 @@ cudnnGetConvolutionNdForwardOutputDim(const cudnnConvolutionDescriptor_t convDes
186
171
  int tensorOuputDimA[]);
187
172
 
188
173
  /* helper function to provide the convolution forward algo that fit best the requirement */
189
- cudnnStatus_t CUDNNWINAPI
174
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
190
175
  cudnnGetConvolutionForwardAlgorithmMaxCount(cudnnHandle_t handle, int *count);
191
176
 
192
- cudnnStatus_t CUDNNWINAPI
177
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
193
178
  cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle_t handle,
194
179
  const cudnnTensorDescriptor_t srcDesc,
195
180
  const cudnnFilterDescriptor_t filterDesc,
@@ -199,7 +184,7 @@ cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle_t handle,
199
184
  int *returnedAlgoCount,
200
185
  cudnnConvolutionFwdAlgoPerf_t *perfResults);
201
186
 
202
- cudnnStatus_t CUDNNWINAPI
187
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
203
188
  cudnnFindConvolutionForwardAlgorithm(cudnnHandle_t handle,
204
189
  const cudnnTensorDescriptor_t xDesc,
205
190
  const cudnnFilterDescriptor_t wDesc,
@@ -209,7 +194,7 @@ cudnnFindConvolutionForwardAlgorithm(cudnnHandle_t handle,
209
194
  int *returnedAlgoCount,
210
195
  cudnnConvolutionFwdAlgoPerf_t *perfResults);
211
196
 
212
- cudnnStatus_t CUDNNWINAPI
197
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
213
198
  cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle_t handle,
214
199
  const cudnnTensorDescriptor_t xDesc,
215
200
  const void *x,
@@ -224,7 +209,7 @@ cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle_t handle,
224
209
  void *workSpace,
225
210
  size_t workSpaceSizeInBytes);
226
211
 
227
- cudnnStatus_t CUDNNWINAPI
212
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
228
213
  cudnnIm2Col(cudnnHandle_t handle,
229
214
  const cudnnTensorDescriptor_t xDesc,
230
215
  const void *x,
@@ -232,7 +217,7 @@ cudnnIm2Col(cudnnHandle_t handle,
232
217
  const cudnnConvolutionDescriptor_t convDesc,
233
218
  void *colBuffer);
234
219
 
235
- cudnnStatus_t CUDNNWINAPI
220
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
236
221
  cudnnReorderFilterAndBias(cudnnHandle_t handle,
237
222
  const cudnnFilterDescriptor_t filterDesc,
238
223
  cudnnReorderType_t reorderType,
@@ -243,7 +228,7 @@ cudnnReorderFilterAndBias(cudnnHandle_t handle,
243
228
  void *reorderedBiasData);
244
229
 
245
230
  /* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
246
- cudnnStatus_t CUDNNWINAPI
231
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
247
232
  cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle_t handle,
248
233
  const cudnnTensorDescriptor_t xDesc,
249
234
  const cudnnFilterDescriptor_t wDesc,
@@ -255,7 +240,7 @@ cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle_t handle,
255
240
  /* Convolution functions: All of the form "output = alpha * Op(inputs) + beta * output" */
256
241
 
257
242
  /* Function to perform the forward pass for batch convolution */
258
- cudnnStatus_t CUDNNWINAPI
243
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
259
244
  cudnnConvolutionForward(cudnnHandle_t handle,
260
245
  const void *alpha,
261
246
  const cudnnTensorDescriptor_t xDesc,
@@ -271,7 +256,7 @@ cudnnConvolutionForward(cudnnHandle_t handle,
271
256
  void *y);
272
257
 
273
258
  /* Fused conv/bias/activation operation : y = Act( alpha1 * conv(x) + alpha2 * z + bias ) */
274
- cudnnStatus_t CUDNNWINAPI
259
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
275
260
  cudnnConvolutionBiasActivationForward(cudnnHandle_t handle,
276
261
  const void *alpha1,
277
262
  const cudnnTensorDescriptor_t xDesc,
@@ -301,12 +286,12 @@ typedef struct cudnnConvolutionBwdDataAlgoPerfStruct {
301
286
  cudnnDeterminism_t determinism;
302
287
  cudnnMathType_t mathType;
303
288
  int reserved[3];
304
- } cudnnConvolutionBwdDataAlgoPerf_t;
289
+ } cudnnConvolutionBwdDataAlgoPerf_t CUDNN_DEPRECATED;
305
290
 
306
- cudnnStatus_t CUDNNWINAPI
291
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
307
292
  cudnnGetConvolutionBackwardDataAlgorithmMaxCount(cudnnHandle_t handle, int *count);
308
293
 
309
- cudnnStatus_t CUDNNWINAPI
294
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
310
295
  cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle_t handle,
311
296
  const cudnnFilterDescriptor_t wDesc,
312
297
  const cudnnTensorDescriptor_t dyDesc,
@@ -316,7 +301,7 @@ cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle_t handle,
316
301
  int *returnedAlgoCount,
317
302
  cudnnConvolutionBwdDataAlgoPerf_t *perfResults);
318
303
 
319
- cudnnStatus_t CUDNNWINAPI
304
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
320
305
  cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle_t handle,
321
306
  const cudnnFilterDescriptor_t wDesc,
322
307
  const void *w,
@@ -331,7 +316,7 @@ cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle_t handle,
331
316
  void *workSpace,
332
317
  size_t workSpaceSizeInBytes);
333
318
 
334
- cudnnStatus_t CUDNNWINAPI
319
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
335
320
  cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle_t handle,
336
321
  const cudnnFilterDescriptor_t filterDesc,
337
322
  const cudnnTensorDescriptor_t diffDesc,
@@ -346,7 +331,7 @@ cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle_t handle,
346
331
  */
347
332
 
348
333
  /* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
349
- cudnnStatus_t CUDNNWINAPI
334
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
350
335
  cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle_t handle,
351
336
  const cudnnFilterDescriptor_t wDesc,
352
337
  const cudnnTensorDescriptor_t dyDesc,
@@ -355,7 +340,7 @@ cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle_t handle,
355
340
  cudnnConvolutionBwdDataAlgo_t algo,
356
341
  size_t *sizeInBytes);
357
342
 
358
- cudnnStatus_t CUDNNWINAPI
343
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
359
344
  cudnnConvolutionBackwardData(cudnnHandle_t handle,
360
345
  const void *alpha,
361
346
  const cudnnFilterDescriptor_t wDesc,
@@ -371,7 +356,7 @@ cudnnConvolutionBackwardData(cudnnHandle_t handle,
371
356
  void *dx);
372
357
 
373
358
  /* Helper function to calculate folding descriptors for dgrad */
374
- cudnnStatus_t CUDNNWINAPI
359
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
375
360
  cudnnGetFoldedConvBackwardDataDescriptors(const cudnnHandle_t handle,
376
361
  const cudnnFilterDescriptor_t filterDesc,
377
362
  const cudnnTensorDescriptor_t diffDesc,
@@ -389,13 +374,13 @@ cudnnGetFoldedConvBackwardDataDescriptors(const cudnnHandle_t handle,
389
374
 
390
375
  /* cudnnFusedOps... */
391
376
  struct cudnnFusedOpsConstParamStruct;
392
- typedef struct cudnnFusedOpsConstParamStruct *cudnnFusedOpsConstParamPack_t;
377
+ typedef struct cudnnFusedOpsConstParamStruct *cudnnFusedOpsConstParamPack_t CUDNN_DEPRECATED;
393
378
 
394
379
  struct cudnnFusedOpsVariantParamStruct;
395
- typedef struct cudnnFusedOpsVariantParamStruct *cudnnFusedOpsVariantParamPack_t;
380
+ typedef struct cudnnFusedOpsVariantParamStruct *cudnnFusedOpsVariantParamPack_t CUDNN_DEPRECATED;
396
381
 
397
382
  struct cudnnFusedOpsPlanStruct;
398
- typedef struct cudnnFusedOpsPlanStruct *cudnnFusedOpsPlan_t;
383
+ typedef struct cudnnFusedOpsPlanStruct *cudnnFusedOpsPlan_t CUDNN_DEPRECATED;
399
384
 
400
385
  typedef enum {
401
386
  /* each op in [ ] can be disabled by passing NULL ptr */
@@ -416,7 +401,7 @@ typedef enum {
416
401
  CUDNN_FUSED_SCALE_BIAS_ADD_ACTIVATION_GEN_BITMASK = 5,
417
402
  /* reserved for future use */
418
403
  CUDNN_FUSED_DACTIVATION_FORK_DBATCHNORM = 6,
419
- } cudnnFusedOps_t;
404
+ } cudnnFusedOps_t CUDNN_DEPRECATED;
420
405
 
421
406
  typedef enum {
422
407
  /* set XDESC: pass previously initialized cudnnTensorDescriptor_t */
@@ -515,13 +500,13 @@ typedef enum {
515
500
  CUDNN_PARAM_BN_DSCALE_PLACEHOLDER = 37,
516
501
  /* set/get CUDNN_PARAM_BN_DBIAS_PLACEHOLDER: pass cudnnFusedOpsPointerPlaceHolder_t* */
517
502
  CUDNN_PARAM_BN_DBIAS_PLACEHOLDER = 38,
518
- } cudnnFusedOpsConstParamLabel_t;
503
+ } cudnnFusedOpsConstParamLabel_t CUDNN_DEPRECATED;
519
504
 
520
505
  typedef enum {
521
506
  CUDNN_PTR_NULL = 0,
522
507
  CUDNN_PTR_ELEM_ALIGNED = 1,
523
508
  CUDNN_PTR_16B_ALIGNED = 2,
524
- } cudnnFusedOpsPointerPlaceHolder_t;
509
+ } cudnnFusedOpsPointerPlaceHolder_t CUDNN_DEPRECATED;
525
510
 
526
511
  typedef enum {
527
512
  /* set: pass void* pointing to dev memory */
@@ -559,13 +544,150 @@ typedef enum {
559
544
  CUDNN_SCALAR_DOUBLE_BN_EXP_AVG_FACTOR = 102,
560
545
  /* set/get: pass double* pointing to host memory */
561
546
  CUDNN_SCALAR_DOUBLE_BN_EPSILON = 103,
562
- } cudnnFusedOpsVariantParamLabel_t;
547
+ } cudnnFusedOpsVariantParamLabel_t CUDNN_DEPRECATED;
563
548
 
564
549
  cudnnStatus_t CUDNNWINAPI
565
- cudnnCnnInferVersionCheck(void);
550
+ cudnnCnnVersionCheck(void);
551
+
552
+ /* helper function to provide the convolution backward filter algo that fit best the requirement */
553
+
554
+ typedef struct cudnnConvolutionBwdFilterAlgoPerfStruct {
555
+ cudnnConvolutionBwdFilterAlgo_t algo;
556
+ cudnnStatus_t status;
557
+ float time;
558
+ size_t memory;
559
+ cudnnDeterminism_t determinism;
560
+ cudnnMathType_t mathType;
561
+ int reserved[3];
562
+ } cudnnConvolutionBwdFilterAlgoPerf_t CUDNN_DEPRECATED;
563
+
564
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
565
+ cudnnGetConvolutionBackwardFilterAlgorithmMaxCount(cudnnHandle_t handle, int *count);
566
+
567
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
568
+ cudnnFindConvolutionBackwardFilterAlgorithm(cudnnHandle_t handle,
569
+ const cudnnTensorDescriptor_t xDesc,
570
+ const cudnnTensorDescriptor_t dyDesc,
571
+ const cudnnConvolutionDescriptor_t convDesc,
572
+ const cudnnFilterDescriptor_t dwDesc,
573
+ const int requestedAlgoCount,
574
+ int *returnedAlgoCount,
575
+ cudnnConvolutionBwdFilterAlgoPerf_t *perfResults);
576
+
577
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
578
+ cudnnFindConvolutionBackwardFilterAlgorithmEx(cudnnHandle_t handle,
579
+ const cudnnTensorDescriptor_t xDesc,
580
+ const void *x,
581
+ const cudnnTensorDescriptor_t dyDesc,
582
+ const void *y,
583
+ const cudnnConvolutionDescriptor_t convDesc,
584
+ const cudnnFilterDescriptor_t dwDesc,
585
+ void *dw,
586
+ const int requestedAlgoCount,
587
+ int *returnedAlgoCount,
588
+ cudnnConvolutionBwdFilterAlgoPerf_t *perfResults,
589
+ void *workSpace,
590
+ size_t workSpaceSizeInBytes);
591
+
592
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
593
+ cudnnGetConvolutionBackwardFilterAlgorithm_v7(cudnnHandle_t handle,
594
+ const cudnnTensorDescriptor_t srcDesc,
595
+ const cudnnTensorDescriptor_t diffDesc,
596
+ const cudnnConvolutionDescriptor_t convDesc,
597
+ const cudnnFilterDescriptor_t gradDesc,
598
+ const int requestedAlgoCount,
599
+ int *returnedAlgoCount,
600
+ cudnnConvolutionBwdFilterAlgoPerf_t *perfResults);
601
+
602
+ /*
603
+ * convolution algorithm (which requires potentially some workspace)
604
+ */
605
+
606
+ /* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
607
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
608
+ cudnnGetConvolutionBackwardFilterWorkspaceSize(cudnnHandle_t handle,
609
+ const cudnnTensorDescriptor_t xDesc,
610
+ const cudnnTensorDescriptor_t dyDesc,
611
+ const cudnnConvolutionDescriptor_t convDesc,
612
+ const cudnnFilterDescriptor_t gradDesc,
613
+ cudnnConvolutionBwdFilterAlgo_t algo,
614
+ size_t *sizeInBytes);
615
+
616
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
617
+ cudnnConvolutionBackwardFilter(cudnnHandle_t handle,
618
+ const void *alpha,
619
+ const cudnnTensorDescriptor_t xDesc,
620
+ const void *x,
621
+ const cudnnTensorDescriptor_t dyDesc,
622
+ const void *dy,
623
+ const cudnnConvolutionDescriptor_t convDesc,
624
+ cudnnConvolutionBwdFilterAlgo_t algo,
625
+ void *workSpace,
626
+ size_t workSpaceSizeInBytes,
627
+ const void *beta,
628
+ const cudnnFilterDescriptor_t dwDesc,
629
+ void *dw);
630
+
631
+ /* Function to compute the bias gradient for batch convolution */
632
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
633
+ cudnnConvolutionBackwardBias(cudnnHandle_t handle,
634
+ const void *alpha,
635
+ const cudnnTensorDescriptor_t dyDesc,
636
+ const void *dy,
637
+ const void *beta,
638
+ const cudnnTensorDescriptor_t dbDesc,
639
+ void *db);
640
+
641
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
642
+ cudnnCreateFusedOpsConstParamPack(cudnnFusedOpsConstParamPack_t *constPack, cudnnFusedOps_t ops);
643
+
644
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
645
+ cudnnDestroyFusedOpsConstParamPack(cudnnFusedOpsConstParamPack_t constPack);
646
+
647
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
648
+ cudnnSetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack_t constPack,
649
+ cudnnFusedOpsConstParamLabel_t paramLabel,
650
+ const void *param);
651
+
652
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
653
+ cudnnGetFusedOpsConstParamPackAttribute(const cudnnFusedOpsConstParamPack_t constPack,
654
+ cudnnFusedOpsConstParamLabel_t paramLabel,
655
+ void *param,
656
+ int *isNULL);
657
+
658
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
659
+ cudnnCreateFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack_t *varPack, cudnnFusedOps_t ops);
660
+
661
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
662
+ cudnnDestroyFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack_t varPack);
663
+
664
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
665
+ cudnnSetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack_t varPack,
666
+ cudnnFusedOpsVariantParamLabel_t paramLabel,
667
+ void *ptr);
668
+
669
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
670
+ cudnnGetFusedOpsVariantParamPackAttribute(const cudnnFusedOpsVariantParamPack_t varPack,
671
+ cudnnFusedOpsVariantParamLabel_t paramLabel,
672
+ void *ptr);
673
+
674
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
675
+ cudnnCreateFusedOpsPlan(cudnnFusedOpsPlan_t *plan, cudnnFusedOps_t ops);
676
+
677
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
678
+ cudnnDestroyFusedOpsPlan(cudnnFusedOpsPlan_t plan);
679
+
680
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
681
+ cudnnMakeFusedOpsPlan(cudnnHandle_t handle,
682
+ cudnnFusedOpsPlan_t plan,
683
+ const cudnnFusedOpsConstParamPack_t constPack,
684
+ size_t *workspaceSizeInBytes);
685
+
686
+ CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
687
+ cudnnFusedOpsExecute(cudnnHandle_t handle, const cudnnFusedOpsPlan_t plan, cudnnFusedOpsVariantParamPack_t varPack);
566
688
 
567
689
  #if defined(__cplusplus)
568
690
  }
569
691
  #endif
570
692
 
571
- #endif /* CUDNN_CNN_INFER_H_ */
693
+ #endif /* CUDNN_CNN_H_ */