nvidia-cudnn-cu12 8.9.7.29__py3-none-win_amd64.whl → 9.1.0.70__py3-none-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- nvidia/cudnn/bin/cudnn64_9.dll +0 -0
- nvidia/cudnn/bin/{cudnn_adv_infer64_8.dll → cudnn_adv64_9.dll} +0 -0
- nvidia/cudnn/bin/cudnn_cnn64_9.dll +0 -0
- nvidia/cudnn/bin/{cudnn_cnn_infer64_8.dll → cudnn_engines_precompiled64_9.dll} +0 -0
- nvidia/cudnn/bin/cudnn_engines_runtime_compiled64_9.dll +0 -0
- nvidia/cudnn/bin/cudnn_graph64_9.dll +0 -0
- nvidia/cudnn/bin/{cudnn_ops_infer64_8.dll → cudnn_heuristic64_9.dll} +0 -0
- nvidia/cudnn/bin/{cudnn_adv_train64_8.dll → cudnn_ops64_9.dll} +0 -0
- nvidia/cudnn/include/cudnn.h +8 -18
- nvidia/cudnn/include/{cudnn_adv_infer.h → cudnn_adv.h} +265 -252
- nvidia/cudnn/include/cudnn_backend.h +3 -558
- nvidia/cudnn/include/{cudnn_cnn_infer.h → cudnn_cnn.h} +187 -65
- nvidia/cudnn/include/cudnn_graph.h +909 -0
- nvidia/cudnn/include/{cudnn_ops_infer.h → cudnn_ops.h} +469 -336
- nvidia/cudnn/include/cudnn_version.h +4 -43
- nvidia/cudnn/lib/x64/cudnn.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_engines_precompiled.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_engines_precompiled64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_engines_runtime_compiled.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_engines_runtime_compiled64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_graph.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_graph64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_heuristic.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_heuristic64_9.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops64_9.lib +0 -0
- {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/METADATA +1 -1
- nvidia_cudnn_cu12-9.1.0.70.dist-info/RECORD +41 -0
- nvidia/cudnn/bin/cudnn64_8.dll +0 -0
- nvidia/cudnn/bin/cudnn_cnn_train64_8.dll +0 -0
- nvidia/cudnn/bin/cudnn_ops_train64_8.dll +0 -0
- nvidia/cudnn/include/cudnn_adv_train.h +0 -540
- nvidia/cudnn/include/cudnn_cnn_train.h +0 -219
- nvidia/cudnn/include/cudnn_ops_train.h +0 -501
- nvidia/cudnn/lib/x64/cudnn64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv_infer.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv_infer64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv_train.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_adv_train64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn_infer.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn_infer64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn_train.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_cnn_train64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops_infer.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops_infer64_8.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops_train.lib +0 -0
- nvidia/cudnn/lib/x64/cudnn_ops_train64_8.lib +0 -0
- nvidia_cudnn_cu12-8.9.7.29.dist-info/RECORD +0 -40
- {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/License.txt +0 -0
- {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/WHEEL +0 -0
- {nvidia_cudnn_cu12-8.9.7.29.dist-info → nvidia_cudnn_cu12-9.1.0.70.dist-info}/top_level.txt +0 -0
|
@@ -48,26 +48,24 @@
|
|
|
48
48
|
*/
|
|
49
49
|
|
|
50
50
|
/*
|
|
51
|
-
*
|
|
51
|
+
* cudnn_cnn : cuDNN's basic definitions and CNN functions.
|
|
52
52
|
*/
|
|
53
53
|
|
|
54
|
-
#if !defined(
|
|
55
|
-
#define
|
|
54
|
+
#if !defined(CUDNN_CNN_H_)
|
|
55
|
+
#define CUDNN_CNN_H_
|
|
56
56
|
|
|
57
57
|
#pragma once
|
|
58
|
-
#include <cuda_runtime.h>
|
|
59
58
|
#include <stdint.h>
|
|
60
59
|
|
|
61
60
|
#include "cudnn_version.h"
|
|
62
|
-
#include "
|
|
61
|
+
#include "cudnn_ops.h"
|
|
63
62
|
|
|
64
63
|
/* These version numbers are autogenerated, do not edit manually. */
|
|
65
|
-
#define
|
|
66
|
-
#define
|
|
67
|
-
#define
|
|
64
|
+
#define CUDNN_CNN_MAJOR 9
|
|
65
|
+
#define CUDNN_CNN_MINOR 1
|
|
66
|
+
#define CUDNN_CNN_PATCH 0
|
|
68
67
|
|
|
69
|
-
#if (
|
|
70
|
-
(CUDNN_CNN_INFER_PATCH != CUDNN_PATCHLEVEL)
|
|
68
|
+
#if (CUDNN_CNN_MAJOR != CUDNN_MAJOR) || (CUDNN_CNN_MINOR != CUDNN_MINOR) || (CUDNN_CNN_PATCH != CUDNN_PATCHLEVEL)
|
|
71
69
|
#error Version mismatch in cuDNN CNN INFER!!!
|
|
72
70
|
#endif
|
|
73
71
|
|
|
@@ -75,20 +73,7 @@
|
|
|
75
73
|
extern "C" {
|
|
76
74
|
#endif
|
|
77
75
|
|
|
78
|
-
typedef struct cudnnConvolutionStruct *cudnnConvolutionDescriptor_t;
|
|
79
|
-
|
|
80
|
-
/*
|
|
81
|
-
* convolution mode
|
|
82
|
-
*/
|
|
83
|
-
typedef enum { CUDNN_CONVOLUTION = 0, CUDNN_CROSS_CORRELATION = 1 } cudnnConvolutionMode_t;
|
|
84
|
-
|
|
85
|
-
/*
|
|
86
|
-
* CUDNN Reorder
|
|
87
|
-
*/
|
|
88
|
-
typedef enum {
|
|
89
|
-
CUDNN_DEFAULT_REORDER = 0,
|
|
90
|
-
CUDNN_NO_REORDER = 1,
|
|
91
|
-
} cudnnReorderType_t;
|
|
76
|
+
typedef struct cudnnConvolutionStruct *cudnnConvolutionDescriptor_t CUDNN_DEPRECATED;
|
|
92
77
|
|
|
93
78
|
typedef struct cudnnConvolutionFwdAlgoPerfStruct {
|
|
94
79
|
cudnnConvolutionFwdAlgo_t algo;
|
|
@@ -98,35 +83,35 @@ typedef struct cudnnConvolutionFwdAlgoPerfStruct {
|
|
|
98
83
|
cudnnDeterminism_t determinism;
|
|
99
84
|
cudnnMathType_t mathType;
|
|
100
85
|
int reserved[3];
|
|
101
|
-
} cudnnConvolutionFwdAlgoPerf_t;
|
|
86
|
+
} cudnnConvolutionFwdAlgoPerf_t CUDNN_DEPRECATED;
|
|
102
87
|
|
|
103
88
|
/* Create an instance of convolution descriptor */
|
|
104
|
-
cudnnStatus_t CUDNNWINAPI
|
|
89
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
105
90
|
cudnnCreateConvolutionDescriptor(cudnnConvolutionDescriptor_t *convDesc);
|
|
106
91
|
|
|
107
92
|
/* Destroy an instance of convolution descriptor */
|
|
108
|
-
cudnnStatus_t CUDNNWINAPI
|
|
93
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
109
94
|
cudnnDestroyConvolutionDescriptor(cudnnConvolutionDescriptor_t convDesc);
|
|
110
95
|
|
|
111
|
-
cudnnStatus_t CUDNNWINAPI
|
|
96
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
112
97
|
cudnnSetConvolutionMathType(cudnnConvolutionDescriptor_t convDesc, cudnnMathType_t mathType);
|
|
113
98
|
|
|
114
|
-
cudnnStatus_t CUDNNWINAPI
|
|
99
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
115
100
|
cudnnGetConvolutionMathType(cudnnConvolutionDescriptor_t convDesc, cudnnMathType_t *mathType);
|
|
116
101
|
|
|
117
|
-
cudnnStatus_t CUDNNWINAPI
|
|
102
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
118
103
|
cudnnSetConvolutionGroupCount(cudnnConvolutionDescriptor_t convDesc, int groupCount);
|
|
119
104
|
|
|
120
|
-
cudnnStatus_t CUDNNWINAPI
|
|
105
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
121
106
|
cudnnGetConvolutionGroupCount(cudnnConvolutionDescriptor_t convDesc, int *groupCount);
|
|
122
107
|
|
|
123
|
-
cudnnStatus_t CUDNNWINAPI
|
|
108
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
124
109
|
cudnnSetConvolutionReorderType(cudnnConvolutionDescriptor_t convDesc, cudnnReorderType_t reorderType);
|
|
125
110
|
|
|
126
|
-
cudnnStatus_t CUDNNWINAPI
|
|
111
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
127
112
|
cudnnGetConvolutionReorderType(cudnnConvolutionDescriptor_t convDesc, cudnnReorderType_t *reorderType);
|
|
128
113
|
|
|
129
|
-
cudnnStatus_t CUDNNWINAPI
|
|
114
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
130
115
|
cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor_t convDesc,
|
|
131
116
|
int pad_h, /* zero-padding height */
|
|
132
117
|
int pad_w, /* zero-padding width */
|
|
@@ -137,7 +122,7 @@ cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor_t convDesc,
|
|
|
137
122
|
cudnnConvolutionMode_t mode,
|
|
138
123
|
cudnnDataType_t computeType);
|
|
139
124
|
|
|
140
|
-
cudnnStatus_t CUDNNWINAPI
|
|
125
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
141
126
|
cudnnGetConvolution2dDescriptor(const cudnnConvolutionDescriptor_t convDesc,
|
|
142
127
|
int *pad_h, /* zero-padding height */
|
|
143
128
|
int *pad_w, /* zero-padding width */
|
|
@@ -148,7 +133,7 @@ cudnnGetConvolution2dDescriptor(const cudnnConvolutionDescriptor_t convDesc,
|
|
|
148
133
|
cudnnConvolutionMode_t *mode,
|
|
149
134
|
cudnnDataType_t *computeType);
|
|
150
135
|
|
|
151
|
-
cudnnStatus_t CUDNNWINAPI
|
|
136
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
152
137
|
cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor_t convDesc,
|
|
153
138
|
int arrayLength, /* nbDims-2 size */
|
|
154
139
|
const int padA[],
|
|
@@ -158,7 +143,7 @@ cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor_t convDesc,
|
|
|
158
143
|
cudnnDataType_t computeType); /* convolution data type */
|
|
159
144
|
|
|
160
145
|
/* Helper function to return the dimensions of the output tensor given a convolution descriptor */
|
|
161
|
-
cudnnStatus_t CUDNNWINAPI
|
|
146
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
162
147
|
cudnnGetConvolutionNdDescriptor(const cudnnConvolutionDescriptor_t convDesc,
|
|
163
148
|
int arrayLengthRequested,
|
|
164
149
|
int *arrayLength,
|
|
@@ -168,7 +153,7 @@ cudnnGetConvolutionNdDescriptor(const cudnnConvolutionDescriptor_t convDesc,
|
|
|
168
153
|
cudnnConvolutionMode_t *mode,
|
|
169
154
|
cudnnDataType_t *computeType); /* convolution data type */
|
|
170
155
|
|
|
171
|
-
cudnnStatus_t CUDNNWINAPI
|
|
156
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
172
157
|
cudnnGetConvolution2dForwardOutputDim(const cudnnConvolutionDescriptor_t convDesc,
|
|
173
158
|
const cudnnTensorDescriptor_t inputTensorDesc,
|
|
174
159
|
const cudnnFilterDescriptor_t filterDesc,
|
|
@@ -178,7 +163,7 @@ cudnnGetConvolution2dForwardOutputDim(const cudnnConvolutionDescriptor_t convDes
|
|
|
178
163
|
int *w);
|
|
179
164
|
|
|
180
165
|
/* Helper function to return the dimensions of the output tensor given a convolution descriptor */
|
|
181
|
-
cudnnStatus_t CUDNNWINAPI
|
|
166
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
182
167
|
cudnnGetConvolutionNdForwardOutputDim(const cudnnConvolutionDescriptor_t convDesc,
|
|
183
168
|
const cudnnTensorDescriptor_t inputTensorDesc,
|
|
184
169
|
const cudnnFilterDescriptor_t filterDesc,
|
|
@@ -186,10 +171,10 @@ cudnnGetConvolutionNdForwardOutputDim(const cudnnConvolutionDescriptor_t convDes
|
|
|
186
171
|
int tensorOuputDimA[]);
|
|
187
172
|
|
|
188
173
|
/* helper function to provide the convolution forward algo that fit best the requirement */
|
|
189
|
-
cudnnStatus_t CUDNNWINAPI
|
|
174
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
190
175
|
cudnnGetConvolutionForwardAlgorithmMaxCount(cudnnHandle_t handle, int *count);
|
|
191
176
|
|
|
192
|
-
cudnnStatus_t CUDNNWINAPI
|
|
177
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
193
178
|
cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle_t handle,
|
|
194
179
|
const cudnnTensorDescriptor_t srcDesc,
|
|
195
180
|
const cudnnFilterDescriptor_t filterDesc,
|
|
@@ -199,7 +184,7 @@ cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle_t handle,
|
|
|
199
184
|
int *returnedAlgoCount,
|
|
200
185
|
cudnnConvolutionFwdAlgoPerf_t *perfResults);
|
|
201
186
|
|
|
202
|
-
cudnnStatus_t CUDNNWINAPI
|
|
187
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
203
188
|
cudnnFindConvolutionForwardAlgorithm(cudnnHandle_t handle,
|
|
204
189
|
const cudnnTensorDescriptor_t xDesc,
|
|
205
190
|
const cudnnFilterDescriptor_t wDesc,
|
|
@@ -209,7 +194,7 @@ cudnnFindConvolutionForwardAlgorithm(cudnnHandle_t handle,
|
|
|
209
194
|
int *returnedAlgoCount,
|
|
210
195
|
cudnnConvolutionFwdAlgoPerf_t *perfResults);
|
|
211
196
|
|
|
212
|
-
cudnnStatus_t CUDNNWINAPI
|
|
197
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
213
198
|
cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle_t handle,
|
|
214
199
|
const cudnnTensorDescriptor_t xDesc,
|
|
215
200
|
const void *x,
|
|
@@ -224,7 +209,7 @@ cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle_t handle,
|
|
|
224
209
|
void *workSpace,
|
|
225
210
|
size_t workSpaceSizeInBytes);
|
|
226
211
|
|
|
227
|
-
cudnnStatus_t CUDNNWINAPI
|
|
212
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
228
213
|
cudnnIm2Col(cudnnHandle_t handle,
|
|
229
214
|
const cudnnTensorDescriptor_t xDesc,
|
|
230
215
|
const void *x,
|
|
@@ -232,7 +217,7 @@ cudnnIm2Col(cudnnHandle_t handle,
|
|
|
232
217
|
const cudnnConvolutionDescriptor_t convDesc,
|
|
233
218
|
void *colBuffer);
|
|
234
219
|
|
|
235
|
-
cudnnStatus_t CUDNNWINAPI
|
|
220
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
236
221
|
cudnnReorderFilterAndBias(cudnnHandle_t handle,
|
|
237
222
|
const cudnnFilterDescriptor_t filterDesc,
|
|
238
223
|
cudnnReorderType_t reorderType,
|
|
@@ -243,7 +228,7 @@ cudnnReorderFilterAndBias(cudnnHandle_t handle,
|
|
|
243
228
|
void *reorderedBiasData);
|
|
244
229
|
|
|
245
230
|
/* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
|
|
246
|
-
cudnnStatus_t CUDNNWINAPI
|
|
231
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
247
232
|
cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle_t handle,
|
|
248
233
|
const cudnnTensorDescriptor_t xDesc,
|
|
249
234
|
const cudnnFilterDescriptor_t wDesc,
|
|
@@ -255,7 +240,7 @@ cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle_t handle,
|
|
|
255
240
|
/* Convolution functions: All of the form "output = alpha * Op(inputs) + beta * output" */
|
|
256
241
|
|
|
257
242
|
/* Function to perform the forward pass for batch convolution */
|
|
258
|
-
cudnnStatus_t CUDNNWINAPI
|
|
243
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
259
244
|
cudnnConvolutionForward(cudnnHandle_t handle,
|
|
260
245
|
const void *alpha,
|
|
261
246
|
const cudnnTensorDescriptor_t xDesc,
|
|
@@ -271,7 +256,7 @@ cudnnConvolutionForward(cudnnHandle_t handle,
|
|
|
271
256
|
void *y);
|
|
272
257
|
|
|
273
258
|
/* Fused conv/bias/activation operation : y = Act( alpha1 * conv(x) + alpha2 * z + bias ) */
|
|
274
|
-
cudnnStatus_t CUDNNWINAPI
|
|
259
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
275
260
|
cudnnConvolutionBiasActivationForward(cudnnHandle_t handle,
|
|
276
261
|
const void *alpha1,
|
|
277
262
|
const cudnnTensorDescriptor_t xDesc,
|
|
@@ -301,12 +286,12 @@ typedef struct cudnnConvolutionBwdDataAlgoPerfStruct {
|
|
|
301
286
|
cudnnDeterminism_t determinism;
|
|
302
287
|
cudnnMathType_t mathType;
|
|
303
288
|
int reserved[3];
|
|
304
|
-
} cudnnConvolutionBwdDataAlgoPerf_t;
|
|
289
|
+
} cudnnConvolutionBwdDataAlgoPerf_t CUDNN_DEPRECATED;
|
|
305
290
|
|
|
306
|
-
cudnnStatus_t CUDNNWINAPI
|
|
291
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
307
292
|
cudnnGetConvolutionBackwardDataAlgorithmMaxCount(cudnnHandle_t handle, int *count);
|
|
308
293
|
|
|
309
|
-
cudnnStatus_t CUDNNWINAPI
|
|
294
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
310
295
|
cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle_t handle,
|
|
311
296
|
const cudnnFilterDescriptor_t wDesc,
|
|
312
297
|
const cudnnTensorDescriptor_t dyDesc,
|
|
@@ -316,7 +301,7 @@ cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle_t handle,
|
|
|
316
301
|
int *returnedAlgoCount,
|
|
317
302
|
cudnnConvolutionBwdDataAlgoPerf_t *perfResults);
|
|
318
303
|
|
|
319
|
-
cudnnStatus_t CUDNNWINAPI
|
|
304
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
320
305
|
cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle_t handle,
|
|
321
306
|
const cudnnFilterDescriptor_t wDesc,
|
|
322
307
|
const void *w,
|
|
@@ -331,7 +316,7 @@ cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle_t handle,
|
|
|
331
316
|
void *workSpace,
|
|
332
317
|
size_t workSpaceSizeInBytes);
|
|
333
318
|
|
|
334
|
-
cudnnStatus_t CUDNNWINAPI
|
|
319
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
335
320
|
cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle_t handle,
|
|
336
321
|
const cudnnFilterDescriptor_t filterDesc,
|
|
337
322
|
const cudnnTensorDescriptor_t diffDesc,
|
|
@@ -346,7 +331,7 @@ cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle_t handle,
|
|
|
346
331
|
*/
|
|
347
332
|
|
|
348
333
|
/* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
|
|
349
|
-
cudnnStatus_t CUDNNWINAPI
|
|
334
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
350
335
|
cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle_t handle,
|
|
351
336
|
const cudnnFilterDescriptor_t wDesc,
|
|
352
337
|
const cudnnTensorDescriptor_t dyDesc,
|
|
@@ -355,7 +340,7 @@ cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle_t handle,
|
|
|
355
340
|
cudnnConvolutionBwdDataAlgo_t algo,
|
|
356
341
|
size_t *sizeInBytes);
|
|
357
342
|
|
|
358
|
-
cudnnStatus_t CUDNNWINAPI
|
|
343
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
359
344
|
cudnnConvolutionBackwardData(cudnnHandle_t handle,
|
|
360
345
|
const void *alpha,
|
|
361
346
|
const cudnnFilterDescriptor_t wDesc,
|
|
@@ -371,7 +356,7 @@ cudnnConvolutionBackwardData(cudnnHandle_t handle,
|
|
|
371
356
|
void *dx);
|
|
372
357
|
|
|
373
358
|
/* Helper function to calculate folding descriptors for dgrad */
|
|
374
|
-
cudnnStatus_t CUDNNWINAPI
|
|
359
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
375
360
|
cudnnGetFoldedConvBackwardDataDescriptors(const cudnnHandle_t handle,
|
|
376
361
|
const cudnnFilterDescriptor_t filterDesc,
|
|
377
362
|
const cudnnTensorDescriptor_t diffDesc,
|
|
@@ -389,13 +374,13 @@ cudnnGetFoldedConvBackwardDataDescriptors(const cudnnHandle_t handle,
|
|
|
389
374
|
|
|
390
375
|
/* cudnnFusedOps... */
|
|
391
376
|
struct cudnnFusedOpsConstParamStruct;
|
|
392
|
-
typedef struct cudnnFusedOpsConstParamStruct *cudnnFusedOpsConstParamPack_t;
|
|
377
|
+
typedef struct cudnnFusedOpsConstParamStruct *cudnnFusedOpsConstParamPack_t CUDNN_DEPRECATED;
|
|
393
378
|
|
|
394
379
|
struct cudnnFusedOpsVariantParamStruct;
|
|
395
|
-
typedef struct cudnnFusedOpsVariantParamStruct *cudnnFusedOpsVariantParamPack_t;
|
|
380
|
+
typedef struct cudnnFusedOpsVariantParamStruct *cudnnFusedOpsVariantParamPack_t CUDNN_DEPRECATED;
|
|
396
381
|
|
|
397
382
|
struct cudnnFusedOpsPlanStruct;
|
|
398
|
-
typedef struct cudnnFusedOpsPlanStruct *cudnnFusedOpsPlan_t;
|
|
383
|
+
typedef struct cudnnFusedOpsPlanStruct *cudnnFusedOpsPlan_t CUDNN_DEPRECATED;
|
|
399
384
|
|
|
400
385
|
typedef enum {
|
|
401
386
|
/* each op in [ ] can be disabled by passing NULL ptr */
|
|
@@ -416,7 +401,7 @@ typedef enum {
|
|
|
416
401
|
CUDNN_FUSED_SCALE_BIAS_ADD_ACTIVATION_GEN_BITMASK = 5,
|
|
417
402
|
/* reserved for future use */
|
|
418
403
|
CUDNN_FUSED_DACTIVATION_FORK_DBATCHNORM = 6,
|
|
419
|
-
} cudnnFusedOps_t;
|
|
404
|
+
} cudnnFusedOps_t CUDNN_DEPRECATED;
|
|
420
405
|
|
|
421
406
|
typedef enum {
|
|
422
407
|
/* set XDESC: pass previously initialized cudnnTensorDescriptor_t */
|
|
@@ -515,13 +500,13 @@ typedef enum {
|
|
|
515
500
|
CUDNN_PARAM_BN_DSCALE_PLACEHOLDER = 37,
|
|
516
501
|
/* set/get CUDNN_PARAM_BN_DBIAS_PLACEHOLDER: pass cudnnFusedOpsPointerPlaceHolder_t* */
|
|
517
502
|
CUDNN_PARAM_BN_DBIAS_PLACEHOLDER = 38,
|
|
518
|
-
} cudnnFusedOpsConstParamLabel_t;
|
|
503
|
+
} cudnnFusedOpsConstParamLabel_t CUDNN_DEPRECATED;
|
|
519
504
|
|
|
520
505
|
typedef enum {
|
|
521
506
|
CUDNN_PTR_NULL = 0,
|
|
522
507
|
CUDNN_PTR_ELEM_ALIGNED = 1,
|
|
523
508
|
CUDNN_PTR_16B_ALIGNED = 2,
|
|
524
|
-
} cudnnFusedOpsPointerPlaceHolder_t;
|
|
509
|
+
} cudnnFusedOpsPointerPlaceHolder_t CUDNN_DEPRECATED;
|
|
525
510
|
|
|
526
511
|
typedef enum {
|
|
527
512
|
/* set: pass void* pointing to dev memory */
|
|
@@ -559,13 +544,150 @@ typedef enum {
|
|
|
559
544
|
CUDNN_SCALAR_DOUBLE_BN_EXP_AVG_FACTOR = 102,
|
|
560
545
|
/* set/get: pass double* pointing to host memory */
|
|
561
546
|
CUDNN_SCALAR_DOUBLE_BN_EPSILON = 103,
|
|
562
|
-
} cudnnFusedOpsVariantParamLabel_t;
|
|
547
|
+
} cudnnFusedOpsVariantParamLabel_t CUDNN_DEPRECATED;
|
|
563
548
|
|
|
564
549
|
cudnnStatus_t CUDNNWINAPI
|
|
565
|
-
|
|
550
|
+
cudnnCnnVersionCheck(void);
|
|
551
|
+
|
|
552
|
+
/* helper function to provide the convolution backward filter algo that fit best the requirement */
|
|
553
|
+
|
|
554
|
+
typedef struct cudnnConvolutionBwdFilterAlgoPerfStruct {
|
|
555
|
+
cudnnConvolutionBwdFilterAlgo_t algo;
|
|
556
|
+
cudnnStatus_t status;
|
|
557
|
+
float time;
|
|
558
|
+
size_t memory;
|
|
559
|
+
cudnnDeterminism_t determinism;
|
|
560
|
+
cudnnMathType_t mathType;
|
|
561
|
+
int reserved[3];
|
|
562
|
+
} cudnnConvolutionBwdFilterAlgoPerf_t CUDNN_DEPRECATED;
|
|
563
|
+
|
|
564
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
565
|
+
cudnnGetConvolutionBackwardFilterAlgorithmMaxCount(cudnnHandle_t handle, int *count);
|
|
566
|
+
|
|
567
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
568
|
+
cudnnFindConvolutionBackwardFilterAlgorithm(cudnnHandle_t handle,
|
|
569
|
+
const cudnnTensorDescriptor_t xDesc,
|
|
570
|
+
const cudnnTensorDescriptor_t dyDesc,
|
|
571
|
+
const cudnnConvolutionDescriptor_t convDesc,
|
|
572
|
+
const cudnnFilterDescriptor_t dwDesc,
|
|
573
|
+
const int requestedAlgoCount,
|
|
574
|
+
int *returnedAlgoCount,
|
|
575
|
+
cudnnConvolutionBwdFilterAlgoPerf_t *perfResults);
|
|
576
|
+
|
|
577
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
578
|
+
cudnnFindConvolutionBackwardFilterAlgorithmEx(cudnnHandle_t handle,
|
|
579
|
+
const cudnnTensorDescriptor_t xDesc,
|
|
580
|
+
const void *x,
|
|
581
|
+
const cudnnTensorDescriptor_t dyDesc,
|
|
582
|
+
const void *y,
|
|
583
|
+
const cudnnConvolutionDescriptor_t convDesc,
|
|
584
|
+
const cudnnFilterDescriptor_t dwDesc,
|
|
585
|
+
void *dw,
|
|
586
|
+
const int requestedAlgoCount,
|
|
587
|
+
int *returnedAlgoCount,
|
|
588
|
+
cudnnConvolutionBwdFilterAlgoPerf_t *perfResults,
|
|
589
|
+
void *workSpace,
|
|
590
|
+
size_t workSpaceSizeInBytes);
|
|
591
|
+
|
|
592
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
593
|
+
cudnnGetConvolutionBackwardFilterAlgorithm_v7(cudnnHandle_t handle,
|
|
594
|
+
const cudnnTensorDescriptor_t srcDesc,
|
|
595
|
+
const cudnnTensorDescriptor_t diffDesc,
|
|
596
|
+
const cudnnConvolutionDescriptor_t convDesc,
|
|
597
|
+
const cudnnFilterDescriptor_t gradDesc,
|
|
598
|
+
const int requestedAlgoCount,
|
|
599
|
+
int *returnedAlgoCount,
|
|
600
|
+
cudnnConvolutionBwdFilterAlgoPerf_t *perfResults);
|
|
601
|
+
|
|
602
|
+
/*
|
|
603
|
+
* convolution algorithm (which requires potentially some workspace)
|
|
604
|
+
*/
|
|
605
|
+
|
|
606
|
+
/* Helper function to return the minimum size of the workspace to be passed to the convolution given an algo*/
|
|
607
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
608
|
+
cudnnGetConvolutionBackwardFilterWorkspaceSize(cudnnHandle_t handle,
|
|
609
|
+
const cudnnTensorDescriptor_t xDesc,
|
|
610
|
+
const cudnnTensorDescriptor_t dyDesc,
|
|
611
|
+
const cudnnConvolutionDescriptor_t convDesc,
|
|
612
|
+
const cudnnFilterDescriptor_t gradDesc,
|
|
613
|
+
cudnnConvolutionBwdFilterAlgo_t algo,
|
|
614
|
+
size_t *sizeInBytes);
|
|
615
|
+
|
|
616
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
617
|
+
cudnnConvolutionBackwardFilter(cudnnHandle_t handle,
|
|
618
|
+
const void *alpha,
|
|
619
|
+
const cudnnTensorDescriptor_t xDesc,
|
|
620
|
+
const void *x,
|
|
621
|
+
const cudnnTensorDescriptor_t dyDesc,
|
|
622
|
+
const void *dy,
|
|
623
|
+
const cudnnConvolutionDescriptor_t convDesc,
|
|
624
|
+
cudnnConvolutionBwdFilterAlgo_t algo,
|
|
625
|
+
void *workSpace,
|
|
626
|
+
size_t workSpaceSizeInBytes,
|
|
627
|
+
const void *beta,
|
|
628
|
+
const cudnnFilterDescriptor_t dwDesc,
|
|
629
|
+
void *dw);
|
|
630
|
+
|
|
631
|
+
/* Function to compute the bias gradient for batch convolution */
|
|
632
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
633
|
+
cudnnConvolutionBackwardBias(cudnnHandle_t handle,
|
|
634
|
+
const void *alpha,
|
|
635
|
+
const cudnnTensorDescriptor_t dyDesc,
|
|
636
|
+
const void *dy,
|
|
637
|
+
const void *beta,
|
|
638
|
+
const cudnnTensorDescriptor_t dbDesc,
|
|
639
|
+
void *db);
|
|
640
|
+
|
|
641
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
642
|
+
cudnnCreateFusedOpsConstParamPack(cudnnFusedOpsConstParamPack_t *constPack, cudnnFusedOps_t ops);
|
|
643
|
+
|
|
644
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
645
|
+
cudnnDestroyFusedOpsConstParamPack(cudnnFusedOpsConstParamPack_t constPack);
|
|
646
|
+
|
|
647
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
648
|
+
cudnnSetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack_t constPack,
|
|
649
|
+
cudnnFusedOpsConstParamLabel_t paramLabel,
|
|
650
|
+
const void *param);
|
|
651
|
+
|
|
652
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
653
|
+
cudnnGetFusedOpsConstParamPackAttribute(const cudnnFusedOpsConstParamPack_t constPack,
|
|
654
|
+
cudnnFusedOpsConstParamLabel_t paramLabel,
|
|
655
|
+
void *param,
|
|
656
|
+
int *isNULL);
|
|
657
|
+
|
|
658
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
659
|
+
cudnnCreateFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack_t *varPack, cudnnFusedOps_t ops);
|
|
660
|
+
|
|
661
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
662
|
+
cudnnDestroyFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack_t varPack);
|
|
663
|
+
|
|
664
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
665
|
+
cudnnSetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack_t varPack,
|
|
666
|
+
cudnnFusedOpsVariantParamLabel_t paramLabel,
|
|
667
|
+
void *ptr);
|
|
668
|
+
|
|
669
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
670
|
+
cudnnGetFusedOpsVariantParamPackAttribute(const cudnnFusedOpsVariantParamPack_t varPack,
|
|
671
|
+
cudnnFusedOpsVariantParamLabel_t paramLabel,
|
|
672
|
+
void *ptr);
|
|
673
|
+
|
|
674
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
675
|
+
cudnnCreateFusedOpsPlan(cudnnFusedOpsPlan_t *plan, cudnnFusedOps_t ops);
|
|
676
|
+
|
|
677
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
678
|
+
cudnnDestroyFusedOpsPlan(cudnnFusedOpsPlan_t plan);
|
|
679
|
+
|
|
680
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
681
|
+
cudnnMakeFusedOpsPlan(cudnnHandle_t handle,
|
|
682
|
+
cudnnFusedOpsPlan_t plan,
|
|
683
|
+
const cudnnFusedOpsConstParamPack_t constPack,
|
|
684
|
+
size_t *workspaceSizeInBytes);
|
|
685
|
+
|
|
686
|
+
CUDNN_DEPRECATED cudnnStatus_t CUDNNWINAPI
|
|
687
|
+
cudnnFusedOpsExecute(cudnnHandle_t handle, const cudnnFusedOpsPlan_t plan, cudnnFusedOpsVariantParamPack_t varPack);
|
|
566
688
|
|
|
567
689
|
#if defined(__cplusplus)
|
|
568
690
|
}
|
|
569
691
|
#endif
|
|
570
692
|
|
|
571
|
-
#endif /*
|
|
693
|
+
#endif /* CUDNN_CNN_H_ */
|