public class JCudnn extends Object
Modifier and Type | Field and Description |
---|---|
static int |
CUDNN_ATTN_DISABLE_PROJ_BIASES
Multi-head attention modes set in attention descriptor:
no biases in attention input and output projections
|
static int |
CUDNN_ATTN_ENABLE_PROJ_BIASES
Multi-head attention modes set in attention descriptor:
use biases in attention input and output projections
|
static int |
CUDNN_ATTN_QUERYMAP_ALL_TO_ONE
Multi-head attention modes set in attention descriptor:
multiple Q-s map to a single (K,V) set when beam size > 1
|
static int |
CUDNN_ATTN_QUERYMAP_ONE_TO_ONE
Multi-head attention modes set in attention descriptor:
multiple Q-s map to multiple (K,V) sets when beam size > 1
|
static int |
CUDNN_ATTN_WKIND_COUNT
Number of attention weight/bias tensors
|
static double |
CUDNN_BN_MIN_EPSILON
Minimum epsilon allowed to be used in the Batch Normalization formula
|
static int |
CUDNN_DIM_MAX
Maximum supported number of tensor dimensions
|
static int |
CUDNN_MAJOR |
static int |
CUDNN_MINOR |
static int |
CUDNN_PATCHLEVEL |
static int |
CUDNN_SEV_ERROR_EN
Message masks to be used with cudnnSetCallback()
|
static int |
CUDNN_SEV_INFO_EN |
static int |
CUDNN_SEV_WARNING_EN |
static int |
CUDNN_VERSION |
Modifier and Type | Method and Description |
---|---|
static int |
cudnnActivationBackward(cudnnHandle handle,
cudnnActivationDescriptor activationDesc,
Pointer alpha,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx)
Function to perform backward activation
|
static int |
cudnnActivationForward(cudnnHandle handle,
cudnnActivationDescriptor activationDesc,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
Function to perform forward activation
|
static int |
cudnnAddTensor(cudnnHandle handle,
Pointer alpha,
cudnnTensorDescriptor aDesc,
Pointer A,
Pointer beta,
cudnnTensorDescriptor cDesc,
Pointer C)
Tensor Bias addition : C = alpha * A + beta * C
|
static int |
cudnnAdvInferVersionCheck()
Cross-library version checker.
|
static int |
cudnnAdvTrainVersionCheck()
Cross-library version checker.
|
static int |
cudnnBackendCreateDescriptor(int descriptorType,
cudnnBackendDescriptor descriptor) |
static int |
cudnnBackendDestroyDescriptor(cudnnBackendDescriptor descriptor) |
static int |
cudnnBackendExecute(cudnnHandle handle,
cudnnBackendDescriptor executionPlan,
cudnnBackendDescriptor variantPack) |
static int |
cudnnBackendFinalize(cudnnBackendDescriptor descriptor) |
static int |
cudnnBackendGetAttribute(cudnnBackendDescriptor descriptor,
int attributeName,
int attributeType,
long requestedElementCount,
long[] elementCount,
Pointer arrayOfElements) |
static int |
cudnnBackendInitialize(cudnnBackendDescriptor descriptor) |
static int |
cudnnBackendSetAttribute(cudnnBackendDescriptor descriptor,
int attributeName,
int attributeType,
long elementCount,
Pointer arrayOfElements) |
static int |
cudnnBatchNormalizationBackward(cudnnHandle handle,
int mode,
Pointer alphaDataDiff,
Pointer betaDataDiff,
Pointer alphaParamDiff,
Pointer betaParamDiff,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnTensorDescriptor dxDesc,
Pointer dx,
cudnnTensorDescriptor dBnScaleBiasDesc,
Pointer bnScale,
Pointer dBnScaleResult,
Pointer dBnBiasResult,
double epsilon,
Pointer savedMean,
Pointer savedInvVariance)
Performs backward pass of Batch Normalization layer.
|
static int |
cudnnBatchNormalizationBackwardEx(cudnnHandle handle,
int mode,
int bnOps,
Pointer alphaDataDiff,
Pointer betaDataDiff,
Pointer alphaParamDiff,
Pointer betaParamDiff,
cudnnTensorDescriptor xDesc,
Pointer xData,
cudnnTensorDescriptor yDesc,
Pointer yData,
cudnnTensorDescriptor dyDesc,
Pointer dyData,
cudnnTensorDescriptor dzDesc,
Pointer dzData,
cudnnTensorDescriptor dxDesc,
Pointer dxData,
cudnnTensorDescriptor dBnScaleBiasDesc,
Pointer bnScaleData,
Pointer bnBiasData,
Pointer dBnScaleData,
Pointer dBnBiasData,
double epsilon,
Pointer savedMean,
Pointer savedInvVariance,
cudnnActivationDescriptor activationDesc,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes) |
static int |
cudnnBatchNormalizationForwardInference(cudnnHandle handle,
int mode,
Pointer alpha,
Pointer beta,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor bnScaleBiasMeanVarDesc,
Pointer bnScale,
Pointer bnBias,
Pointer estimatedMean,
Pointer estimatedVariance,
double epsilon)
Performs Batch Normalization during Inference:
y[i] = bnScale[k]*(x[i]-estimatedMean[k])/sqrt(epsilon+estimatedVariance[k]) + bnBias[k]
with bnScale, bnBias, runningMean, runningInvVariance tensors indexed
according to spatial or per-activation mode.
|
static int |
cudnnBatchNormalizationForwardTraining(cudnnHandle handle,
int mode,
Pointer alpha,
Pointer beta,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor bnScaleBiasMeanVarDesc,
Pointer bnScale,
Pointer bnBias,
double exponentialAverageFactor,
Pointer resultRunningMean,
Pointer resultRunningVariance,
double epsilon,
Pointer resultSaveMean,
Pointer resultSaveInvVariance)
Computes y = BN(x).
|
static int |
cudnnBatchNormalizationForwardTrainingEx(cudnnHandle handle,
int mode,
int bnOps,
Pointer alpha,
Pointer beta,
cudnnTensorDescriptor xDesc,
Pointer xData,
cudnnTensorDescriptor zDesc,
Pointer zData,
cudnnTensorDescriptor yDesc,
Pointer yData,
cudnnTensorDescriptor bnScaleBiasMeanVarDesc,
Pointer bnScale,
Pointer bnBias,
double exponentialAverageFactor,
Pointer resultRunningMean,
Pointer resultRunningVariance,
double epsilon,
Pointer resultSaveMean,
Pointer resultSaveInvVariance,
cudnnActivationDescriptor activationDesc,
Pointer workspace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Computes y = relu(BN(x) + z).
|
static int |
cudnnBuildRNNDynamic(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int miniBatch) |
static int |
cudnnCnnInferVersionCheck() |
static int |
cudnnCnnTrainVersionCheck() |
static int |
cudnnConvolutionBackwardBias(cudnnHandle handle,
Pointer alpha,
cudnnTensorDescriptor dyDesc,
Pointer dy,
Pointer beta,
cudnnTensorDescriptor dbDesc,
Pointer db)
Function to compute the bias gradient for batch convolution
|
static int |
cudnnConvolutionBackwardData(cudnnHandle handle,
Pointer alpha,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnConvolutionDescriptor convDesc,
int algo,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx) |
static int |
cudnnConvolutionBackwardFilter(cudnnHandle handle,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnConvolutionDescriptor convDesc,
int algo,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer beta,
cudnnFilterDescriptor dwDesc,
Pointer dw) |
static int |
cudnnConvolutionBiasActivationForward(cudnnHandle handle,
Pointer alpha1,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnConvolutionDescriptor convDesc,
int algo,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer alpha2,
cudnnTensorDescriptor zDesc,
Pointer z,
cudnnTensorDescriptor biasDesc,
Pointer bias,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor yDesc,
Pointer y)
Fused conv/bias/activation operation : y = Act( alpha1 * conv(x) + alpha2 * z + bias )
|
static int |
cudnnConvolutionForward(cudnnHandle handle,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnConvolutionDescriptor convDesc,
int algo,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
Function to perform the forward pass for batch convolution
|
static int |
cudnnCopyAlgorithmDescriptor(cudnnAlgorithmDescriptor src,
cudnnAlgorithmDescriptor dest)
Deprecated.
|
static int |
cudnnCreate(cudnnHandle handle) |
static int |
cudnnCreateActivationDescriptor(cudnnActivationDescriptor activationDesc)
Activation functions: All of the form "output = alpha * Op(inputs) + beta * output"
|
static int |
cudnnCreateAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc)
Deprecated.
|
static int |
cudnnCreateAlgorithmPerformance(cudnnAlgorithmPerformance[] algoPerf,
int numberToCreate)
Deprecated.
|
static int |
cudnnCreateAttnDescriptor(cudnnAttnDescriptor attnDesc) |
static int |
cudnnCreateConvolutionDescriptor(cudnnConvolutionDescriptor convDesc)
Create an instance of convolution descriptor
|
static int |
cudnnCreateCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc) |
static int |
cudnnCreateDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc) |
static int |
cudnnCreateFilterDescriptor(cudnnFilterDescriptor filterDesc)
Create an instance of FilterStruct
|
static int |
cudnnCreateFusedOpsConstParamPack(cudnnFusedOpsConstParamPack constPack,
int ops) |
static int |
cudnnCreateFusedOpsPlan(cudnnFusedOpsPlan plan,
int ops) |
static int |
cudnnCreateFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack varPack,
int ops) |
static int |
cudnnCreateLRNDescriptor(cudnnLRNDescriptor normDesc)
Create an instance of LRN (Local Response Normalization) descriptor
Uses lrnN=5, lrnAlpha=1e-4, lrnBeta=0.75, lrnK=2.0 as defaults from Krizhevsky'12 ImageNet paper
|
static int |
cudnnCreateOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc) |
static int |
cudnnCreatePersistentRNNPlan(cudnnRNNDescriptor rnnDesc,
int minibatch,
int dataType,
cudnnPersistentRNNPlan plan)
Deprecated.
|
static int |
cudnnCreatePoolingDescriptor(cudnnPoolingDescriptor poolingDesc)
Create an instance of pooling descriptor
|
static int |
cudnnCreateReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc) |
static int |
cudnnCreateRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc) |
static int |
cudnnCreateRNNDescriptor(cudnnRNNDescriptor rnnDesc) |
static int |
cudnnCreateSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc) |
static int |
cudnnCreateSpatialTransformerDescriptor(cudnnSpatialTransformerDescriptor stDesc)
Placeholder for future work
|
static int |
cudnnCreateTensorDescriptor(cudnnTensorDescriptor tensorDesc)
Create an instance of a generic Tensor descriptor
|
static int |
cudnnCreateTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc)
Create an empty tensor transform descriptor
|
static int |
cudnnCTCLoss_v8(cudnnHandle handle,
int algo,
cudnnCTCLossDescriptor ctcLossDesc,
cudnnTensorDescriptor probsDesc,
Pointer probs,
Pointer labels,
Pointer labelLengths,
Pointer inputLengths,
Pointer costs,
cudnnTensorDescriptor gradientsDesc,
Pointer gradients,
long workSpaceSizeInBytes,
Pointer workspace)
Returns the CTC costs and gradients, given the probabilities and labels
|
static int |
cudnnCTCLoss(cudnnHandle handle,
cudnnTensorDescriptor probsDesc,
Pointer probs,
int[] hostLabels,
int[] hostLabelLengths,
int[] hostInputLengths,
Pointer costs,
cudnnTensorDescriptor gradientsDesc,
Pointer gradients,
int algo,
cudnnCTCLossDescriptor ctcLossDesc,
Pointer workspace,
long workSpaceSizeInBytes)
Returns the CTC costs and gradients, given the probabilities and labels
|
static int |
cudnnDeriveBNTensorDescriptor(cudnnTensorDescriptor derivedBnDesc,
cudnnTensorDescriptor xDesc,
int mode)
Derives a tensor descriptor from layer data descriptor for BatchNormalization
scale, invVariance, bnBias, bnScale tensors.
|
static int |
cudnnDeriveNormTensorDescriptor(cudnnTensorDescriptor derivedNormScaleBiasDesc,
cudnnTensorDescriptor derivedNormMeanVarDesc,
cudnnTensorDescriptor xDesc,
int mode,
int groupCnt)
Derives a tensor descriptor from layer data descriptor for Normalization
scale, invVariance, bnBias, bnScale tensors.
|
static int |
cudnnDestroy(cudnnHandle handle) |
static int |
cudnnDestroyActivationDescriptor(cudnnActivationDescriptor activationDesc)
ceiling for clipped RELU, alpha for ELU
|
static int |
cudnnDestroyAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc)
Deprecated.
|
static int |
cudnnDestroyAlgorithmPerformance(cudnnAlgorithmPerformance[] algoPerf,
int numberToDestroy)
Deprecated.
|
static int |
cudnnDestroyAttnDescriptor(cudnnAttnDescriptor attnDesc) |
static int |
cudnnDestroyConvolutionDescriptor(cudnnConvolutionDescriptor convDesc)
Destroy an instance of convolution descriptor
|
static int |
cudnnDestroyCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc) |
static int |
cudnnDestroyDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc) |
static int |
cudnnDestroyFilterDescriptor(cudnnFilterDescriptor filterDesc) |
static int |
cudnnDestroyFusedOpsConstParamPack(cudnnFusedOpsConstParamPack constPack) |
static int |
cudnnDestroyFusedOpsPlan(cudnnFusedOpsPlan plan) |
static int |
cudnnDestroyFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack varPack) |
static int |
cudnnDestroyLRNDescriptor(cudnnLRNDescriptor lrnDesc)
Destroy an instance of LRN descriptor
|
static int |
cudnnDestroyOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc) |
static int |
cudnnDestroyPersistentRNNPlan(cudnnPersistentRNNPlan plan)
Deprecated.
|
static int |
cudnnDestroyPoolingDescriptor(cudnnPoolingDescriptor poolingDesc)
Destroy an instance of pooling descriptor
|
static int |
cudnnDestroyReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc) |
static int |
cudnnDestroyRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc) |
static int |
cudnnDestroyRNNDescriptor(cudnnRNNDescriptor rnnDesc) |
static int |
cudnnDestroySeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc) |
static int |
cudnnDestroySpatialTransformerDescriptor(cudnnSpatialTransformerDescriptor stDesc) |
static int |
cudnnDestroyTensorDescriptor(cudnnTensorDescriptor tensorDesc)
Destroy an instance of Tensor4d descriptor
|
static int |
cudnnDestroyTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc)
Destroys a previously created tensor transform descriptor.
|
static int |
cudnnDivisiveNormalizationBackward(cudnnHandle handle,
cudnnLRNDescriptor normDesc,
int mode,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer means,
Pointer dy,
Pointer temp,
Pointer temp2,
Pointer beta,
cudnnTensorDescriptor dXdMeansDesc,
Pointer dx,
Pointer dMeans) |
static int |
cudnnDivisiveNormalizationForward(cudnnHandle handle,
cudnnLRNDescriptor normDesc,
int mode,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer means,
Pointer temp,
Pointer temp2,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
LCN/divisive normalization functions: y = alpha * normalize(x) + beta * y
|
static int |
cudnnDropoutBackward(cudnnHandle handle,
cudnnDropoutDescriptor dropoutDesc,
cudnnTensorDescriptor dydesc,
Pointer dy,
cudnnTensorDescriptor dxdesc,
Pointer dx,
Pointer reserveSpace,
long reserveSpaceSizeInBytes) |
static int |
cudnnDropoutForward(cudnnHandle handle,
cudnnDropoutDescriptor dropoutDesc,
cudnnTensorDescriptor xdesc,
Pointer x,
cudnnTensorDescriptor ydesc,
Pointer y,
Pointer reserveSpace,
long reserveSpaceSizeInBytes) |
static int |
cudnnDropoutGetReserveSpaceSize(cudnnTensorDescriptor xdesc,
long[] sizeInBytes)
helper function to determine size of the reserve space to be passed to dropout forward/backward calls
|
static int |
cudnnDropoutGetStatesSize(cudnnHandle handle,
long[] sizeInBytes)
helper function to determine size of the states to be passed to cudnnSetDropoutDescriptor
|
static int |
cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle handle,
cudnnFilterDescriptor wDesc,
cudnnTensorDescriptor dyDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor dxDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdDataAlgoPerf[] perfResults) |
static int |
cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle handle,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor dxDesc,
Pointer dx,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdDataAlgoPerf[] perfResults,
Pointer workSpace,
long workSpaceSizeInBytes) |
static int |
cudnnFindConvolutionBackwardFilterAlgorithm(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor dyDesc,
cudnnConvolutionDescriptor convDesc,
cudnnFilterDescriptor dwDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdFilterAlgoPerf[] perfResults) |
static int |
cudnnFindConvolutionBackwardFilterAlgorithmEx(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor dyDesc,
Pointer y,
cudnnConvolutionDescriptor convDesc,
cudnnFilterDescriptor dwDesc,
Pointer dw,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdFilterAlgoPerf[] perfResults,
Pointer workSpace,
long workSpaceSizeInBytes) |
static int |
cudnnFindConvolutionForwardAlgorithm(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
cudnnFilterDescriptor wDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor yDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionFwdAlgoPerf[] perfResults) |
static int |
cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor yDesc,
Pointer y,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionFwdAlgoPerf[] perfResults,
Pointer workSpace,
long workSpaceSizeInBytes) |
static int |
cudnnFindRNNBackwardDataAlgorithmEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor[] dyDesc,
Pointer dy,
cudnnTensorDescriptor dhyDesc,
Pointer dhy,
cudnnTensorDescriptor dcyDesc,
Pointer dcy,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnTensorDescriptor[] dxDesc,
Pointer dx,
cudnnTensorDescriptor dhxDesc,
Pointer dhx,
cudnnTensorDescriptor dcxDesc,
Pointer dcx,
float findIntensity,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnAlgorithmPerformance[] perfResults,
Pointer workspace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnFindRNNBackwardWeightsAlgorithmEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor[] yDesc,
Pointer y,
float findIntensity,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnAlgorithmPerformance[] perfResults,
Pointer workspace,
long workSpaceSizeInBytes,
cudnnFilterDescriptor dwDesc,
Pointer dw,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnFindRNNForwardInferenceAlgorithmEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
float findIntensity,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnAlgorithmPerformance[] perfResults,
Pointer workspace,
long workSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnFindRNNForwardTrainingAlgorithmEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
float findIntensity,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnAlgorithmPerformance[] perfResults,
Pointer workspace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnFusedOpsExecute(cudnnHandle handle,
cudnnFusedOpsPlan plan,
cudnnFusedOpsVariantParamPack varPack) |
static int |
cudnnGetActivationDescriptor(cudnnActivationDescriptor activationDesc,
int[] mode,
int[] reluNanOpt,
double[] coef)
ceiling for clipped RELU, alpha for ELU
|
static int |
cudnnGetAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc,
int[] algorithm)
Deprecated.
|
static int |
cudnnGetAlgorithmPerformance(cudnnAlgorithmPerformance algoPerf,
cudnnAlgorithmDescriptor algoDesc,
int[] status,
float[] time,
long[] memory)
Deprecated.
|
static int |
cudnnGetAlgorithmSpaceSize(cudnnHandle handle,
cudnnAlgorithmDescriptor algoDesc,
long[] algoSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnGetAttnDescriptor(cudnnAttnDescriptor attnDesc,
int[] attnMode,
int[] nHeads,
double[] smScaler,
int[] dataType,
int[] computePrec,
int[] mathType,
cudnnDropoutDescriptor attnDropoutDesc,
cudnnDropoutDescriptor postDropoutDesc,
int[] qSize,
int[] kSize,
int[] vSize,
int[] qProjSize,
int[] kProjSize,
int[] vProjSize,
int[] oProjSize,
int[] qoMaxSeqLength,
int[] kvMaxSeqLength,
int[] maxBatchSize,
int[] maxBeamSize) |
static int |
cudnnGetBatchNormalizationBackwardExWorkspaceSize(cudnnHandle handle,
int mode,
int bnOps,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor yDesc,
cudnnTensorDescriptor dyDesc,
cudnnTensorDescriptor dzDesc,
cudnnTensorDescriptor dxDesc,
cudnnTensorDescriptor dBnScaleBiasDesc,
cudnnActivationDescriptor activationDesc,
long[] sizeInBytes) |
static int |
cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize(cudnnHandle handle,
int mode,
int bnOps,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor zDesc,
cudnnTensorDescriptor yDesc,
cudnnTensorDescriptor bnScaleBiasMeanVarDesc,
cudnnActivationDescriptor activationDesc,
long[] sizeInBytes)
output means differential, can be NULL
|
static int |
cudnnGetBatchNormalizationTrainingExReserveSpaceSize(cudnnHandle handle,
int mode,
int bnOps,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor xDesc,
long[] sizeInBytes) |
static int |
cudnnGetCallback(int[] mask,
Object udata,
cudnnCallback[] fptr) |
static int |
cudnnGetConvolution2dDescriptor(cudnnConvolutionDescriptor convDesc,
int[] pad_h,
int[] pad_w,
int[] u,
int[] v,
int[] dilation_h,
int[] dilation_w,
int[] mode,
int[] computeType) |
static int |
cudnnGetConvolution2dForwardOutputDim(cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor inputTensorDesc,
cudnnFilterDescriptor filterDesc,
int[] n,
int[] c,
int[] h,
int[] w)
convolution data type
|
static int |
cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle handle,
cudnnFilterDescriptor filterDesc,
cudnnTensorDescriptor diffDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor gradDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdDataAlgoPerf[] perfResults) |
static int |
cudnnGetConvolutionBackwardDataAlgorithmMaxCount(cudnnHandle handle,
int[] count) |
static int |
cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle handle,
cudnnFilterDescriptor wDesc,
cudnnTensorDescriptor dyDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor dxDesc,
int algo,
long[] sizeInBytes)
Helper function to return the minimum size of the workspace to be passed to the convolution given an algo
|
static int |
cudnnGetConvolutionBackwardFilterAlgorithm_v7(cudnnHandle handle,
cudnnTensorDescriptor srcDesc,
cudnnTensorDescriptor diffDesc,
cudnnConvolutionDescriptor convDesc,
cudnnFilterDescriptor gradDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionBwdFilterAlgoPerf[] perfResults) |
static int |
cudnnGetConvolutionBackwardFilterAlgorithmMaxCount(cudnnHandle handle,
int[] count) |
static int |
cudnnGetConvolutionBackwardFilterWorkspaceSize(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor dyDesc,
cudnnConvolutionDescriptor convDesc,
cudnnFilterDescriptor gradDesc,
int algo,
long[] sizeInBytes)
Helper function to return the minimum size of the workspace to be passed to the convolution given an algo
|
static int |
cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle handle,
cudnnTensorDescriptor srcDesc,
cudnnFilterDescriptor filterDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor destDesc,
int requestedAlgoCount,
int[] returnedAlgoCount,
cudnnConvolutionFwdAlgoPerf[] perfResults) |
static int |
cudnnGetConvolutionForwardAlgorithmMaxCount(cudnnHandle handle,
int[] count)
Helper function to provide the convolution forward algo that best fits the requirement
|
static int |
cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
cudnnFilterDescriptor wDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor yDesc,
int algo,
long[] sizeInBytes)
Helper function to return the minimum size of the workspace to be passed to the convolution given an algo
|
static int |
cudnnGetConvolutionGroupCount(cudnnConvolutionDescriptor convDesc,
int[] groupCount) |
static int |
cudnnGetConvolutionMathType(cudnnConvolutionDescriptor convDesc,
int[] mathType) |
static int |
cudnnGetConvolutionNdDescriptor(cudnnConvolutionDescriptor convDesc,
int arrayLengthRequested,
int[] arrayLength,
int[] padA,
int[] strideA,
int[] dilationA,
int[] mode,
int[] computeType)
Helper function to return the dimensions of the output tensor given a convolution descriptor
|
static int |
cudnnGetConvolutionNdForwardOutputDim(cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor inputTensorDesc,
cudnnFilterDescriptor filterDesc,
int nbDims,
int[] tensorOuputDimA)
Helper function to return the dimensions of the output tensor given a convolution descriptor
|
static int |
cudnnGetConvolutionReorderType(cudnnConvolutionDescriptor convDesc,
int[] reorderType) |
static int |
cudnnGetCTCLossDescriptor_v8(cudnnCTCLossDescriptor ctcLossDesc,
int[] compType,
int[] normMode,
int[] gradMode,
int[] maxLabelLength) |
static int |
cudnnGetCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc,
int[] compType) |
static int |
cudnnGetCTCLossDescriptorEx(cudnnCTCLossDescriptor ctcLossDesc,
int[] compType,
int[] normMode,
int[] gradMode) |
static int |
cudnnGetCTCLossWorkspaceSize_v8(cudnnHandle handle,
int algo,
cudnnCTCLossDescriptor ctcLossDesc,
cudnnTensorDescriptor probsDesc,
cudnnTensorDescriptor gradientsDesc,
long[] sizeInBytes)
Returns the workspace size needed for CTC
|
static int |
cudnnGetCTCLossWorkspaceSize(cudnnHandle handle,
cudnnTensorDescriptor probsDesc,
cudnnTensorDescriptor gradientsDesc,
int[] labels,
int[] labelLengths,
int[] inputLengths,
int algo,
cudnnCTCLossDescriptor ctcLossDesc,
long[] sizeInBytes)
Returns the workspace size needed for CTC
|
static long |
cudnnGetCudartVersion()
Returns CUDA Runtime version statically linked against cudnn
|
static int |
cudnnGetDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc,
cudnnHandle handle,
float[] dropout,
Pointer states,
long[] seed) |
static String |
cudnnGetErrorString(int status)
human-readable error messages
|
static int |
cudnnGetFilter4dDescriptor(cudnnFilterDescriptor filterDesc,
int[] dataType,
int[] format,
int[] k,
int[] c,
int[] h,
int[] w)
width of each input filter
|
static int |
cudnnGetFilterNdDescriptor(cudnnFilterDescriptor filterDesc,
int nbDimsRequested,
int[] dataType,
int[] format,
int[] nbDims,
int[] filterDimA) |
static int |
cudnnGetFilterSizeInBytes(cudnnFilterDescriptor filterDesc,
long[] size) |
static int |
cudnnGetFoldedConvBackwardDataDescriptors(cudnnHandle handle,
cudnnFilterDescriptor filterDesc,
cudnnTensorDescriptor diffDesc,
cudnnConvolutionDescriptor convDesc,
cudnnTensorDescriptor gradDesc,
int transformFormat,
cudnnFilterDescriptor foldedFilterDesc,
cudnnTensorDescriptor paddedDiffDesc,
cudnnConvolutionDescriptor foldedConvDesc,
cudnnTensorDescriptor foldedGradDesc,
cudnnTensorTransformDescriptor filterFoldTransDesc,
cudnnTensorTransformDescriptor diffPadTransDesc,
cudnnTensorTransformDescriptor gradFoldTransDesc,
cudnnTensorTransformDescriptor gradUnfoldTransDesc)
Helper function to calculate folding descriptors for dgrad
|
static int |
cudnnGetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack constPack,
int paramLabel,
Pointer param,
int[] isNULL) |
static int |
cudnnGetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack varPack,
int paramLabel,
Pointer ptr) |
static int |
cudnnGetLRNDescriptor(cudnnLRNDescriptor normDesc,
int[] lrnN,
double[] lrnAlpha,
double[] lrnBeta,
double[] lrnK)
Retrieve the settings currently stored in an LRN layer descriptor
Any of the provided pointers can be NULL (no corresponding value will be returned)
|
static int |
cudnnGetMultiHeadAttnBuffers(cudnnHandle handle,
cudnnAttnDescriptor attnDesc,
long[] weightSizeInBytes,
long[] workSpaceSizeInBytes,
long[] reserveSpaceSizeInBytes) |
static int |
cudnnGetMultiHeadAttnWeights(cudnnHandle handle,
cudnnAttnDescriptor attnDesc,
int wKind,
long weightSizeInBytes,
Pointer weights,
cudnnTensorDescriptor wDesc,
Pointer wAddr) |
static int |
cudnnGetNormalizationBackwardWorkspaceSize(cudnnHandle handle,
int mode,
int normOps,
int algo,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor yDesc,
cudnnTensorDescriptor dyDesc,
cudnnTensorDescriptor dzDesc,
cudnnTensorDescriptor dxDesc,
cudnnTensorDescriptor dNormScaleBiasDesc,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor normMeanVarDesc,
long[] sizeInBytes,
int groupCnt)
Placeholder for future work, should be set to 1 now
|
static int |
cudnnGetNormalizationForwardTrainingWorkspaceSize(cudnnHandle handle,
int mode,
int normOps,
int algo,
cudnnTensorDescriptor xDesc,
cudnnTensorDescriptor zDesc,
cudnnTensorDescriptor yDesc,
cudnnTensorDescriptor normScaleBiasDesc,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor normMeanVarDesc,
long[] sizeInBytes,
int groupCnt) |
static int |
cudnnGetNormalizationTrainingReserveSpaceSize(cudnnHandle handle,
int mode,
int normOps,
int algo,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor xDesc,
long[] sizeInBytes,
int groupCnt)
Placeholder for future work, should be set to 1 now
|
static int |
cudnnGetOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc,
int[] opTensorOp,
int[] opTensorCompType,
int[] opTensorNanOpt) |
static int |
cudnnGetPooling2dDescriptor(cudnnPoolingDescriptor poolingDesc,
int[] mode,
int[] maxpoolingNanOpt,
int[] windowHeight,
int[] windowWidth,
int[] verticalPadding,
int[] horizontalPadding,
int[] verticalStride,
int[] horizontalStride) |
static int |
cudnnGetPooling2dForwardOutputDim(cudnnPoolingDescriptor poolingDesc,
cudnnTensorDescriptor inputTensorDesc,
int[] n,
int[] c,
int[] h,
int[] w) |
static int |
cudnnGetPoolingNdDescriptor(cudnnPoolingDescriptor poolingDesc,
int nbDimsRequested,
int[] mode,
int[] maxpoolingNanOpt,
int[] nbDims,
int[] windowDimA,
int[] paddingA,
int[] strideA) |
static int |
cudnnGetPoolingNdForwardOutputDim(cudnnPoolingDescriptor poolingDesc,
cudnnTensorDescriptor inputTensorDesc,
int nbDims,
int[] outputTensorDimA) |
static int |
cudnnGetProperty(int type,
int[] value) |
static int |
cudnnGetReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc,
int[] reduceTensorOp,
int[] reduceTensorCompType,
int[] reduceTensorNanOpt,
int[] reduceTensorIndices,
int[] reduceTensorIndicesType) |
static int |
cudnnGetReductionIndicesSize(cudnnHandle handle,
cudnnReduceTensorDescriptor reduceTensorDesc,
cudnnTensorDescriptor aDesc,
cudnnTensorDescriptor cDesc,
long[] sizeInBytes)
Helper function to return the minimum size of the index space to be passed to the reduction given the input and
output tensors
|
static int |
cudnnGetReductionWorkspaceSize(cudnnHandle handle,
cudnnReduceTensorDescriptor reduceTensorDesc,
cudnnTensorDescriptor aDesc,
cudnnTensorDescriptor cDesc,
long[] sizeInBytes)
Helper function to return the minimum size of the workspace to be passed to the reduction given the input and output
tensors
|
static int |
cudnnGetRNNBackwardDataAlgorithmMaxCount(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] count)
Deprecated.
|
static int |
cudnnGetRNNBackwardWeightsAlgorithmMaxCount(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] count)
Deprecated.
|
static int |
cudnnGetRNNBiasMode(cudnnRNNDescriptor rnnDesc,
int[] biasMode)
Deprecated.
|
static int |
cudnnGetRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc,
int[] dataType,
int[] layout,
int[] maxSeqLength,
int[] batchSize,
int[] vectorSize,
int arrayLengthRequested,
int[] seqLengthArray,
Pointer paddingFill)
symbol for filling padding position in output
|
static int |
cudnnGetRNNDescriptor_v6(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] hiddenSize,
int[] numLayers,
cudnnDropoutDescriptor dropoutDesc,
int[] inputMode,
int[] direction,
int[] cellMode,
int[] algo,
int[] mathPrec)
Deprecated.
|
static int |
cudnnGetRNNDescriptor_v8(cudnnRNNDescriptor rnnDesc,
int[] algo,
int[] cellMode,
int[] biasMode,
int[] dirMode,
int[] inputMode,
int[] dataType,
int[] mathPrec,
int[] mathType,
int[] inputSize,
int[] hiddenSize,
int[] projSize,
int[] numLayers,
cudnnDropoutDescriptor dropoutDesc,
int[] auxFlags) |
static int |
cudnnGetRNNForwardInferenceAlgorithmMaxCount(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] count)
Deprecated.
|
static int |
cudnnGetRNNForwardTrainingAlgorithmMaxCount(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] count)
Deprecated.
|
static int |
cudnnGetRNNLinLayerBiasParams(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int pseudoLayer,
cudnnTensorDescriptor xDesc,
cudnnFilterDescriptor wDesc,
Pointer w,
int linLayerID,
cudnnFilterDescriptor linLayerBiasDesc,
Pointer linLayerBias)
Deprecated.
|
static int |
cudnnGetRNNLinLayerMatrixParams(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int pseudoLayer,
cudnnTensorDescriptor xDesc,
cudnnFilterDescriptor wDesc,
Pointer w,
int linLayerID,
cudnnFilterDescriptor linLayerMatDesc,
Pointer linLayerMat)
Deprecated.
|
static int |
cudnnGetRNNMatrixMathType(cudnnRNNDescriptor rnnDesc,
int[] mType)
Deprecated.
|
static int |
cudnnGetRNNPaddingMode(cudnnRNNDescriptor rnnDesc,
int[] paddingMode)
Deprecated.
|
static int |
cudnnGetRNNParamsSize(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnTensorDescriptor xDesc,
long[] sizeInBytes,
int dataType)
Deprecated.
|
static int |
cudnnGetRNNProjectionLayers(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] recProjSize,
int[] outProjSize)
Deprecated.
|
static int |
cudnnGetRNNTempSpaceSizes(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int fMode,
cudnnRNNDataDescriptor xDesc,
long[] workSpaceSize,
long[] reserveSpaceSize) |
static int |
cudnnGetRNNTrainingReserveSize(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
long[] sizeInBytes)
Deprecated.
|
static int |
cudnnGetRNNWeightParams(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int pseudoLayer,
long weightSpaceSize,
Pointer weightSpace,
int linLayerID,
cudnnTensorDescriptor mDesc,
Pointer mAddr,
cudnnTensorDescriptor bDesc,
Pointer bAddr) |
static int |
cudnnGetRNNWeightSpaceSize(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
long[] weightSpaceSize) |
static int |
cudnnGetRNNWorkspaceSize(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
long[] sizeInBytes)
Deprecated.
|
static int |
cudnnGetSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc,
int[] dataType,
int[] nbDims,
int nbDimsRequested,
int[] dimA,
int[] axes,
long[] seqLengthArraySize,
long seqLengthSizeRequested,
int[] seqLengthArray,
Pointer paddingFill) |
static int |
cudnnGetStream(cudnnHandle handle,
cudaStream_t streamId) |
static int |
cudnnGetTensor4dDescriptor(cudnnTensorDescriptor tensorDesc,
int[] dataType,
int[] n,
int[] c,
int[] h,
int[] w,
int[] nStride,
int[] cStride,
int[] hStride,
int[] wStride) |
static int |
cudnnGetTensorNdDescriptor(cudnnTensorDescriptor tensorDesc,
int nbDimsRequested,
int[] dataType,
int[] nbDims,
int[] dimA,
int[] strideA) |
static int |
cudnnGetTensorSizeInBytes(cudnnTensorDescriptor tensorDesc,
long[] size) |
static int |
cudnnGetTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc,
int nbDimsRequested,
int[] destFormat,
int[] padBeforeA,
int[] padAfterA,
int[] foldA,
int[] direction)
Retrieves the values stored in a previously initialized tensor transform
descriptor.
|
static long |
cudnnGetVersion() |
static int |
cudnnIm2Col(cudnnHandle handle,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnFilterDescriptor wDesc,
cudnnConvolutionDescriptor convDesc,
Pointer colBuffer) |
static int |
cudnnInitTransformDest(cudnnTensorTransformDescriptor transformDesc,
cudnnTensorDescriptor srcDesc,
cudnnTensorDescriptor destDesc,
long[] destSizeInBytes)
Create a destination descriptor for cudnnTransformTensor
|
static int |
cudnnLRNCrossChannelBackward(cudnnHandle handle,
cudnnLRNDescriptor normDesc,
int lrnMode,
Pointer alpha,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx)
LRN cross-channel backward computation.
|
static int |
cudnnLRNCrossChannelForward(cudnnHandle handle,
cudnnLRNDescriptor normDesc,
int lrnMode,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
LRN cross-channel forward computation.
|
static int |
cudnnMakeFusedOpsPlan(cudnnHandle handle,
cudnnFusedOpsPlan plan,
cudnnFusedOpsConstParamPack constPack,
long[] workspaceSizeInBytes) |
static int |
cudnnMultiHeadAttnBackwardData(cudnnHandle handle,
cudnnAttnDescriptor attnDesc,
int[] loWinIdx,
int[] hiWinIdx,
int[] devSeqLengthsDQDO,
int[] devSeqLengthsDKDV,
cudnnSeqDataDescriptor doDesc,
Pointer dout,
cudnnSeqDataDescriptor dqDesc,
Pointer dqueries,
Pointer queries,
cudnnSeqDataDescriptor dkDesc,
Pointer dkeys,
Pointer keys,
cudnnSeqDataDescriptor dvDesc,
Pointer dvalues,
Pointer values,
long weightSizeInBytes,
Pointer weights,
long workSpaceSizeInBytes,
Pointer workSpace,
long reserveSpaceSizeInBytes,
Pointer reserveSpace) |
static int |
cudnnMultiHeadAttnBackwardWeights(cudnnHandle handle,
cudnnAttnDescriptor attnDesc,
int addGrad,
cudnnSeqDataDescriptor qDesc,
Pointer queries,
cudnnSeqDataDescriptor kDesc,
Pointer keys,
cudnnSeqDataDescriptor vDesc,
Pointer values,
cudnnSeqDataDescriptor doDesc,
Pointer dout,
long weightSizeInBytes,
Pointer weights,
Pointer dweights,
long workSpaceSizeInBytes,
Pointer workSpace,
long reserveSpaceSizeInBytes,
Pointer reserveSpace) |
static int |
cudnnMultiHeadAttnForward(cudnnHandle handle,
cudnnAttnDescriptor attnDesc,
int currIdx,
int[] loWinIdx,
int[] hiWinIdx,
int[] devSeqLengthsQO,
int[] devSeqLengthsKV,
cudnnSeqDataDescriptor qDesc,
Pointer queries,
Pointer residuals,
cudnnSeqDataDescriptor kDesc,
Pointer keys,
cudnnSeqDataDescriptor vDesc,
Pointer values,
cudnnSeqDataDescriptor oDesc,
Pointer out,
long weightSizeInBytes,
Pointer weights,
long workSpaceSizeInBytes,
Pointer workSpace,
long reserveSpaceSizeInBytes,
Pointer reserveSpace) |
static int |
cudnnNormalizationBackward(cudnnHandle handle,
int mode,
int normOps,
int algo,
Pointer alphaDataDiff,
Pointer betaDataDiff,
Pointer alphaParamDiff,
Pointer betaParamDiff,
cudnnTensorDescriptor xDesc,
Pointer xData,
cudnnTensorDescriptor yDesc,
Pointer yData,
cudnnTensorDescriptor dyDesc,
Pointer dyData,
cudnnTensorDescriptor dzDesc,
Pointer dzData,
cudnnTensorDescriptor dxDesc,
Pointer dxData,
cudnnTensorDescriptor dNormScaleBiasDesc,
Pointer normScaleData,
Pointer normBiasData,
Pointer dNormScaleData,
Pointer dNormBiasData,
double epsilon,
cudnnTensorDescriptor normMeanVarDesc,
Pointer savedMean,
Pointer savedInvVariance,
cudnnActivationDescriptor activationDesc,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes,
int groupCnt)
Placeholder for future work; should be set to 1 for now
|
static int |
cudnnNormalizationForwardInference(cudnnHandle handle,
int mode,
int normOps,
int algo,
Pointer alpha,
Pointer beta,
cudnnTensorDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor normScaleBiasDesc,
Pointer normScale,
Pointer normBias,
cudnnTensorDescriptor normMeanVarDesc,
Pointer estimatedMean,
Pointer estimatedVariance,
cudnnTensorDescriptor zDesc,
Pointer z,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor yDesc,
Pointer y,
double epsilon,
int groupCnt)
Performs Normalization during Inference:
y[i] = normScale[k]*(x[i]-estimatedMean[k])/sqrt(epsilon+estimatedVariance[k]) + normBias[k]
with normScale, normBias, estimatedMean, estimatedVariance tensors indexed
according to per-channel or per-activation mode.
|
static int |
cudnnNormalizationForwardTraining(cudnnHandle handle,
int mode,
int normOps,
int algo,
Pointer alpha,
Pointer beta,
cudnnTensorDescriptor xDesc,
Pointer xData,
cudnnTensorDescriptor normScaleBiasDesc,
Pointer normScale,
Pointer normBias,
double exponentialAverageFactor,
cudnnTensorDescriptor normMeanVarDesc,
Pointer resultRunningMean,
Pointer resultRunningVariance,
double epsilon,
Pointer resultSaveMean,
Pointer resultSaveInvVariance,
cudnnActivationDescriptor activationDesc,
cudnnTensorDescriptor zDesc,
Pointer zData,
cudnnTensorDescriptor yDesc,
Pointer yData,
Pointer workspace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes,
int groupCnt)
Computes y = relu(Norm(x) + z).
|
static int |
cudnnOpsInferVersionCheck()
Cross-library version checker.
|
static int |
cudnnOpsTrainVersionCheck()
Cross-library version checker.
|
static int |
cudnnOpTensor(cudnnHandle handle,
cudnnOpTensorDescriptor opTensorDesc,
Pointer alpha1,
cudnnTensorDescriptor aDesc,
Pointer A,
Pointer alpha2,
cudnnTensorDescriptor bDesc,
Pointer B,
Pointer beta,
cudnnTensorDescriptor cDesc,
Pointer C)
B tensor is ignored for CUDNN_OP_TENSOR_SQRT, CUDNN_OP_TENSOR_NOT.
|
static int |
cudnnPoolingBackward(cudnnHandle handle,
cudnnPoolingDescriptor poolingDesc,
Pointer alpha,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor dyDesc,
Pointer dy,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx)
Function to perform backward pooling
|
static int |
cudnnPoolingForward(cudnnHandle handle,
cudnnPoolingDescriptor poolingDesc,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
Function to perform forward pooling
|
static int |
cudnnQueryRuntimeError(cudnnHandle handle,
int[] rstatus,
int mode,
cudnnRuntimeTag tag) |
static int |
cudnnReduceTensor(cudnnHandle handle,
cudnnReduceTensorDescriptor reduceTensorDesc,
Pointer indices,
long indicesSizeInBytes,
Pointer workspace,
long workspaceSizeInBytes,
Pointer alpha,
cudnnTensorDescriptor aDesc,
Pointer A,
Pointer beta,
cudnnTensorDescriptor cDesc,
Pointer C)
The indices space is ignored for reduce ops other than min or max.
|
static int |
cudnnReorderFilterAndBias(cudnnHandle handle,
cudnnFilterDescriptor filterDesc,
int reorderType,
Pointer filterData,
Pointer reorderedFilterData,
int reorderBias,
Pointer biasData,
Pointer reorderedBiasData) |
static int |
cudnnRestoreAlgorithm(cudnnHandle handle,
Pointer algoSpace,
long algoSpaceSizeInBytes,
cudnnAlgorithmDescriptor algoDesc)
Deprecated.
|
static int |
cudnnRestoreDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc,
cudnnHandle handle,
float dropout,
Pointer states,
long stateSizeInBytes,
long seed)
Restores the dropout descriptor to a previously saved-off state
|
static int |
cudnnRNNBackwardData_v8(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] devSeqLengths,
cudnnRNNDataDescriptor yDesc,
Pointer y,
Pointer dy,
cudnnRNNDataDescriptor xDesc,
Pointer dx,
cudnnTensorDescriptor hDesc,
Pointer hx,
Pointer dhy,
Pointer dhx,
cudnnTensorDescriptor cDesc,
Pointer cx,
Pointer dcy,
Pointer dcx,
long weightSpaceSize,
Pointer weightSpace,
long workSpaceSize,
Pointer workSpace,
long reserveSpaceSize,
Pointer reserveSpace) |
static int |
cudnnRNNBackwardData(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor[] dyDesc,
Pointer dy,
cudnnTensorDescriptor dhyDesc,
Pointer dhy,
cudnnTensorDescriptor dcyDesc,
Pointer dcy,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnTensorDescriptor[] dxDesc,
Pointer dx,
cudnnTensorDescriptor dhxDesc,
Pointer dhx,
cudnnTensorDescriptor dcxDesc,
Pointer dcx,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNBackwardDataEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnRNNDataDescriptor yDesc,
Pointer y,
cudnnRNNDataDescriptor dyDesc,
Pointer dy,
cudnnRNNDataDescriptor dcDesc,
Pointer dcAttn,
cudnnTensorDescriptor dhyDesc,
Pointer dhy,
cudnnTensorDescriptor dcyDesc,
Pointer dcy,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnRNNDataDescriptor dxDesc,
Pointer dx,
cudnnTensorDescriptor dhxDesc,
Pointer dhx,
cudnnTensorDescriptor dcxDesc,
Pointer dcx,
cudnnRNNDataDescriptor dkDesc,
Pointer dkeys,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNBackwardWeights_v8(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int addGrad,
int[] devSeqLengths,
cudnnRNNDataDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor hDesc,
Pointer hx,
cudnnRNNDataDescriptor yDesc,
Pointer y,
long weightSpaceSize,
Pointer dweightSpace,
long workSpaceSize,
Pointer workSpace,
long reserveSpaceSize,
Pointer reserveSpace) |
static int |
cudnnRNNBackwardWeights(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor[] yDesc,
Pointer y,
Pointer workSpace,
long workSpaceSizeInBytes,
cudnnFilterDescriptor dwDesc,
Pointer dw,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNBackwardWeightsEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnRNNDataDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnRNNDataDescriptor yDesc,
Pointer y,
Pointer workSpace,
long workSpaceSizeInBytes,
cudnnFilterDescriptor dwDesc,
Pointer dw,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNForward(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int fwdMode,
int[] devSeqLengths,
cudnnRNNDataDescriptor xDesc,
Pointer x,
cudnnRNNDataDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor hDesc,
Pointer hx,
Pointer hy,
cudnnTensorDescriptor cDesc,
Pointer cx,
Pointer cy,
long weightSpaceSize,
Pointer weightSpace,
long workSpaceSize,
Pointer workSpace,
long reserveSpaceSize,
Pointer reserveSpace) |
static int |
cudnnRNNForwardInference(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
Pointer workSpace,
long workSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNForwardInferenceEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnRNNDataDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnRNNDataDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
cudnnRNNDataDescriptor kDesc,
Pointer keys,
cudnnRNNDataDescriptor cDesc,
Pointer cAttn,
cudnnRNNDataDescriptor iDesc,
Pointer iAttn,
cudnnRNNDataDescriptor qDesc,
Pointer queries,
Pointer workSpace,
long workSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNForwardTraining(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int seqLength,
cudnnTensorDescriptor[] xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnTensorDescriptor[] yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNForwardTrainingEx(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnRNNDataDescriptor xDesc,
Pointer x,
cudnnTensorDescriptor hxDesc,
Pointer hx,
cudnnTensorDescriptor cxDesc,
Pointer cx,
cudnnFilterDescriptor wDesc,
Pointer w,
cudnnRNNDataDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor hyDesc,
Pointer hy,
cudnnTensorDescriptor cyDesc,
Pointer cy,
cudnnRNNDataDescriptor kDesc,
Pointer keys,
cudnnRNNDataDescriptor cDesc,
Pointer cAttn,
cudnnRNNDataDescriptor iDesc,
Pointer iAttn,
cudnnRNNDataDescriptor qDesc,
Pointer queries,
Pointer workSpace,
long workSpaceSizeInBytes,
Pointer reserveSpace,
long reserveSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnRNNGetClip_v8(cudnnRNNDescriptor rnnDesc,
int[] clipMode,
int[] clipNanOpt,
double[] lclip,
double[] rclip) |
static int |
cudnnRNNGetClip(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int[] clipMode,
int[] clipNanOpt,
double[] lclip,
double[] rclip)
Deprecated.
|
static int |
cudnnRNNSetClip_v8(cudnnRNNDescriptor rnnDesc,
int clipMode,
int clipNanOpt,
double lclip,
double rclip) |
static int |
cudnnRNNSetClip(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int clipMode,
int clipNanOpt,
double lclip,
double rclip)
Deprecated.
|
static int |
cudnnSaveAlgorithm(cudnnHandle handle,
cudnnAlgorithmDescriptor algoDesc,
Pointer algoSpace,
long algoSpaceSizeInBytes)
Deprecated.
|
static int |
cudnnScaleTensor(cudnnHandle handle,
cudnnTensorDescriptor yDesc,
Pointer y,
Pointer alpha)
Scale all values of a tensor by a given factor: y[i] = alpha * y[i]
|
static int |
cudnnSetActivationDescriptor(cudnnActivationDescriptor activationDesc,
int mode,
int reluNanOpt,
double coef) |
static int |
cudnnSetAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc,
int algorithm)
Deprecated.
|
static int |
cudnnSetAlgorithmPerformance(cudnnAlgorithmPerformance algoPerf,
cudnnAlgorithmDescriptor algoDesc,
int status,
float time,
long memory)
Deprecated.
|
static int |
cudnnSetAttnDescriptor(cudnnAttnDescriptor attnDesc,
int attnMode,
int nHeads,
double smScaler,
int dataType,
int computePrec,
int mathType,
cudnnDropoutDescriptor attnDropoutDesc,
cudnnDropoutDescriptor postDropoutDesc,
int qSize,
int kSize,
int vSize,
int qProjSize,
int kProjSize,
int vProjSize,
int oProjSize,
int qoMaxSeqLength,
int kvMaxSeqLength,
int maxBatchSize,
int maxBeamSize) |
static int |
cudnnSetCallback(int mask,
Object udata,
cudnnCallback fptr) |
static int |
cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor convDesc,
int pad_h,
int pad_w,
int u,
int v,
int dilation_h,
int dilation_w,
int mode,
int computeType) |
static int |
cudnnSetConvolutionGroupCount(cudnnConvolutionDescriptor convDesc,
int groupCount) |
static int |
cudnnSetConvolutionMathType(cudnnConvolutionDescriptor convDesc,
int mathType) |
static int |
cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor convDesc,
int arrayLength,
int[] padA,
int[] filterStrideA,
int[] dilationA,
int mode,
int computeType) |
static int |
cudnnSetConvolutionReorderType(cudnnConvolutionDescriptor convDesc,
int reorderType) |
static int |
cudnnSetCTCLossDescriptor_v8(cudnnCTCLossDescriptor ctcLossDesc,
int compType,
int normMode,
int gradMode,
int maxLabelLength) |
static int |
cudnnSetCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc,
int compType) |
static int |
cudnnSetCTCLossDescriptorEx(cudnnCTCLossDescriptor ctcLossDesc,
int compType,
int normMode,
int gradMode) |
static int |
cudnnSetDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc,
cudnnHandle handle,
float dropout,
Pointer states,
long stateSizeInBytes,
long seed) |
static int |
cudnnSetFilter4dDescriptor(cudnnFilterDescriptor filterDesc,
int dataType,
int format,
int k,
int c,
int h,
int w) |
static int |
cudnnSetFilterNdDescriptor(cudnnFilterDescriptor filterDesc,
int dataType,
int format,
int nbDims,
int[] filterDimA)
width of each input filter
|
static int |
cudnnSetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack constPack,
int paramLabel,
Pointer param) |
static int |
cudnnSetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack varPack,
int paramLabel,
Pointer ptr) |
static int |
cudnnSetLRNDescriptor(cudnnLRNDescriptor normDesc,
int lrnN,
double lrnAlpha,
double lrnBeta,
double lrnK)
Uses a window [center-lookBehind, center+lookAhead], where
lookBehind = floor( (lrnN-1)/2 ), lookAhead = lrnN-lookBehind-1.
|
static int |
cudnnSetOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc,
int opTensorOp,
int opTensorCompType,
int opTensorNanOpt) |
static int |
cudnnSetPersistentRNNPlan(cudnnRNNDescriptor rnnDesc,
cudnnPersistentRNNPlan plan)
Deprecated.
|
static int |
cudnnSetPooling2dDescriptor(cudnnPoolingDescriptor poolingDesc,
int mode,
int maxpoolingNanOpt,
int windowHeight,
int windowWidth,
int verticalPadding,
int horizontalPadding,
int verticalStride,
int horizontalStride) |
static int |
cudnnSetPoolingNdDescriptor(cudnnPoolingDescriptor poolingDesc,
int mode,
int maxpoolingNanOpt,
int nbDims,
int[] windowDimA,
int[] paddingA,
int[] strideA) |
static int |
cudnnSetReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc,
int reduceTensorOp,
int reduceTensorCompType,
int reduceTensorNanOpt,
int reduceTensorIndices,
int reduceTensorIndicesType) |
static int |
cudnnSetRNNAlgorithmDescriptor(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
cudnnAlgorithmDescriptor algoDesc)
Deprecated.
|
static int |
cudnnSetRNNBiasMode(cudnnRNNDescriptor rnnDesc,
int biasMode)
Deprecated.
|
static int |
cudnnSetRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc,
int dataType,
int layout,
int maxSeqLength,
int batchSize,
int vectorSize,
int[] seqLengthArray,
Pointer paddingFill) |
static int |
cudnnSetRNNDescriptor_v6(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int hiddenSize,
int numLayers,
cudnnDropoutDescriptor dropoutDesc,
int inputMode,
int direction,
int cellMode,
int algo,
int mathPrec)
Deprecated.
|
static int |
cudnnSetRNNDescriptor_v8(cudnnRNNDescriptor rnnDesc,
int algo,
int cellMode,
int biasMode,
int dirMode,
int inputMode,
int dataType,
int mathPrec,
int mathType,
int inputSize,
int hiddenSize,
int projSize,
int numLayers,
cudnnDropoutDescriptor dropoutDesc,
int auxFlags) |
static int |
cudnnSetRNNMatrixMathType(cudnnRNNDescriptor rnnDesc,
int mType)
Deprecated.
|
static int |
cudnnSetRNNPaddingMode(cudnnRNNDescriptor rnnDesc,
int paddingMode)
Deprecated.
|
static int |
cudnnSetRNNProjectionLayers(cudnnHandle handle,
cudnnRNNDescriptor rnnDesc,
int recProjSize,
int outProjSize)
Deprecated.
|
static int |
cudnnSetSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc,
int dataType,
int nbDims,
int[] dimA,
int[] axes,
long seqLengthArraySize,
int[] seqLengthArray,
Pointer paddingFill) |
static int |
cudnnSetSpatialTransformerNdDescriptor(cudnnSpatialTransformerDescriptor stDesc,
int samplerType,
int dataType,
int nbDims,
int[] dimA) |
static int |
cudnnSetStream(cudnnHandle handle,
cudaStream_t streamId) |
static int |
cudnnSetTensor(cudnnHandle handle,
cudnnTensorDescriptor yDesc,
Pointer y,
Pointer valuePtr)
Set all values of a tensor to a given value: y[i] = value[0]
|
static int |
cudnnSetTensor4dDescriptor(cudnnTensorDescriptor tensorDesc,
int format,
int dataType,
int n,
int c,
int h,
int w) |
static int |
cudnnSetTensor4dDescriptorEx(cudnnTensorDescriptor tensorDesc,
int dataType,
int n,
int c,
int h,
int w,
int nStride,
int cStride,
int hStride,
int wStride)
width of input section
|
static int |
cudnnSetTensorNdDescriptor(cudnnTensorDescriptor tensorDesc,
int dataType,
int nbDims,
int[] dimA,
int[] strideA) |
static int |
cudnnSetTensorNdDescriptorEx(cudnnTensorDescriptor tensorDesc,
int format,
int dataType,
int nbDims,
int[] dimA) |
static int |
cudnnSetTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc,
int nbDims,
int destFormat,
int[] padBeforeA,
int[] padAfterA,
int[] foldA,
int direction)
Initialize a previously created tensor transform descriptor.
|
static int |
cudnnSoftmaxBackward(cudnnHandle handle,
int algo,
int mode,
Pointer alpha,
cudnnTensorDescriptor yDesc,
Pointer y,
cudnnTensorDescriptor dyDesc,
Pointer dy,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx)
Function to perform backward softmax
|
static int |
cudnnSoftmaxForward(cudnnHandle handle,
int algo,
int mode,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
Function to perform forward softmax
|
static int |
cudnnSpatialTfGridGeneratorBackward(cudnnHandle handle,
cudnnSpatialTransformerDescriptor stDesc,
Pointer dgrid,
Pointer dtheta)
Placeholder for future work; should be set to 1 for now
|
static int |
cudnnSpatialTfGridGeneratorForward(cudnnHandle handle,
cudnnSpatialTransformerDescriptor stDesc,
Pointer theta,
Pointer grid) |
static int |
cudnnSpatialTfSamplerBackward(cudnnHandle handle,
cudnnSpatialTransformerDescriptor stDesc,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor dxDesc,
Pointer dx,
Pointer alphaDgrid,
cudnnTensorDescriptor dyDesc,
Pointer dy,
Pointer grid,
Pointer betaDgrid,
Pointer dgrid) |
static int |
cudnnSpatialTfSamplerForward(cudnnHandle handle,
cudnnSpatialTransformerDescriptor stDesc,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer grid,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y) |
static int |
cudnnTransformFilter(cudnnHandle handle,
cudnnTensorTransformDescriptor transDesc,
Pointer alpha,
cudnnFilterDescriptor srcDesc,
Pointer srcData,
Pointer beta,
cudnnFilterDescriptor destDesc,
Pointer destData) |
static int |
cudnnTransformTensor(cudnnHandle handle,
Pointer alpha,
cudnnTensorDescriptor xDesc,
Pointer x,
Pointer beta,
cudnnTensorDescriptor yDesc,
Pointer y)
Tensor layout conversion helper (y = alpha * x + beta * y)
|
static int |
cudnnTransformTensorEx(cudnnHandle handle,
cudnnTensorTransformDescriptor transDesc,
Pointer alpha,
cudnnTensorDescriptor srcDesc,
Pointer srcData,
Pointer beta,
cudnnTensorDescriptor destDesc,
Pointer destData) |
static void |
initialize()
Initializes the native library.
|
static void |
setExceptionsEnabled(boolean enabled)
Enables or disables exceptions.
|
static void |
setLogLevel(LogLevel logLevel)
Set the specified log level for the JCudnn library.
|
public static final int CUDNN_MAJOR
public static final int CUDNN_MINOR
public static final int CUDNN_PATCHLEVEL
public static final int CUDNN_VERSION
public static final int CUDNN_DIM_MAX
public static final double CUDNN_BN_MIN_EPSILON
public static final int CUDNN_SEV_ERROR_EN
public static final int CUDNN_SEV_WARNING_EN
public static final int CUDNN_SEV_INFO_EN
public static final int CUDNN_ATTN_QUERYMAP_ALL_TO_ONE
public static final int CUDNN_ATTN_QUERYMAP_ONE_TO_ONE
public static final int CUDNN_ATTN_DISABLE_PROJ_BIASES
public static final int CUDNN_ATTN_ENABLE_PROJ_BIASES
public static final int CUDNN_ATTN_WKIND_COUNT
public static void initialize()
public static void setExceptionsEnabled(boolean enabled)
Enables or disables exceptions. By default, the methods of this class
only return the cudnnStatus from the native methods.
If exceptions are enabled, a CudaException with a detailed error
message will be thrown if a method is about to return a result code
that is not cudnnStatus.CUDNN_STATUS_SUCCESS.
Parameters:
enabled - Whether exceptions are enabled
public static void setLogLevel(LogLevel logLevel)
Set the specified log level for the JCudnn library.
Parameters:
logLevel - The log level to use.
public static long cudnnGetVersion()
public static long cudnnGetCudartVersion()
public static String cudnnGetErrorString(int status)
public static int cudnnQueryRuntimeError(cudnnHandle handle, int[] rstatus, int mode, cudnnRuntimeTag tag)
public static int cudnnGetProperty(int type, int[] value)
public static int cudnnCreate(cudnnHandle handle)
public static int cudnnDestroy(cudnnHandle handle)
public static int cudnnSetStream(cudnnHandle handle, cudaStream_t streamId)
public static int cudnnGetStream(cudnnHandle handle, cudaStream_t streamId)
public static int cudnnCreateTensorDescriptor(cudnnTensorDescriptor tensorDesc)
public static int cudnnSetTensor4dDescriptor(cudnnTensorDescriptor tensorDesc, int format, int dataType, int n, int c, int h, int w)
public static int cudnnSetTensor4dDescriptorEx(cudnnTensorDescriptor tensorDesc, int dataType, int n, int c, int h, int w, int nStride, int cStride, int hStride, int wStride)
public static int cudnnGetTensor4dDescriptor(cudnnTensorDescriptor tensorDesc, int[] dataType, int[] n, int[] c, int[] h, int[] w, int[] nStride, int[] cStride, int[] hStride, int[] wStride)
public static int cudnnSetTensorNdDescriptor(cudnnTensorDescriptor tensorDesc, int dataType, int nbDims, int[] dimA, int[] strideA)
public static int cudnnSetTensorNdDescriptorEx(cudnnTensorDescriptor tensorDesc, int format, int dataType, int nbDims, int[] dimA)
public static int cudnnGetTensorNdDescriptor(cudnnTensorDescriptor tensorDesc, int nbDimsRequested, int[] dataType, int[] nbDims, int[] dimA, int[] strideA)
public static int cudnnGetTensorSizeInBytes(cudnnTensorDescriptor tensorDesc, long[] size)
public static int cudnnDestroyTensorDescriptor(cudnnTensorDescriptor tensorDesc)
public static int cudnnInitTransformDest(cudnnTensorTransformDescriptor transformDesc, cudnnTensorDescriptor srcDesc, cudnnTensorDescriptor destDesc, long[] destSizeInBytes)
public static int cudnnCreateTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc)
public static int cudnnSetTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc, int nbDims, int destFormat, int[] padBeforeA, int[] padAfterA, int[] foldA, int direction)
public static int cudnnGetTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc, int nbDimsRequested, int[] destFormat, int[] padBeforeA, int[] padAfterA, int[] foldA, int[] direction)
Retrieves the values stored in a previously initialized tensor transform descriptor.
public static int cudnnDestroyTensorTransformDescriptor(cudnnTensorTransformDescriptor transformDesc)
public static int cudnnTransformTensor(cudnnHandle handle, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnTransformTensorEx(cudnnHandle handle, cudnnTensorTransformDescriptor transDesc, Pointer alpha, cudnnTensorDescriptor srcDesc, Pointer srcData, Pointer beta, cudnnTensorDescriptor destDesc, Pointer destData)
public static int cudnnAddTensor(cudnnHandle handle, Pointer alpha, cudnnTensorDescriptor aDesc, Pointer A, Pointer beta, cudnnTensorDescriptor cDesc, Pointer C)
public static int cudnnCreateOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc)
public static int cudnnSetOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc, int opTensorOp, int opTensorCompType, int opTensorNanOpt)
public static int cudnnGetOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc, int[] opTensorOp, int[] opTensorCompType, int[] opTensorNanOpt)
public static int cudnnDestroyOpTensorDescriptor(cudnnOpTensorDescriptor opTensorDesc)
public static int cudnnOpTensor(cudnnHandle handle, cudnnOpTensorDescriptor opTensorDesc, Pointer alpha1, cudnnTensorDescriptor aDesc, Pointer A, Pointer alpha2, cudnnTensorDescriptor bDesc, Pointer B, Pointer beta, cudnnTensorDescriptor cDesc, Pointer C)
public static int cudnnCreateReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc)
public static int cudnnSetReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc, int reduceTensorOp, int reduceTensorCompType, int reduceTensorNanOpt, int reduceTensorIndices, int reduceTensorIndicesType)
public static int cudnnGetReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc, int[] reduceTensorOp, int[] reduceTensorCompType, int[] reduceTensorNanOpt, int[] reduceTensorIndices, int[] reduceTensorIndicesType)
public static int cudnnDestroyReduceTensorDescriptor(cudnnReduceTensorDescriptor reduceTensorDesc)
public static int cudnnGetReductionIndicesSize(cudnnHandle handle, cudnnReduceTensorDescriptor reduceTensorDesc, cudnnTensorDescriptor aDesc, cudnnTensorDescriptor cDesc, long[] sizeInBytes)
public static int cudnnGetReductionWorkspaceSize(cudnnHandle handle, cudnnReduceTensorDescriptor reduceTensorDesc, cudnnTensorDescriptor aDesc, cudnnTensorDescriptor cDesc, long[] sizeInBytes)
public static int cudnnReduceTensor(cudnnHandle handle, cudnnReduceTensorDescriptor reduceTensorDesc, Pointer indices, long indicesSizeInBytes, Pointer workspace, long workspaceSizeInBytes, Pointer alpha, cudnnTensorDescriptor aDesc, Pointer A, Pointer beta, cudnnTensorDescriptor cDesc, Pointer C)
public static int cudnnSetTensor(cudnnHandle handle, cudnnTensorDescriptor yDesc, Pointer y, Pointer valuePtr)
public static int cudnnScaleTensor(cudnnHandle handle, cudnnTensorDescriptor yDesc, Pointer y, Pointer alpha)
public static int cudnnCreateFilterDescriptor(cudnnFilterDescriptor filterDesc)
public static int cudnnSetFilter4dDescriptor(cudnnFilterDescriptor filterDesc, int dataType, int format, int k, int c, int h, int w)
public static int cudnnGetFilter4dDescriptor(cudnnFilterDescriptor filterDesc, int[] dataType, int[] format, int[] k, int[] c, int[] h, int[] w)
public static int cudnnSetFilterNdDescriptor(cudnnFilterDescriptor filterDesc, int dataType, int format, int nbDims, int[] filterDimA)
public static int cudnnGetFilterNdDescriptor(cudnnFilterDescriptor filterDesc, int nbDimsRequested, int[] dataType, int[] format, int[] nbDims, int[] filterDimA)
public static int cudnnGetFilterSizeInBytes(cudnnFilterDescriptor filterDesc, long[] size)
public static int cudnnTransformFilter(cudnnHandle handle, cudnnTensorTransformDescriptor transDesc, Pointer alpha, cudnnFilterDescriptor srcDesc, Pointer srcData, Pointer beta, cudnnFilterDescriptor destDesc, Pointer destData)
public static int cudnnDestroyFilterDescriptor(cudnnFilterDescriptor filterDesc)
public static int cudnnSoftmaxForward(cudnnHandle handle, int algo, int mode, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnCreatePoolingDescriptor(cudnnPoolingDescriptor poolingDesc)
public static int cudnnSetPooling2dDescriptor(cudnnPoolingDescriptor poolingDesc, int mode, int maxpoolingNanOpt, int windowHeight, int windowWidth, int verticalPadding, int horizontalPadding, int verticalStride, int horizontalStride)
public static int cudnnGetPooling2dDescriptor(cudnnPoolingDescriptor poolingDesc, int[] mode, int[] maxpoolingNanOpt, int[] windowHeight, int[] windowWidth, int[] verticalPadding, int[] horizontalPadding, int[] verticalStride, int[] horizontalStride)
public static int cudnnSetPoolingNdDescriptor(cudnnPoolingDescriptor poolingDesc, int mode, int maxpoolingNanOpt, int nbDims, int[] windowDimA, int[] paddingA, int[] strideA)
public static int cudnnGetPoolingNdDescriptor(cudnnPoolingDescriptor poolingDesc, int nbDimsRequested, int[] mode, int[] maxpoolingNanOpt, int[] nbDims, int[] windowDimA, int[] paddingA, int[] strideA)
public static int cudnnGetPoolingNdForwardOutputDim(cudnnPoolingDescriptor poolingDesc, cudnnTensorDescriptor inputTensorDesc, int nbDims, int[] outputTensorDimA)
public static int cudnnGetPooling2dForwardOutputDim(cudnnPoolingDescriptor poolingDesc, cudnnTensorDescriptor inputTensorDesc, int[] n, int[] c, int[] h, int[] w)
public static int cudnnDestroyPoolingDescriptor(cudnnPoolingDescriptor poolingDesc)
public static int cudnnPoolingForward(cudnnHandle handle, cudnnPoolingDescriptor poolingDesc, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnCreateActivationDescriptor(cudnnActivationDescriptor activationDesc)
public static int cudnnSetActivationDescriptor(cudnnActivationDescriptor activationDesc, int mode, int reluNanOpt, double coef)
public static int cudnnGetActivationDescriptor(cudnnActivationDescriptor activationDesc, int[] mode, int[] reluNanOpt, double[] coef)
public static int cudnnDestroyActivationDescriptor(cudnnActivationDescriptor activationDesc)
public static int cudnnActivationForward(cudnnHandle handle, cudnnActivationDescriptor activationDesc, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnCreateLRNDescriptor(cudnnLRNDescriptor normDesc)
Create an instance of an LRN (Local Response Normalization) descriptor. Uses lrnN=5, lrnAlpha=1e-4, lrnBeta=0.75, lrnK=2.0 as defaults from the Krizhevsky'12 ImageNet paper.
public static int cudnnSetLRNDescriptor(cudnnLRNDescriptor normDesc, int lrnN, double lrnAlpha, double lrnBeta, double lrnK)
Uses a window [center-lookBehind, center+lookAhead], where lookBehind = floor( (lrnN-1)/2 ), lookAhead = lrnN-lookBehind-1. Values of double parameters are cast to the tensor data type.
public static int cudnnGetLRNDescriptor(cudnnLRNDescriptor normDesc, int[] lrnN, double[] lrnAlpha, double[] lrnBeta, double[] lrnK)
Retrieve the settings currently stored in an LRN layer descriptor. Any of the provided pointers can be NULL (no corresponding value will be returned).
public static int cudnnDestroyLRNDescriptor(cudnnLRNDescriptor lrnDesc)
public static int cudnnLRNCrossChannelForward(cudnnHandle handle, cudnnLRNDescriptor normDesc, int lrnMode, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnDivisiveNormalizationForward(cudnnHandle handle, cudnnLRNDescriptor normDesc, int mode, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer means, Pointer temp, Pointer temp2, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnDeriveBNTensorDescriptor(cudnnTensorDescriptor derivedBnDesc, cudnnTensorDescriptor xDesc, int mode)
Derives a tensor descriptor from layer data descriptor for BatchNormalization scale, invVariance, bnBias, bnScale tensors. Use this tensor desc for bnScaleBiasMeanVarDesc and bnScaleBiasDiffDesc in Batch Normalization forward and backward functions.
public static int cudnnBatchNormalizationForwardInference(cudnnHandle handle, int mode, Pointer alpha, Pointer beta, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor bnScaleBiasMeanVarDesc, Pointer bnScale, Pointer bnBias, Pointer estimatedMean, Pointer estimatedVariance, double epsilon)
Performs Batch Normalization during Inference: y[i] = bnScale[k]*(x[i]-estimatedMean[k])/sqrt(epsilon+estimatedVariance[k]) + bnBias[k], with bnScale, bnBias, estimatedMean, estimatedVariance tensors indexed according to spatial or per-activation mode. Refer to cudnnBatchNormalizationForwardTraining for notes on function arguments.
public static int cudnnDeriveNormTensorDescriptor(cudnnTensorDescriptor derivedNormScaleBiasDesc, cudnnTensorDescriptor derivedNormMeanVarDesc, cudnnTensorDescriptor xDesc, int mode, int groupCnt)
Derives a tensor descriptor from layer data descriptor for Normalization scale, invVariance, bnBias, bnScale tensors. Use this tensor desc for normScaleBiasMeanVarDesc and normScaleBiasDiffDesc in Normalization forward and backward functions.
public static int cudnnNormalizationForwardInference(cudnnHandle handle, int mode, int normOps, int algo, Pointer alpha, Pointer beta, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor normScaleBiasDesc, Pointer normScale, Pointer normBias, cudnnTensorDescriptor normMeanVarDesc, Pointer estimatedMean, Pointer estimatedVariance, cudnnTensorDescriptor zDesc, Pointer z, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor yDesc, Pointer y, double epsilon, int groupCnt)
Performs Normalization during Inference: y[i] = normScale[k]*(x[i]-estimatedMean[k])/sqrt(epsilon+estimatedVariance[k]) + normBias[k], with normScale, normBias, estimatedMean, estimatedVariance tensors indexed according to per-channel or per-activation mode. Refer to cudnnNormalizationForwardTraining for notes on function arguments.
public static int cudnnCreateSpatialTransformerDescriptor(cudnnSpatialTransformerDescriptor stDesc)
public static int cudnnSetSpatialTransformerNdDescriptor(cudnnSpatialTransformerDescriptor stDesc, int samplerType, int dataType, int nbDims, int[] dimA)
public static int cudnnDestroySpatialTransformerDescriptor(cudnnSpatialTransformerDescriptor stDesc)
public static int cudnnSpatialTfGridGeneratorForward(cudnnHandle handle, cudnnSpatialTransformerDescriptor stDesc, Pointer theta, Pointer grid)
public static int cudnnSpatialTfSamplerForward(cudnnHandle handle, cudnnSpatialTransformerDescriptor stDesc, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer grid, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnCreateDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc)
public static int cudnnDestroyDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc)
public static int cudnnDropoutGetStatesSize(cudnnHandle handle, long[] sizeInBytes)
public static int cudnnDropoutGetReserveSpaceSize(cudnnTensorDescriptor xdesc, long[] sizeInBytes)
public static int cudnnSetDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc, cudnnHandle handle, float dropout, Pointer states, long stateSizeInBytes, long seed)
public static int cudnnRestoreDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc, cudnnHandle handle, float dropout, Pointer states, long stateSizeInBytes, long seed)
public static int cudnnGetDropoutDescriptor(cudnnDropoutDescriptor dropoutDesc, cudnnHandle handle, float[] dropout, Pointer states, long[] seed)
public static int cudnnDropoutForward(cudnnHandle handle, cudnnDropoutDescriptor dropoutDesc, cudnnTensorDescriptor xdesc, Pointer x, cudnnTensorDescriptor ydesc, Pointer y, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnCreateAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc)
@Deprecated public static int cudnnSetAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc, int algorithm)
@Deprecated public static int cudnnGetAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc, int[] algorithm)
@Deprecated public static int cudnnCopyAlgorithmDescriptor(cudnnAlgorithmDescriptor src, cudnnAlgorithmDescriptor dest)
@Deprecated public static int cudnnDestroyAlgorithmDescriptor(cudnnAlgorithmDescriptor algoDesc)
@Deprecated public static int cudnnCreateAlgorithmPerformance(cudnnAlgorithmPerformance[] algoPerf, int numberToCreate)
@Deprecated public static int cudnnSetAlgorithmPerformance(cudnnAlgorithmPerformance algoPerf, cudnnAlgorithmDescriptor algoDesc, int status, float time, long memory)
@Deprecated public static int cudnnGetAlgorithmPerformance(cudnnAlgorithmPerformance algoPerf, cudnnAlgorithmDescriptor algoDesc, int[] status, float[] time, long[] memory)
@Deprecated public static int cudnnDestroyAlgorithmPerformance(cudnnAlgorithmPerformance[] algoPerf, int numberToDestroy)
@Deprecated public static int cudnnGetAlgorithmSpaceSize(cudnnHandle handle, cudnnAlgorithmDescriptor algoDesc, long[] algoSpaceSizeInBytes)
@Deprecated public static int cudnnSaveAlgorithm(cudnnHandle handle, cudnnAlgorithmDescriptor algoDesc, Pointer algoSpace, long algoSpaceSizeInBytes)
@Deprecated public static int cudnnRestoreAlgorithm(cudnnHandle handle, Pointer algoSpace, long algoSpaceSizeInBytes, cudnnAlgorithmDescriptor algoDesc)
public static int cudnnSetCallback(int mask, Object udata, cudnnCallback fptr)
public static int cudnnGetCallback(int[] mask, Object udata, cudnnCallback[] fptr)
public static int cudnnOpsInferVersionCheck()
Cross-library version checker. This function is implemented differently in each sub-library. Each sublib checks whether its own version matches that of its dependencies.
public static int cudnnSoftmaxBackward(cudnnHandle handle, int algo, int mode, Pointer alpha, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor dyDesc, Pointer dy, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx)
public static int cudnnPoolingBackward(cudnnHandle handle, cudnnPoolingDescriptor poolingDesc, Pointer alpha, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx)
public static int cudnnActivationBackward(cudnnHandle handle, cudnnActivationDescriptor activationDesc, Pointer alpha, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx)
public static int cudnnLRNCrossChannelBackward(cudnnHandle handle, cudnnLRNDescriptor normDesc, int lrnMode, Pointer alpha, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx)
public static int cudnnDivisiveNormalizationBackward(cudnnHandle handle, cudnnLRNDescriptor normDesc, int mode, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer means, Pointer dy, Pointer temp, Pointer temp2, Pointer beta, cudnnTensorDescriptor dXdMeansDesc, Pointer dx, Pointer dMeans)
public static int cudnnGetBatchNormalizationForwardTrainingExWorkspaceSize(cudnnHandle handle, int mode, int bnOps, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor zDesc, cudnnTensorDescriptor yDesc, cudnnTensorDescriptor bnScaleBiasMeanVarDesc, cudnnActivationDescriptor activationDesc, long[] sizeInBytes)
public static int cudnnGetBatchNormalizationBackwardExWorkspaceSize(cudnnHandle handle, int mode, int bnOps, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor yDesc, cudnnTensorDescriptor dyDesc, cudnnTensorDescriptor dzDesc, cudnnTensorDescriptor dxDesc, cudnnTensorDescriptor dBnScaleBiasDesc, cudnnActivationDescriptor activationDesc, long[] sizeInBytes)
public static int cudnnGetBatchNormalizationTrainingExReserveSpaceSize(cudnnHandle handle, int mode, int bnOps, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor xDesc, long[] sizeInBytes)
public static int cudnnBatchNormalizationForwardTraining(cudnnHandle handle, int mode, Pointer alpha, Pointer beta, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor yDesc, Pointer y, cudnnTensorDescriptor bnScaleBiasMeanVarDesc, Pointer bnScale, Pointer bnBias, double exponentialAverageFactor, Pointer resultRunningMean, Pointer resultRunningVariance, double epsilon, Pointer resultSaveMean, Pointer resultSaveInvVariance)
public static int cudnnBatchNormalizationForwardTrainingEx(cudnnHandle handle, int mode, int bnOps, Pointer alpha, Pointer beta, cudnnTensorDescriptor xDesc, Pointer xData, cudnnTensorDescriptor zDesc, Pointer zData, cudnnTensorDescriptor yDesc, Pointer yData, cudnnTensorDescriptor bnScaleBiasMeanVarDesc, Pointer bnScale, Pointer bnBias, double exponentialAverageFactor, Pointer resultRunningMean, Pointer resultRunningVariance, double epsilon, Pointer resultSaveMean, Pointer resultSaveInvVariance, cudnnActivationDescriptor activationDesc, Pointer workspace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnBatchNormalizationBackward(cudnnHandle handle, int mode, Pointer alphaDataDiff, Pointer betaDataDiff, Pointer alphaParamDiff, Pointer betaParamDiff, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnTensorDescriptor dxDesc, Pointer dx, cudnnTensorDescriptor dBnScaleBiasDesc, Pointer bnScale, Pointer dBnScaleResult, Pointer dBnBiasResult, double epsilon, Pointer savedMean, Pointer savedInvVariance)
public static int cudnnBatchNormalizationBackwardEx(cudnnHandle handle, int mode, int bnOps, Pointer alphaDataDiff, Pointer betaDataDiff, Pointer alphaParamDiff, Pointer betaParamDiff, cudnnTensorDescriptor xDesc, Pointer xData, cudnnTensorDescriptor yDesc, Pointer yData, cudnnTensorDescriptor dyDesc, Pointer dyData, cudnnTensorDescriptor dzDesc, Pointer dzData, cudnnTensorDescriptor dxDesc, Pointer dxData, cudnnTensorDescriptor dBnScaleBiasDesc, Pointer bnScaleData, Pointer bnBiasData, Pointer dBnScaleData, Pointer dBnBiasData, double epsilon, Pointer savedMean, Pointer savedInvVariance, cudnnActivationDescriptor activationDesc, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnGetNormalizationForwardTrainingWorkspaceSize(cudnnHandle handle, int mode, int normOps, int algo, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor zDesc, cudnnTensorDescriptor yDesc, cudnnTensorDescriptor normScaleBiasDesc, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor normMeanVarDesc, long[] sizeInBytes, int groupCnt)
public static int cudnnGetNormalizationBackwardWorkspaceSize(cudnnHandle handle, int mode, int normOps, int algo, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor yDesc, cudnnTensorDescriptor dyDesc, cudnnTensorDescriptor dzDesc, cudnnTensorDescriptor dxDesc, cudnnTensorDescriptor dNormScaleBiasDesc, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor normMeanVarDesc, long[] sizeInBytes, int groupCnt)
public static int cudnnGetNormalizationTrainingReserveSpaceSize(cudnnHandle handle, int mode, int normOps, int algo, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor xDesc, long[] sizeInBytes, int groupCnt)
public static int cudnnNormalizationForwardTraining(cudnnHandle handle, int mode, int normOps, int algo, Pointer alpha, Pointer beta, cudnnTensorDescriptor xDesc, Pointer xData, cudnnTensorDescriptor normScaleBiasDesc, Pointer normScale, Pointer normBias, double exponentialAverageFactor, cudnnTensorDescriptor normMeanVarDesc, Pointer resultRunningMean, Pointer resultRunningVariance, double epsilon, Pointer resultSaveMean, Pointer resultSaveInvVariance, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor zDesc, Pointer zData, cudnnTensorDescriptor yDesc, Pointer yData, Pointer workspace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes, int groupCnt)
public static int cudnnNormalizationBackward(cudnnHandle handle, int mode, int normOps, int algo, Pointer alphaDataDiff, Pointer betaDataDiff, Pointer alphaParamDiff, Pointer betaParamDiff, cudnnTensorDescriptor xDesc, Pointer xData, cudnnTensorDescriptor yDesc, Pointer yData, cudnnTensorDescriptor dyDesc, Pointer dyData, cudnnTensorDescriptor dzDesc, Pointer dzData, cudnnTensorDescriptor dxDesc, Pointer dxData, cudnnTensorDescriptor dNormScaleBiasDesc, Pointer normScaleData, Pointer normBiasData, Pointer dNormScaleData, Pointer dNormBiasData, double epsilon, cudnnTensorDescriptor normMeanVarDesc, Pointer savedMean, Pointer savedInvVariance, cudnnActivationDescriptor activationDesc, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes, int groupCnt)
public static int cudnnSpatialTfGridGeneratorBackward(cudnnHandle handle, cudnnSpatialTransformerDescriptor stDesc, Pointer dgrid, Pointer dtheta)
public static int cudnnSpatialTfSamplerBackward(cudnnHandle handle, cudnnSpatialTransformerDescriptor stDesc, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx, Pointer alphaDgrid, cudnnTensorDescriptor dyDesc, Pointer dy, Pointer grid, Pointer betaDgrid, Pointer dgrid)
public static int cudnnDropoutBackward(cudnnHandle handle, cudnnDropoutDescriptor dropoutDesc, cudnnTensorDescriptor dydesc, Pointer dy, cudnnTensorDescriptor dxdesc, Pointer dx, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnOpsTrainVersionCheck()
Cross-library version checker. This function is implemented differently in each sub-library. Each sublib checks whether its own version matches that of its dependencies.
public static int cudnnCreateRNNDescriptor(cudnnRNNDescriptor rnnDesc)
public static int cudnnDestroyRNNDescriptor(cudnnRNNDescriptor rnnDesc)
public static int cudnnSetRNNDescriptor_v8(cudnnRNNDescriptor rnnDesc, int algo, int cellMode, int biasMode, int dirMode, int inputMode, int dataType, int mathPrec, int mathType, int inputSize, int hiddenSize, int projSize, int numLayers, cudnnDropoutDescriptor dropoutDesc, int auxFlags)
public static int cudnnGetRNNDescriptor_v8(cudnnRNNDescriptor rnnDesc, int[] algo, int[] cellMode, int[] biasMode, int[] dirMode, int[] inputMode, int[] dataType, int[] mathPrec, int[] mathType, int[] inputSize, int[] hiddenSize, int[] projSize, int[] numLayers, cudnnDropoutDescriptor dropoutDesc, int[] auxFlags)
@Deprecated public static int cudnnSetRNNDescriptor_v6(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int hiddenSize, int numLayers, cudnnDropoutDescriptor dropoutDesc, int inputMode, int direction, int cellMode, int algo, int mathPrec)
mathPrec in cudnnSetRNNDescriptor_v6() specifies the compute precision. Compute precision is further modified by cudnnSetRNNMatrixMathType(). dataType in cudnnGetRNNParamsSize() and wDesc specify the weight storage. Dropout is applied between RNN layers, not between recurrent steps.
@Deprecated public static int cudnnGetRNNDescriptor_v6(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] hiddenSize, int[] numLayers, cudnnDropoutDescriptor dropoutDesc, int[] inputMode, int[] direction, int[] cellMode, int[] algo, int[] mathPrec)
@Deprecated public static int cudnnSetRNNMatrixMathType(cudnnRNNDescriptor rnnDesc, int mType)
@Deprecated public static int cudnnGetRNNMatrixMathType(cudnnRNNDescriptor rnnDesc, int[] mType)
@Deprecated public static int cudnnSetRNNBiasMode(cudnnRNNDescriptor rnnDesc, int biasMode)
@Deprecated public static int cudnnGetRNNBiasMode(cudnnRNNDescriptor rnnDesc, int[] biasMode)
public static int cudnnRNNSetClip_v8(cudnnRNNDescriptor rnnDesc, int clipMode, int clipNanOpt, double lclip, double rclip)
public static int cudnnRNNGetClip_v8(cudnnRNNDescriptor rnnDesc, int[] clipMode, int[] clipNanOpt, double[] lclip, double[] rclip)
@Deprecated public static int cudnnRNNSetClip(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int clipMode, int clipNanOpt, double lclip, double rclip)
@Deprecated public static int cudnnRNNGetClip(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] clipMode, int[] clipNanOpt, double[] lclip, double[] rclip)
@Deprecated public static int cudnnSetRNNProjectionLayers(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int recProjSize, int outProjSize)
@Deprecated public static int cudnnGetRNNProjectionLayers(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] recProjSize, int[] outProjSize)
@Deprecated public static int cudnnCreatePersistentRNNPlan(cudnnRNNDescriptor rnnDesc, int minibatch, int dataType, cudnnPersistentRNNPlan plan)
@Deprecated public static int cudnnDestroyPersistentRNNPlan(cudnnPersistentRNNPlan plan)
@Deprecated public static int cudnnSetPersistentRNNPlan(cudnnRNNDescriptor rnnDesc, cudnnPersistentRNNPlan plan)
public static int cudnnBuildRNNDynamic(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int miniBatch)
@Deprecated public static int cudnnGetRNNWorkspaceSize(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, long[] sizeInBytes)
@Deprecated public static int cudnnGetRNNTrainingReserveSize(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, long[] sizeInBytes)
public static int cudnnGetRNNTempSpaceSizes(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int fMode, cudnnRNNDataDescriptor xDesc, long[] workSpaceSize, long[] reserveSpaceSize)
@Deprecated public static int cudnnGetRNNParamsSize(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnTensorDescriptor xDesc, long[] sizeInBytes, int dataType)
public static int cudnnGetRNNWeightSpaceSize(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, long[] weightSpaceSize)
@Deprecated public static int cudnnGetRNNLinLayerMatrixParams(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int pseudoLayer, cudnnTensorDescriptor xDesc, cudnnFilterDescriptor wDesc, Pointer w, int linLayerID, cudnnFilterDescriptor linLayerMatDesc, Pointer linLayerMat)
@Deprecated public static int cudnnGetRNNLinLayerBiasParams(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int pseudoLayer, cudnnTensorDescriptor xDesc, cudnnFilterDescriptor wDesc, Pointer w, int linLayerID, cudnnFilterDescriptor linLayerBiasDesc, Pointer linLayerBias)
public static int cudnnGetRNNWeightParams(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int pseudoLayer, long weightSpaceSize, Pointer weightSpace, int linLayerID, cudnnTensorDescriptor mDesc, Pointer mAddr, cudnnTensorDescriptor bDesc, Pointer bAddr)
@Deprecated public static int cudnnRNNForwardInference(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, Pointer workSpace, long workSpaceSizeInBytes)
@Deprecated public static int cudnnSetRNNPaddingMode(cudnnRNNDescriptor rnnDesc, int paddingMode)
@Deprecated public static int cudnnGetRNNPaddingMode(cudnnRNNDescriptor rnnDesc, int[] paddingMode)
public static int cudnnCreateRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc)
public static int cudnnDestroyRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc)
public static int cudnnSetRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc, int dataType, int layout, int maxSeqLength, int batchSize, int vectorSize, int[] seqLengthArray, Pointer paddingFill)
public static int cudnnGetRNNDataDescriptor(cudnnRNNDataDescriptor rnnDataDesc, int[] dataType, int[] layout, int[] maxSeqLength, int[] batchSize, int[] vectorSize, int arrayLengthRequested, int[] seqLengthArray, Pointer paddingFill)
@Deprecated public static int cudnnRNNForwardInferenceEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnRNNDataDescriptor xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnRNNDataDescriptor yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, cudnnRNNDataDescriptor kDesc, Pointer keys, cudnnRNNDataDescriptor cDesc, Pointer cAttn, cudnnRNNDataDescriptor iDesc, Pointer iAttn, cudnnRNNDataDescriptor qDesc, Pointer queries, Pointer workSpace, long workSpaceSizeInBytes)
public static int cudnnRNNForward(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int fwdMode, int[] devSeqLengths, cudnnRNNDataDescriptor xDesc, Pointer x, cudnnRNNDataDescriptor yDesc, Pointer y, cudnnTensorDescriptor hDesc, Pointer hx, Pointer hy, cudnnTensorDescriptor cDesc, Pointer cx, Pointer cy, long weightSpaceSize, Pointer weightSpace, long workSpaceSize, Pointer workSpace, long reserveSpaceSize, Pointer reserveSpace)
@Deprecated public static int cudnnSetRNNAlgorithmDescriptor(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnAlgorithmDescriptor algoDesc)
@Deprecated public static int cudnnGetRNNForwardInferenceAlgorithmMaxCount(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] count)
@Deprecated public static int cudnnFindRNNForwardInferenceAlgorithmEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, float findIntensity, int requestedAlgoCount, int[] returnedAlgoCount, cudnnAlgorithmPerformance[] perfResults, Pointer workspace, long workSpaceSizeInBytes)
public static int cudnnCreateSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc)
public static int cudnnDestroySeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc)
public static int cudnnSetSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc, int dataType, int nbDims, int[] dimA, int[] axes, long seqLengthArraySize, int[] seqLengthArray, Pointer paddingFill)
public static int cudnnGetSeqDataDescriptor(cudnnSeqDataDescriptor seqDataDesc, int[] dataType, int[] nbDims, int nbDimsRequested, int[] dimA, int[] axes, long[] seqLengthArraySize, long seqLengthSizeRequested, int[] seqLengthArray, Pointer paddingFill)
public static int cudnnCreateAttnDescriptor(cudnnAttnDescriptor attnDesc)
public static int cudnnDestroyAttnDescriptor(cudnnAttnDescriptor attnDesc)
public static int cudnnSetAttnDescriptor(cudnnAttnDescriptor attnDesc, int attnMode, int nHeads, double smScaler, int dataType, int computePrec, int mathType, cudnnDropoutDescriptor attnDropoutDesc, cudnnDropoutDescriptor postDropoutDesc, int qSize, int kSize, int vSize, int qProjSize, int kProjSize, int vProjSize, int oProjSize, int qoMaxSeqLength, int kvMaxSeqLength, int maxBatchSize, int maxBeamSize)
public static int cudnnGetAttnDescriptor(cudnnAttnDescriptor attnDesc, int[] attnMode, int[] nHeads, double[] smScaler, int[] dataType, int[] computePrec, int[] mathType, cudnnDropoutDescriptor attnDropoutDesc, cudnnDropoutDescriptor postDropoutDesc, int[] qSize, int[] kSize, int[] vSize, int[] qProjSize, int[] kProjSize, int[] vProjSize, int[] oProjSize, int[] qoMaxSeqLength, int[] kvMaxSeqLength, int[] maxBatchSize, int[] maxBeamSize)
public static int cudnnGetMultiHeadAttnBuffers(cudnnHandle handle, cudnnAttnDescriptor attnDesc, long[] weightSizeInBytes, long[] workSpaceSizeInBytes, long[] reserveSpaceSizeInBytes)
public static int cudnnGetMultiHeadAttnWeights(cudnnHandle handle, cudnnAttnDescriptor attnDesc, int wKind, long weightSizeInBytes, Pointer weights, cudnnTensorDescriptor wDesc, Pointer wAddr)
public static int cudnnMultiHeadAttnForward(cudnnHandle handle, cudnnAttnDescriptor attnDesc, int currIdx, int[] loWinIdx, int[] hiWinIdx, int[] devSeqLengthsQO, int[] devSeqLengthsKV, cudnnSeqDataDescriptor qDesc, Pointer queries, Pointer residuals, cudnnSeqDataDescriptor kDesc, Pointer keys, cudnnSeqDataDescriptor vDesc, Pointer values, cudnnSeqDataDescriptor oDesc, Pointer out, long weightSizeInBytes, Pointer weights, long workSpaceSizeInBytes, Pointer workSpace, long reserveSpaceSizeInBytes, Pointer reserveSpace)
public static int cudnnAdvInferVersionCheck()
Cross-library version checker. This function is implemented differently in each sub-library. Each sublib checks whether its own version matches that of its dependencies.
@Deprecated public static int cudnnRNNForwardTraining(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnRNNBackwardData(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor[] dyDesc, Pointer dy, cudnnTensorDescriptor dhyDesc, Pointer dhy, cudnnTensorDescriptor dcyDesc, Pointer dcy, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnTensorDescriptor[] dxDesc, Pointer dx, cudnnTensorDescriptor dhxDesc, Pointer dhx, cudnnTensorDescriptor dcxDesc, Pointer dcx, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnRNNBackwardData_v8(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] devSeqLengths, cudnnRNNDataDescriptor yDesc, Pointer y, Pointer dy, cudnnRNNDataDescriptor xDesc, Pointer dx, cudnnTensorDescriptor hDesc, Pointer hx, Pointer dhy, Pointer dhx, cudnnTensorDescriptor cDesc, Pointer cx, Pointer dcy, Pointer dcx, long weightSpaceSize, Pointer weightSpace, long workSpaceSize, Pointer workSpace, long reserveSpaceSize, Pointer reserveSpace)
@Deprecated public static int cudnnRNNBackwardWeights(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor[] yDesc, Pointer y, Pointer workSpace, long workSpaceSizeInBytes, cudnnFilterDescriptor dwDesc, Pointer dw, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnRNNBackwardWeights_v8(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int addGrad, int[] devSeqLengths, cudnnRNNDataDescriptor xDesc, Pointer x, cudnnTensorDescriptor hDesc, Pointer hx, cudnnRNNDataDescriptor yDesc, Pointer y, long weightSpaceSize, Pointer dweightSpace, long workSpaceSize, Pointer workSpace, long reserveSpaceSize, Pointer reserveSpace)
@Deprecated public static int cudnnRNNForwardTrainingEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnRNNDataDescriptor xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnRNNDataDescriptor yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, cudnnRNNDataDescriptor kDesc, Pointer keys, cudnnRNNDataDescriptor cDesc, Pointer cAttn, cudnnRNNDataDescriptor iDesc, Pointer iAttn, cudnnRNNDataDescriptor qDesc, Pointer queries, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnRNNBackwardDataEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnRNNDataDescriptor yDesc, Pointer y, cudnnRNNDataDescriptor dyDesc, Pointer dy, cudnnRNNDataDescriptor dcDesc, Pointer dcAttn, cudnnTensorDescriptor dhyDesc, Pointer dhy, cudnnTensorDescriptor dcyDesc, Pointer dcy, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnRNNDataDescriptor dxDesc, Pointer dx, cudnnTensorDescriptor dhxDesc, Pointer dhx, cudnnTensorDescriptor dcxDesc, Pointer dcx, cudnnRNNDataDescriptor dkDesc, Pointer dkeys, Pointer workSpace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnRNNBackwardWeightsEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, cudnnRNNDataDescriptor xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnRNNDataDescriptor yDesc, Pointer y, Pointer workSpace, long workSpaceSizeInBytes, cudnnFilterDescriptor dwDesc, Pointer dw, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnGetRNNForwardTrainingAlgorithmMaxCount(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] count)
@Deprecated public static int cudnnFindRNNForwardTrainingAlgorithmEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor hyDesc, Pointer hy, cudnnTensorDescriptor cyDesc, Pointer cy, float findIntensity, int requestedAlgoCount, int[] returnedAlgoCount, cudnnAlgorithmPerformance[] perfResults, Pointer workspace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnGetRNNBackwardDataAlgorithmMaxCount(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] count)
@Deprecated public static int cudnnFindRNNBackwardDataAlgorithmEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] yDesc, Pointer y, cudnnTensorDescriptor[] dyDesc, Pointer dy, cudnnTensorDescriptor dhyDesc, Pointer dhy, cudnnTensorDescriptor dcyDesc, Pointer dcy, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor cxDesc, Pointer cx, cudnnTensorDescriptor[] dxDesc, Pointer dx, cudnnTensorDescriptor dhxDesc, Pointer dhx, cudnnTensorDescriptor dcxDesc, Pointer dcx, float findIntensity, int requestedAlgoCount, int[] returnedAlgoCount, cudnnAlgorithmPerformance[] perfResults, Pointer workspace, long workSpaceSizeInBytes, Pointer reserveSpace, long reserveSpaceSizeInBytes)
@Deprecated public static int cudnnGetRNNBackwardWeightsAlgorithmMaxCount(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int[] count)
@Deprecated public static int cudnnFindRNNBackwardWeightsAlgorithmEx(cudnnHandle handle, cudnnRNNDescriptor rnnDesc, int seqLength, cudnnTensorDescriptor[] xDesc, Pointer x, cudnnTensorDescriptor hxDesc, Pointer hx, cudnnTensorDescriptor[] yDesc, Pointer y, float findIntensity, int requestedAlgoCount, int[] returnedAlgoCount, cudnnAlgorithmPerformance[] perfResults, Pointer workspace, long workSpaceSizeInBytes, cudnnFilterDescriptor dwDesc, Pointer dw, Pointer reserveSpace, long reserveSpaceSizeInBytes)
public static int cudnnMultiHeadAttnBackwardData(cudnnHandle handle, cudnnAttnDescriptor attnDesc, int[] loWinIdx, int[] hiWinIdx, int[] devSeqLengthsDQDO, int[] devSeqLengthsDKDV, cudnnSeqDataDescriptor doDesc, Pointer dout, cudnnSeqDataDescriptor dqDesc, Pointer dqueries, Pointer queries, cudnnSeqDataDescriptor dkDesc, Pointer dkeys, Pointer keys, cudnnSeqDataDescriptor dvDesc, Pointer dvalues, Pointer values, long weightSizeInBytes, Pointer weights, long workSpaceSizeInBytes, Pointer workSpace, long reserveSpaceSizeInBytes, Pointer reserveSpace)
public static int cudnnMultiHeadAttnBackwardWeights(cudnnHandle handle, cudnnAttnDescriptor attnDesc, int addGrad, cudnnSeqDataDescriptor qDesc, Pointer queries, cudnnSeqDataDescriptor kDesc, Pointer keys, cudnnSeqDataDescriptor vDesc, Pointer values, cudnnSeqDataDescriptor doDesc, Pointer dout, long weightSizeInBytes, Pointer weights, Pointer dweights, long workSpaceSizeInBytes, Pointer workSpace, long reserveSpaceSizeInBytes, Pointer reserveSpace)
public static int cudnnCreateCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc)
public static int cudnnSetCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc, int compType)
public static int cudnnSetCTCLossDescriptorEx(cudnnCTCLossDescriptor ctcLossDesc, int compType, int normMode, int gradMode)
public static int cudnnSetCTCLossDescriptor_v8(cudnnCTCLossDescriptor ctcLossDesc, int compType, int normMode, int gradMode, int maxLabelLength)
public static int cudnnGetCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc, int[] compType)
public static int cudnnGetCTCLossDescriptorEx(cudnnCTCLossDescriptor ctcLossDesc, int[] compType, int[] normMode, int[] gradMode)
public static int cudnnGetCTCLossDescriptor_v8(cudnnCTCLossDescriptor ctcLossDesc, int[] compType, int[] normMode, int[] gradMode, int[] maxLabelLength)
public static int cudnnDestroyCTCLossDescriptor(cudnnCTCLossDescriptor ctcLossDesc)
public static int cudnnCTCLoss(cudnnHandle handle, cudnnTensorDescriptor probsDesc, Pointer probs, int[] hostLabels, int[] hostLabelLengths, int[] hostInputLengths, Pointer costs, cudnnTensorDescriptor gradientsDesc, Pointer gradients, int algo, cudnnCTCLossDescriptor ctcLossDesc, Pointer workspace, long workSpaceSizeInBytes)
public static int cudnnCTCLoss_v8(cudnnHandle handle, int algo, cudnnCTCLossDescriptor ctcLossDesc, cudnnTensorDescriptor probsDesc, Pointer probs, Pointer labels, Pointer labelLengths, Pointer inputLengths, Pointer costs, cudnnTensorDescriptor gradientsDesc, Pointer gradients, long workSpaceSizeInBytes, Pointer workspace)
public static int cudnnGetCTCLossWorkspaceSize(cudnnHandle handle, cudnnTensorDescriptor probsDesc, cudnnTensorDescriptor gradientsDesc, int[] labels, int[] labelLengths, int[] inputLengths, int algo, cudnnCTCLossDescriptor ctcLossDesc, long[] sizeInBytes)
public static int cudnnGetCTCLossWorkspaceSize_v8(cudnnHandle handle, int algo, cudnnCTCLossDescriptor ctcLossDesc, cudnnTensorDescriptor probsDesc, cudnnTensorDescriptor gradientsDesc, long[] sizeInBytes)
public static int cudnnAdvTrainVersionCheck()
Cross-library version checker. This function is implemented differently in each sub-library. Each sub-library checks whether its own version matches that of its dependencies.
public static int cudnnCreateConvolutionDescriptor(cudnnConvolutionDescriptor convDesc)
public static int cudnnDestroyConvolutionDescriptor(cudnnConvolutionDescriptor convDesc)
public static int cudnnSetConvolutionMathType(cudnnConvolutionDescriptor convDesc, int mathType)
public static int cudnnGetConvolutionMathType(cudnnConvolutionDescriptor convDesc, int[] mathType)
public static int cudnnSetConvolutionGroupCount(cudnnConvolutionDescriptor convDesc, int groupCount)
public static int cudnnGetConvolutionGroupCount(cudnnConvolutionDescriptor convDesc, int[] groupCount)
public static int cudnnSetConvolutionReorderType(cudnnConvolutionDescriptor convDesc, int reorderType)
public static int cudnnGetConvolutionReorderType(cudnnConvolutionDescriptor convDesc, int[] reorderType)
public static int cudnnSetConvolution2dDescriptor(cudnnConvolutionDescriptor convDesc, int pad_h, int pad_w, int u, int v, int dilation_h, int dilation_w, int mode, int computeType)
public static int cudnnGetConvolution2dDescriptor(cudnnConvolutionDescriptor convDesc, int[] pad_h, int[] pad_w, int[] u, int[] v, int[] dilation_h, int[] dilation_w, int[] mode, int[] computeType)
public static int cudnnSetConvolutionNdDescriptor(cudnnConvolutionDescriptor convDesc, int arrayLength, int[] padA, int[] filterStrideA, int[] dilationA, int mode, int computeType)
public static int cudnnGetConvolutionNdDescriptor(cudnnConvolutionDescriptor convDesc, int arrayLengthRequested, int[] arrayLength, int[] padA, int[] strideA, int[] dilationA, int[] mode, int[] computeType)
public static int cudnnGetConvolution2dForwardOutputDim(cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor inputTensorDesc, cudnnFilterDescriptor filterDesc, int[] n, int[] c, int[] h, int[] w)
public static int cudnnGetConvolutionNdForwardOutputDim(cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor inputTensorDesc, cudnnFilterDescriptor filterDesc, int nbDims, int[] tensorOuputDimA)
public static int cudnnGetConvolutionForwardAlgorithmMaxCount(cudnnHandle handle, int[] count)
public static int cudnnGetConvolutionForwardAlgorithm_v7(cudnnHandle handle, cudnnTensorDescriptor srcDesc, cudnnFilterDescriptor filterDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor destDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionFwdAlgoPerf[] perfResults)
public static int cudnnFindConvolutionForwardAlgorithm(cudnnHandle handle, cudnnTensorDescriptor xDesc, cudnnFilterDescriptor wDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor yDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionFwdAlgoPerf[] perfResults)
public static int cudnnFindConvolutionForwardAlgorithmEx(cudnnHandle handle, cudnnTensorDescriptor xDesc, Pointer x, cudnnFilterDescriptor wDesc, Pointer w, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor yDesc, Pointer y, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionFwdAlgoPerf[] perfResults, Pointer workSpace, long workSpaceSizeInBytes)
public static int cudnnIm2Col(cudnnHandle handle, cudnnTensorDescriptor xDesc, Pointer x, cudnnFilterDescriptor wDesc, cudnnConvolutionDescriptor convDesc, Pointer colBuffer)
public static int cudnnReorderFilterAndBias(cudnnHandle handle, cudnnFilterDescriptor filterDesc, int reorderType, Pointer filterData, Pointer reorderedFilterData, int reorderBias, Pointer biasData, Pointer reorderedBiasData)
public static int cudnnGetConvolutionForwardWorkspaceSize(cudnnHandle handle, cudnnTensorDescriptor xDesc, cudnnFilterDescriptor wDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor yDesc, int algo, long[] sizeInBytes)
public static int cudnnConvolutionForward(cudnnHandle handle, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, cudnnFilterDescriptor wDesc, Pointer w, cudnnConvolutionDescriptor convDesc, int algo, Pointer workSpace, long workSpaceSizeInBytes, Pointer beta, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnConvolutionBiasActivationForward(cudnnHandle handle, Pointer alpha1, cudnnTensorDescriptor xDesc, Pointer x, cudnnFilterDescriptor wDesc, Pointer w, cudnnConvolutionDescriptor convDesc, int algo, Pointer workSpace, long workSpaceSizeInBytes, Pointer alpha2, cudnnTensorDescriptor zDesc, Pointer z, cudnnTensorDescriptor biasDesc, Pointer bias, cudnnActivationDescriptor activationDesc, cudnnTensorDescriptor yDesc, Pointer y)
public static int cudnnGetConvolutionBackwardDataAlgorithmMaxCount(cudnnHandle handle, int[] count)
public static int cudnnFindConvolutionBackwardDataAlgorithm(cudnnHandle handle, cudnnFilterDescriptor wDesc, cudnnTensorDescriptor dyDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor dxDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdDataAlgoPerf[] perfResults)
public static int cudnnFindConvolutionBackwardDataAlgorithmEx(cudnnHandle handle, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor dxDesc, Pointer dx, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdDataAlgoPerf[] perfResults, Pointer workSpace, long workSpaceSizeInBytes)
public static int cudnnGetConvolutionBackwardDataAlgorithm_v7(cudnnHandle handle, cudnnFilterDescriptor filterDesc, cudnnTensorDescriptor diffDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor gradDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdDataAlgoPerf[] perfResults)
public static int cudnnGetConvolutionBackwardDataWorkspaceSize(cudnnHandle handle, cudnnFilterDescriptor wDesc, cudnnTensorDescriptor dyDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor dxDesc, int algo, long[] sizeInBytes)
public static int cudnnConvolutionBackwardData(cudnnHandle handle, Pointer alpha, cudnnFilterDescriptor wDesc, Pointer w, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnConvolutionDescriptor convDesc, int algo, Pointer workSpace, long workSpaceSizeInBytes, Pointer beta, cudnnTensorDescriptor dxDesc, Pointer dx)
public static int cudnnGetFoldedConvBackwardDataDescriptors(cudnnHandle handle, cudnnFilterDescriptor filterDesc, cudnnTensorDescriptor diffDesc, cudnnConvolutionDescriptor convDesc, cudnnTensorDescriptor gradDesc, int transformFormat, cudnnFilterDescriptor foldedFilterDesc, cudnnTensorDescriptor paddedDiffDesc, cudnnConvolutionDescriptor foldedConvDesc, cudnnTensorDescriptor foldedGradDesc, cudnnTensorTransformDescriptor filterFoldTransDesc, cudnnTensorTransformDescriptor diffPadTransDesc, cudnnTensorTransformDescriptor gradFoldTransDesc, cudnnTensorTransformDescriptor gradUnfoldTransDesc)
public static int cudnnCnnInferVersionCheck()
public static int cudnnGetConvolutionBackwardFilterAlgorithmMaxCount(cudnnHandle handle, int[] count)
public static int cudnnFindConvolutionBackwardFilterAlgorithm(cudnnHandle handle, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor dyDesc, cudnnConvolutionDescriptor convDesc, cudnnFilterDescriptor dwDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdFilterAlgoPerf[] perfResults)
public static int cudnnFindConvolutionBackwardFilterAlgorithmEx(cudnnHandle handle, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor dyDesc, Pointer y, cudnnConvolutionDescriptor convDesc, cudnnFilterDescriptor dwDesc, Pointer dw, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdFilterAlgoPerf[] perfResults, Pointer workSpace, long workSpaceSizeInBytes)
public static int cudnnGetConvolutionBackwardFilterAlgorithm_v7(cudnnHandle handle, cudnnTensorDescriptor srcDesc, cudnnTensorDescriptor diffDesc, cudnnConvolutionDescriptor convDesc, cudnnFilterDescriptor gradDesc, int requestedAlgoCount, int[] returnedAlgoCount, cudnnConvolutionBwdFilterAlgoPerf[] perfResults)
public static int cudnnGetConvolutionBackwardFilterWorkspaceSize(cudnnHandle handle, cudnnTensorDescriptor xDesc, cudnnTensorDescriptor dyDesc, cudnnConvolutionDescriptor convDesc, cudnnFilterDescriptor gradDesc, int algo, long[] sizeInBytes)
public static int cudnnConvolutionBackwardFilter(cudnnHandle handle, Pointer alpha, cudnnTensorDescriptor xDesc, Pointer x, cudnnTensorDescriptor dyDesc, Pointer dy, cudnnConvolutionDescriptor convDesc, int algo, Pointer workSpace, long workSpaceSizeInBytes, Pointer beta, cudnnFilterDescriptor dwDesc, Pointer dw)
public static int cudnnConvolutionBackwardBias(cudnnHandle handle, Pointer alpha, cudnnTensorDescriptor dyDesc, Pointer dy, Pointer beta, cudnnTensorDescriptor dbDesc, Pointer db)
public static int cudnnCreateFusedOpsConstParamPack(cudnnFusedOpsConstParamPack constPack, int ops)
public static int cudnnDestroyFusedOpsConstParamPack(cudnnFusedOpsConstParamPack constPack)
public static int cudnnSetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack constPack, int paramLabel, Pointer param)
public static int cudnnGetFusedOpsConstParamPackAttribute(cudnnFusedOpsConstParamPack constPack, int paramLabel, Pointer param, int[] isNULL)
public static int cudnnCreateFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack varPack, int ops)
public static int cudnnDestroyFusedOpsVariantParamPack(cudnnFusedOpsVariantParamPack varPack)
public static int cudnnSetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack varPack, int paramLabel, Pointer ptr)
public static int cudnnGetFusedOpsVariantParamPackAttribute(cudnnFusedOpsVariantParamPack varPack, int paramLabel, Pointer ptr)
public static int cudnnCreateFusedOpsPlan(cudnnFusedOpsPlan plan, int ops)
public static int cudnnDestroyFusedOpsPlan(cudnnFusedOpsPlan plan)
public static int cudnnMakeFusedOpsPlan(cudnnHandle handle, cudnnFusedOpsPlan plan, cudnnFusedOpsConstParamPack constPack, long[] workspaceSizeInBytes)
public static int cudnnFusedOpsExecute(cudnnHandle handle, cudnnFusedOpsPlan plan, cudnnFusedOpsVariantParamPack varPack)
public static int cudnnCnnTrainVersionCheck()
public static int cudnnBackendCreateDescriptor(int descriptorType, cudnnBackendDescriptor descriptor)
public static int cudnnBackendDestroyDescriptor(cudnnBackendDescriptor descriptor)
public static int cudnnBackendInitialize(cudnnBackendDescriptor descriptor)
public static int cudnnBackendFinalize(cudnnBackendDescriptor descriptor)
public static int cudnnBackendSetAttribute(cudnnBackendDescriptor descriptor, int attributeName, int attributeType, long elementCount, Pointer arrayOfElements)
public static int cudnnBackendGetAttribute(cudnnBackendDescriptor descriptor, int attributeName, int attributeType, long requestedElementCount, long[] elementCount, Pointer arrayOfElements)
public static int cudnnBackendExecute(cudnnHandle handle, cudnnBackendDescriptor executionPlan, cudnnBackendDescriptor variantPack)
Copyright © 2020. All rights reserved.