Package | Description |
---|---|
org.bytedeco.cuda.cublas | |
org.bytedeco.cuda.global | |
Modifier and Type | Method and Description |
---|---|
cublasLtMatrixLayoutOpaque_t | cublasLtMatrixLayoutOpaque_t.data(int i, long setter) |
cublasLtMatrixLayoutOpaque_t | cublasLtMatrixLayoutOpaque_t.getPointer(long i) |
cublasLtMatrixLayoutOpaque_t | cublasLtMatrixLayoutOpaque_t.position(long position) |
Modifier and Type | Method and Description |
---|---|
static int |
cublas.cublasLtMatmul(cublasLtContext lightHandle,
cublasLtMatmulDescOpaque_t computeDesc,
Pointer alpha,
Pointer A,
cublasLtMatrixLayoutOpaque_t Adesc,
Pointer B,
cublasLtMatrixLayoutOpaque_t Bdesc,
Pointer beta,
Pointer C,
cublasLtMatrixLayoutOpaque_t Cdesc,
Pointer D,
cublasLtMatrixLayoutOpaque_t Ddesc,
cublasLtMatmulAlgo_t algo,
Pointer workspace,
long workspaceSizeInBytes,
CUstream_st stream)
Execute matrix multiplication (D = alpha * op(A) * op(B) + beta * C).
|
static int |
cublas.cublasLtMatmulAlgoCheck(cublasLtContext lightHandle,
cublasLtMatmulDescOpaque_t operationDesc,
cublasLtMatrixLayoutOpaque_t Adesc,
cublasLtMatrixLayoutOpaque_t Bdesc,
cublasLtMatrixLayoutOpaque_t Cdesc,
cublasLtMatrixLayoutOpaque_t Ddesc,
cublasLtMatmulAlgo_t algo,
cublasLtMatmulHeuristicResult_t result)
Check configured algo descriptor for correctness and support on current device.
|
static int |
cublas.cublasLtMatmulAlgoGetHeuristic(cublasLtContext lightHandle,
cublasLtMatmulDescOpaque_t operationDesc,
cublasLtMatrixLayoutOpaque_t Adesc,
cublasLtMatrixLayoutOpaque_t Bdesc,
cublasLtMatrixLayoutOpaque_t Cdesc,
cublasLtMatrixLayoutOpaque_t Ddesc,
cublasLtMatmulPreferenceOpaque_t preference,
int requestedAlgoCount,
cublasLtMatmulHeuristicResult_t heuristicResultsArray,
int[] returnAlgoCount) |
static int |
cublas.cublasLtMatmulAlgoGetHeuristic(cublasLtContext lightHandle,
cublasLtMatmulDescOpaque_t operationDesc,
cublasLtMatrixLayoutOpaque_t Adesc,
cublasLtMatrixLayoutOpaque_t Bdesc,
cublasLtMatrixLayoutOpaque_t Cdesc,
cublasLtMatrixLayoutOpaque_t Ddesc,
cublasLtMatmulPreferenceOpaque_t preference,
int requestedAlgoCount,
cublasLtMatmulHeuristicResult_t heuristicResultsArray,
IntBuffer returnAlgoCount) |
static int |
cublas.cublasLtMatmulAlgoGetHeuristic(cublasLtContext lightHandle,
cublasLtMatmulDescOpaque_t operationDesc,
cublasLtMatrixLayoutOpaque_t Adesc,
cublasLtMatrixLayoutOpaque_t Bdesc,
cublasLtMatrixLayoutOpaque_t Cdesc,
cublasLtMatrixLayoutOpaque_t Ddesc,
cublasLtMatmulPreferenceOpaque_t preference,
int requestedAlgoCount,
cublasLtMatmulHeuristicResult_t heuristicResultsArray,
IntPointer returnAlgoCount)
Query cublasLt heuristic for algorithm appropriate for given use case.
|
static int |
cublas.cublasLtMatrixLayoutDestroy(cublasLtMatrixLayoutOpaque_t matLayout)
Destroy matrix layout descriptor.
|
static int |
cublas.cublasLtMatrixLayoutGetAttribute(cublasLtMatrixLayoutOpaque_t matLayout,
int attr,
Pointer buf,
long sizeInBytes,
SizeTPointer sizeWritten)
Get matrix layout descriptor attribute.
|
static int |
cublas.cublasLtMatrixLayoutInit_internal(cublasLtMatrixLayoutOpaque_t matLayout,
long size,
int type,
long rows,
long cols,
long ld)
Internal.
|
static int |
cublas.cublasLtMatrixLayoutInit(cublasLtMatrixLayoutOpaque_t matLayout,
int type,
long rows,
long cols,
long ld)
Initialize matrix layout descriptor in pre-allocated space.
|
static int |
cublas.cublasLtMatrixLayoutSetAttribute(cublasLtMatrixLayoutOpaque_t matLayout,
int attr,
Pointer buf,
long sizeInBytes)
Set matrix layout descriptor attribute.
|
static int |
cublas.cublasLtMatrixTransform(cublasLtContext lightHandle,
cublasLtMatrixTransformDescOpaque_t transformDesc,
Pointer alpha,
Pointer A,
cublasLtMatrixLayoutOpaque_t Adesc,
Pointer beta,
Pointer B,
cublasLtMatrixLayoutOpaque_t Bdesc,
Pointer C,
cublasLtMatrixLayoutOpaque_t Cdesc,
CUstream_st stream)
Matrix layout conversion helper (C = alpha * op(A) + beta * op(B)).
Can be used to change memory order of data or to scale and shift the values.
|
Copyright © 2024. All rights reserved.