Sparse Generic Functions

Sparse Generic Functions#

This module holds all sparse generic routines.

The sparse generic routines describe operations that manipulate sparse matrices.

hipsparseAxpby()#

hipsparseStatus_t hipsparseAxpby(hipsparseHandle_t handle, const void *alpha, hipsparseConstSpVecDescr_t vecX, const void *beta, hipsparseDnVecDescr_t vecY)#

Scale a sparse vector and add it to a scaled dense vector.

hipsparseAxpby multiplies the sparse vector $x$ with scalar $α$ and adds the result to the dense vector $y$ that is multiplied with scalar $β$ , such that

y := α \cdot x + β \cdot y

for(i = 0; i < size; ++i)
{
    y[i] = beta * y[i]
}
for(i = 0; i < nnz; ++i)
{
    y[xInd[i]] += alpha * xVal[i]
}

Example

// Number of non-zeros of the sparse vector
int nnz = 3;

// Size of sparse and dense vector
int size = 9;

// Sparse index vector
std::vector<int> hxInd = {0, 3, 5};

// Sparse value vector
std::vector<float> hxVal = {1.0f, 2.0f, 3.0f};

// Dense vector
std::vector<float> hy = {1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f, 9.0f};

// Scalar alpha
float alpha = 3.7f;

// Scalar beta
float beta = 1.2f;

// Offload data to device
int* dxInd;
float* dxVal;
float* dy;
hipMalloc((void**)&dxInd, sizeof(int) * nnz);
hipMalloc((void**)&dxVal, sizeof(float) * nnz);
hipMalloc((void**)&dy, sizeof(float) * size);

hipMemcpy(dxInd, hxInd.data(), sizeof(int) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dxVal, hxVal.data(), sizeof(float) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dy, hy.data(), sizeof(float) * size, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

// Create sparse vector X
hipsparseSpVecDescr_t vecX;
hipsparseCreateSpVec(&vecX,
                    size,
                    nnz,
                    dxInd,
                    dxVal,
                    HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO,
                    HIP_R_32F);

// Create dense vector Y
hipsparseDnVecDescr_t vecY;
hipsparseCreateDnVec(&vecY, size, dy, HIP_R_32F);

// Call axpby to perform y = beta * y + alpha * x
hipsparseAxpby(handle, &alpha, vecX, &beta, vecY);

hipsparseDnVecGetValues(vecY, (void**)&dy);

// Copy result back to host
hipMemcpy(hy.data(), dy, sizeof(float) * size, hipMemcpyDeviceToHost);


// Clear hipSPARSE
hipsparseDestroySpVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

// Clear device memory
hipFree(dxInd);
hipFree(dxVal);
hipFree(dy);

Parameters:

handle – [in] handle to the hipsparse library context queue.
alpha – [in] scalar $α$ .
vecX – [in] sparse matrix descriptor.
beta – [in] scalar $β$ .
vecY – [inout] dense matrix descriptor.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, vecX, beta or vecY pointer is invalid.

hipsparseGather()#

hipsparseStatus_t hipsparseGather(hipsparseHandle_t handle, hipsparseConstDnVecDescr_t vecY, hipsparseSpVecDescr_t vecX)#

Gather elements from a dense vector and store them into a sparse vector.

hipsparseGather gathers the elements from the dense vector $y$ and stores them in the sparse vector $x$ .

for(i = 0; i < nnz; ++i)
{
    xVal[i] = y[xInd[i]];
}

Example

// Number of non-zeros of the sparse vector
int nnz = 3;

// Size of sparse and dense vector
int size = 9;

// Sparse index vector
std::vector<int> hxInd = {0, 3, 5};

// Dense vector
std::vector<float> hy = {1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f, 9.0f};

// Offload data to device
int* dxInd;
float* dxVal;
float* dy;
hipMalloc((void**)&dxInd, sizeof(int) * nnz);
hipMalloc((void**)&dxVal, sizeof(float) * nnz);
hipMalloc((void**)&dy, sizeof(float) * size);

hipMemcpy(dxInd, hxInd.data(), sizeof(int) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dy, hy.data(), sizeof(float) * size, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

// Create sparse vector X
hipsparseSpVecDescr_t vecX;
hipsparseCreateSpVec(&vecX,
                     size,
                     nnz,
                     dxInd,
                     dxVal,
                     HIPSPARSE_INDEX_32I,
                     HIPSPARSE_INDEX_BASE_ZERO,
                     HIP_R_32F);

// Create dense vector Y
hipsparseDnVecDescr_t vecY;
hipsparseCreateDnVec(&vecY, size, dy, HIP_R_32F);

// Perform gather
hipsparseGather(handle, vecY, vecX);

hipsparseSpVecGetValues(vecX, (void**)&dxVal);

// Copy result back to host
std::vector<float> hxVal(nnz, 0.0f);
hipMemcpy(hxVal.data(), dxVal, sizeof(float) * nnz, hipMemcpyDeviceToHost);

// Clear hipSPARSE
hipsparseDestroySpVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

// Clear device memory
hipFree(dxInd);
hipFree(dxVal);
hipFree(dy);

Parameters:

handle – [in] handle to the hipsparse library context queue.
vecY – [in] dense vector descriptor $y$ .
vecX – [out] sparse vector descriptor $x$ .

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, vecX or vecY pointer is invalid.

hipsparseScatter()#

hipsparseStatus_t hipsparseScatter(hipsparseHandle_t handle, hipsparseConstSpVecDescr_t vecX, hipsparseDnVecDescr_t vecY)#

Scatter elements from a sparse vector into a dense vector.

hipsparseScatter scatters the elements from the sparse vector $x$ in the dense vector $y$ .

for(i = 0; i < nnz; ++i)
{
    y[xInd[i]] = xVal[i];
}

Example

// Number of non-zeros of the sparse vector
int nnz = 3;

// Size of sparse and dense vector
int size = 9;

// Sparse index vector
std::vector<int> hxInd = {0, 3, 5};

// Sparse value vector
std::vector<float> hxVal = {1.0f, 2.0f, 3.0f};

// Dense vector
std::vector<float> hy = {1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f, 9.0f};

// Offload data to device
int* dxInd;
float* dxVal;
float* dy;
hipMalloc((void**)&dxInd, sizeof(int) * nnz);
hipMalloc((void**)&dxVal, sizeof(float) * nnz);
hipMalloc((void**)&dy, sizeof(float) * size);

hipMemcpy(dxInd, hxInd.data(), sizeof(int) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dxVal, hxVal.data(), sizeof(float) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dy, hy.data(), sizeof(float) * size, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

// Create sparse vector X
hipsparseSpVecDescr_t vecX;
hipsparseCreateSpVec(&vecX,
                            size,
                            nnz,
                            dxInd,
                            dxVal,
                            HIPSPARSE_INDEX_32I,
                            HIPSPARSE_INDEX_BASE_ZERO,
                            HIP_R_32F);

// Create dense vector Y
hipsparseDnVecDescr_t vecY;
hipsparseCreateDnVec(&vecY, size, dy, HIP_R_32F);

// Perform scatter
hipsparseScatter(handle, vecX, vecY);

hipsparseDnVecGetValues(vecY, (void**)&dy);

// Copy result back to host
hipMemcpy(hy.data(), dy, sizeof(float) * size, hipMemcpyDeviceToHost);

// Clear hipSPARSE
hipsparseDestroySpVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

// Clear device memory
hipFree(dxInd);
hipFree(dxVal);
hipFree(dy);

Parameters:

handle – [in] handle to the hipsparse library context queue.
vecX – [in] sparse vector descriptor $x$ .
vecY – [out] dense vector descriptor $y$ .

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, vecX or vecY pointer is invalid.

hipsparseRot()#

hipsparseStatus_t hipsparseRot(hipsparseHandle_t handle, const void *c_coeff, const void *s_coeff, hipsparseSpVecDescr_t vecX, hipsparseDnVecDescr_t vecY)#

Apply Givens rotation to a dense and a sparse vector.

hipsparseRot applies the Givens rotation matrix $G$ to the sparse vector $x$ and the dense vector $y$ , where

\begin{array}{r} G = (\begin{array}{c} c & s \\ - s & c \end{array}) \end{array}

for(i = 0; i < nnz; ++i)
{
    x_tmp = xVal[i];
    y_tmp = y[xInd[i]];

    xVal[i]    = c * x_tmp + s * y_tmp;
    y[xInd[i]] = c * y_tmp - s * x_tmp;
}

Example

// Number of non-zeros of the sparse vector
int nnz = 3;

// Size of sparse and dense vector
int size = 9;

// Sparse index vector
std::vector<int> hxInd = {0, 3, 5};

// Sparse value vector
std::vector<float> hxVal = {1.0f, 2.0f, 3.0f};

// Dense vector
std::vector<float> hy = {1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f, 9.0f};

// Scalar c
float c = 3.7f;

// Scalar s
float s = 1.2f;

// Offload data to device
int* dxInd;
float* dxVal;
float* dy;
hipMalloc((void**)&dxInd, sizeof(int) * nnz);
hipMalloc((void**)&dxVal, sizeof(float) * nnz);
hipMalloc((void**)&dy, sizeof(float) * size);

hipMemcpy(dxInd, hxInd.data(), sizeof(int) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dxVal, hxVal.data(), sizeof(float) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dy, hy.data(), sizeof(float) * size, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

// Create sparse vector X
hipsparseSpVecDescr_t vecX;
hipsparseCreateSpVec(&vecX,
                            size,
                            nnz,
                            dxInd,
                            dxVal,
                            HIPSPARSE_INDEX_32I,
                            HIPSPARSE_INDEX_BASE_ZERO,
                            HIP_R_32F);

// Create dense vector Y
hipsparseDnVecDescr_t vecY;
hipsparseCreateDnVec(&vecY, size, dy, HIP_R_32F);

// Call rot
hipsparseRot(handle, (void*)&c, (void*)&s, vecX, vecY);

hipsparseSpVecGetValues(vecX, (void**)&dxVal);
hipsparseDnVecGetValues(vecY, (void**)&dy);

// Copy result back to host
hipMemcpy(hxVal.data(), dxVal, sizeof(float) * nnz, hipMemcpyDeviceToHost);
hipMemcpy(hy.data(), dy, sizeof(float) * size, hipMemcpyDeviceToHost);

// Clear hipSPARSE
hipsparseDestroySpVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

// Clear device memory
hipFree(dxInd);
hipFree(dxVal);
hipFree(dy);

Parameters:

handle – [in] handle to the hipsparse library context queue.
c_coeff – [in] pointer to the cosine element of $G$ , can be on host or device.
s_coeff – [in] pointer to the sine element of $G$ , can be on host or device.
vecX – [inout] sparse vector descriptor $x$ .
vecY – [inout] dense vector descriptor $y$ .

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, c_coeff, s_coeff, vecX or vecY pointer is invalid.

hipsparseSparseToDense_bufferSize()#

hipsparseStatus_t hipsparseSparseToDense_bufferSize(hipsparseHandle_t handle, hipsparseConstSpMatDescr_t matA, hipsparseDnMatDescr_t matB, hipsparseSparseToDenseAlg_t alg, size_t *pBufferSizeInBytes)#

Sparse matrix to dense matrix conversion.

hipsparseSparseToDense_bufferSize computes the required user allocated buffer size needed when converting a sparse matrix to a dense matrix.

Parameters:

handle – [in] handle to the hipsparse library context queue.
matA – [in] sparse matrix descriptor.
matB – [in] dense matrix descriptor.
alg – [in] algorithm for the sparse to dense computation.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, or pBufferSizeInBytes pointer is invalid.

hipsparseSparseToDense()#

hipsparseStatus_t hipsparseSparseToDense(hipsparseHandle_t handle, hipsparseConstSpMatDescr_t matA, hipsparseDnMatDescr_t matB, hipsparseSparseToDenseAlg_t alg, void *externalBuffer)#

Sparse matrix to dense matrix conversion.

hipsparseSparseToDense converts a sparse matrix to a dense matrix. This routine takes a user allocated buffer whose size must first be computed by calling hipsparseSparseToDense_bufferSize

Parameters:

handle – [in] handle to the hipsparse library context queue.
matA – [in] sparse matrix descriptor.
matB – [in] dense matrix descriptor.
alg – [in] algorithm for the sparse to dense computation.
externalBuffer – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, or externalBuffer pointer is invalid.

hipsparseDenseToSparse_bufferSize()#

hipsparseStatus_t hipsparseDenseToSparse_bufferSize(hipsparseHandle_t handle, hipsparseConstDnMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseDenseToSparseAlg_t alg, size_t *pBufferSizeInBytes)#

Dense matrix to sparse matrix conversion.

hipsparseDenseToSparse_bufferSize computes the required user allocated buffer size needed when converting a dense matrix to a sparse matrix.

Parameters:

handle – [in] handle to the hipsparse library context queue.
matA – [in] dense matrix descriptor.
matB – [in] sparse matrix descriptor.
alg – [in] algorithm for the dense to sparse computation.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, or pBufferSizeInBytes pointer is invalid.

hipsparseDenseToSparse_analysis()#

hipsparseStatus_t hipsparseDenseToSparse_analysis(hipsparseHandle_t handle, hipsparseConstDnMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseDenseToSparseAlg_t alg, void *externalBuffer)#

Dense matrix to sparse matrix conversion.

hipsparseDenseToSparse_analysis performs analysis that is later used in hipsparseDenseToSparse_convert when converting a dense matrix to sparse matrix. This routine takes a user allocated buffer whose size must first be computed using hipsparseDenseToSparse_bufferSize.

Parameters:

handle – [in] handle to the hipsparse library context queue.
matA – [in] dense matrix descriptor.
matB – [in] sparse matrix descriptor.
alg – [in] algorithm for the dense to sparse computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, or externalBuffer pointer is invalid.

hipsparseDenseToSparse_convert()#

hipsparseStatus_t hipsparseDenseToSparse_convert(hipsparseHandle_t handle, hipsparseConstDnMatDescr_t matA, hipsparseSpMatDescr_t matB, hipsparseDenseToSparseAlg_t alg, void *externalBuffer)#

Dense matrix to sparse matrix conversion.

hipsparseDenseToSparse_convert converts a dense matrix to a sparse matrix. This routine requires a user allocated buffer whose size must be determined by first calling hipsparseDenseToSparse_bufferSize.

Parameters:

handle – [in] handle to the hipsparse library context queue.
matA – [in] dense matrix descriptor.
matB – [in] sparse matrix descriptor.
alg – [in] algorithm for the dense to sparse computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, or externalBuffer pointer is invalid.

hipsparseSpVV_bufferSize()#

hipsparseStatus_t hipsparseSpVV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opX, hipsparseConstSpVecDescr_t vecX, hipsparseConstDnVecDescr_t vecY, void *result, hipDataType computeType, size_t *pBufferSizeInBytes)#

Compute the inner dot product of a sparse vector with a dense vector.

hipsparseSpVV_bufferSize computes the required user allocated buffer size needed when computing the inner dot product of a sparse vector with a dense vector

See hipsparseSpVV for full code example.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opX – [in] sparse vector operation type.
vecX – [in] sparse vector descriptor.
vecY – [in] dense vector descriptor.
result – [out] pointer to the result, can be host or device memory
computeType – [in] floating point precision for the SpVV computation.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, vecX, vecY, result or pBufferSizeInBytes pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – computeType is currently not supported.

hipsparseSpVV()#

hipsparseStatus_t hipsparseSpVV(hipsparseHandle_t handle, hipsparseOperation_t opX, hipsparseConstSpVecDescr_t vecX, hipsparseConstDnVecDescr_t vecY, void *result, hipDataType computeType, void *externalBuffer)#

Compute the inner dot product of a sparse vector with a dense vector.

hipsparseSpVV computes the inner dot product of a sparse vector with a dense vector. This routine takes a user allocated buffer whose size must first be computed by calling hipsparseSpVV_bufferSize

Example

// Number of non-zeros of the sparse vector
int nnz = 3;

// Size of sparse and dense vector
int size = 9;

// Sparse index vector
std::vector<int> hxInd = {0, 3, 5};

// Sparse value vector
std::vector<float> hxVal = {1.0f, 2.0f, 3.0f};

// Dense vector
std::vector<float> hy = {1.0f, 2.0f, 3.0f, 4.0f, 5.0f, 6.0f, 7.0f, 8.0f, 9.0f};

// Offload data to device
int* dxInd;
float* dxVal;
float* dy;
hipMalloc((void**)&dxInd, sizeof(int) * nnz);
hipMalloc((void**)&dxVal, sizeof(float) * nnz);
hipMalloc((void**)&dy, sizeof(float) * size);

hipMemcpy(dxInd, hxInd.data(), sizeof(int) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dxVal, hxVal.data(), sizeof(float) * nnz, hipMemcpyHostToDevice);
hipMemcpy(dy, hy.data(), sizeof(float) * size, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

// Create sparse vector X
hipsparseSpVecDescr_t vecX;
hipsparseCreateSpVec(&vecX,
                    size,
                    nnz,
                    dxInd,
                    dxVal,
                    HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO,
                    HIP_R_32F);

// Create dense vector Y
hipsparseDnVecDescr_t vecY;
hipsparseCreateDnVec(&vecY, size, dy, HIP_R_32F);

// Obtain buffer size
float hresult = 0.0f;
size_t buffer_size;
hipsparseSpVV_bufferSize(handle,
            HIPSPARSE_OPERATION_NON_TRANSPOSE,
            vecX,
            vecY,
            &hresult,
            HIP_R_32F,
            &buffer_size);

void* temp_buffer;
hipMalloc(&temp_buffer, buffer_size);

// SpVV
hipsparseSpVV(handle,
            HIPSPARSE_OPERATION_NON_TRANSPOSE,
            vecX,
            vecY,
            &hresult,
            HIP_R_32F,
            temp_buffer);

hipDeviceSynchronize();

std::cout << "hresult: " << hresult << std::endl;

// Clear hipSPARSE
hipsparseDestroySpVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

// Clear device memory
hipFree(dxInd);
hipFree(dxVal);
hipFree(dy);
hipFree(temp_buffer);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opX – [in] sparse vector operation type.
vecX – [in] sparse vector descriptor.
vecY – [in] dense vector descriptor.
result – [out] pointer to the result, can be host or device memory
computeType – [in] floating point precision for the SpVV computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, vecX, vecY, result or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – computeType is currently not supported.

hipsparseSpMV_bufferSize()#

hipsparseStatus_t hipsparseSpMV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t vecX, const void *beta, const hipsparseDnVecDescr_t vecY, hipDataType computeType, hipsparseSpMVAlg_t alg, size_t *pBufferSizeInBytes)#

Buffer size step of the sparse matrix multiplication with a dense vector.

hipsparseSpMV_bufferSize computes the required user allocated buffer size needed when computing the sparse matrix multiplication with a dense vector:

y := α \cdot o p (A) \cdot x + β \cdot y,

where

o p (A)

is a sparse

m \times n

matrix in CSR format,

x

is a dense vector of length

n

and

y

is a dense vector of length

m

.

hipsparseSpMV_bufferSize supports multiple combinations of data types and compute types. See hipsparseSpMV for a complete listing of all the data type and compute type combinations available.

See hipsparseSpMV for full code example.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
vecX – [in] vector descriptor.
beta – [in] scalar $β$ .
vecY – [inout] vector descriptor.
computeType – [in] floating point precision for the SpMV computation.
alg – [in] SpMV algorithm for the SpMV computation.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, beta, y or pBufferSizeInBytes pointer is invalid or if opA, computeType, alg is incorrect.
HIPSPARSE_STATUS_NOT_SUPPORTED – computeType or alg is currently not supported.

hipsparseSpMV_preprocess()#

hipsparseStatus_t hipsparseSpMV_preprocess(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t vecX, const void *beta, const hipsparseDnVecDescr_t vecY, hipDataType computeType, hipsparseSpMVAlg_t alg, void *externalBuffer)#

Preprocess step of the sparse matrix multiplication with a dense vector (optional)

hipsparseSpMV_preprocess performs analysis on the sparse matrix $A$ when computing the sparse matrix multiplication with a dense vector:

y := α \cdot o p (A) \cdot x + β \cdot y,

where

o p (A)

is a sparse

m \times n

matrix in CSR format,

x

is a dense vector of length

n

and

y

is a dense vector of length

m

.

This step is optional but if used may results in better performance.

hipsparseSpMV_preprocess supports multiple combinations of data types and compute types. See hipsparseSpMV for a complete listing of all the data type and compute type combinations available.

See hipsparseSpMV for full code example.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
vecX – [in] vector descriptor.
beta – [in] scalar $β$ .
vecY – [inout] vector descriptor.
computeType – [in] floating point precision for the SpMV computation.
alg – [in] SpMV algorithm for the SpMV computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, beta, y or externalBuffer pointer is invalid or if opA, computeType, alg is incorrect.
HIPSPARSE_STATUS_NOT_SUPPORTED – computeType or alg is currently not supported.

hipsparseSpMV()#

hipsparseStatus_t hipsparseSpMV(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t vecX, const void *beta, const hipsparseDnVecDescr_t vecY, hipDataType computeType, hipsparseSpMVAlg_t alg, void *externalBuffer)#

Compute the sparse matrix multiplication with a dense vector.

hipsparseSpMV computes sparse matrix multiplication with a dense vector:

y := α \cdot o p (A) \cdot x + β \cdot y,

where

o p (A)

is a sparse

m \times n

matrix in CSR format,

x

is a dense vector of length

n

and

y

is a dense vector of length

m

.

hipsparseSpMV supports multiple combinations of data types and compute types. The tables below indicate the currently supported different data types that can be used for for the sparse matrix A and the dense vectors X and Y and the compute type for $α$ and $β$ . The advantage of using different data types is to save on memory bandwidth and storage when a user application allows while performing the actual computation in a higher precision.

Uniform Precisions:

A / X / Y / compute_type
HIP_R_32F
HIP_R_64F
HIP_C_32F
HIP_C_64F

Mixed precisions:

A / X	Y	compute_type
HIP_R_8I	HIP_R_32I	HIP_R_32I
HIP_R_8I	HIP_R_32F	HIP_R_32F

Mixed-regular real precisions

A	X / Y / compute_type
HIP_R_32F	HIP_R_64F
HIP_C_32F	HIP_C_64F

Mixed-regular Complex precisions

A	X / Y / compute_type
HIP_R_32F	HIP_C_32F
HIP_R_64F	HIP_C_64F

Example

// A, x, and y are m×k, k×1, and m×1
int m = 3, k = 4;
int nnz_A = 8;
hipsparseOperation_t transA = HIPSPARSE_OPERATION_NON_TRANSPOSE;

// alpha and beta
float alpha = 0.5f;
float beta  = 0.25f;

std::vector<int> hcsrRowPtr = {0, 3, 5, 8};
std::vector<int> hcsrColInd = {0, 1, 3, 1, 2, 0, 2, 3}; 
std::vector<float> hcsrVal     = {1, 2, 3, 4, 5, 6, 7, 8}; 

std::vector<float> hx(k, 1.0f);
std::vector<float> hy(m, 1.0f);

int *dcsrRowPtr;
int *dcsrColInd;
float *dcsrVal;
hipMalloc((void**)&dcsrRowPtr, sizeof(int) * (m + 1));
hipMalloc((void**)&dcsrColInd, sizeof(int) * nnz_A);
hipMalloc((void**)&dcsrVal, sizeof(float) * nnz_A);

hipMemcpy(dcsrRowPtr, hcsrRowPtr.data(), sizeof(int) * (m + 1), hipMemcpyHostToDevice);
hipMemcpy(dcsrColInd, hcsrColInd.data(), sizeof(int) * nnz_A, hipMemcpyHostToDevice);
hipMemcpy(dcsrVal, hcsrVal.data(), sizeof(float) * nnz_A, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

hipsparseSpMatDescr_t matA;
hipsparseCreateCsr(&matA, m, k, nnz_A,
                    dcsrRowPtr, dcsrColInd, dcsrVal,
                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);

// Allocate memory for the vector x
float* dx;
hipMalloc((void**)&dx, sizeof(float) * k);
hipMemcpy(dx, hx.data(), sizeof(float) * k, hipMemcpyHostToDevice);

hipsparseDnVecDescr_t vecX;
hipsparseCreateDnVec(&vecX, k, dx, HIP_R_32F);

// Allocate memory for the resulting vector y
float* dy;
hipMalloc((void**)&dy, sizeof(float) * m);
hipMemcpy(dy, hy.data(), sizeof(float) * m, hipMemcpyHostToDevice);

hipsparseDnMatDescr_t vecY;
hipsparseCreateDnVec(&vecY, m, dy, HIP_R_32F);

// Compute buffersize
size_t bufferSize;
hipsparseSpMV_bufferSize(handle,
                         transA,
                         &alpha,
                         matA,
                         vecX,
                         &beta,
                         vecY,
                         HIP_R_32F,
                         HIPSPARSE_MV_ALG_DEFAULT,
                         &bufferSize);

void* buffer;
hipMalloc(&buffer, bufferSize);

// Preprocess operation (Optional)
hipsparseSpMV_preprocess(handle,
                        transA,
                        &alpha,
                        matA,
                        vecX,
                        &beta,
                        vecY,
                        HIP_R_32F,
                        HIPSPARSE_MV_ALG_DEFAULT,
                        &buffer);

// Perform operation
hipsparseSpMV(handle,
             transA,
             &alpha,
             matA,
             vecX,
             &beta,
             vecY,
             HIP_R_32F,
             HIPSPARSE_MV_ALG_DEFAULT,
             &buffer);

// Copy device to host
hipMemcpy(hy.data(), dy, sizeof(float) * m, hipMemcpyDeviceToHost);

// Destroy matrix descriptors and handles
hipsparseDestroySpMat(matA);
hipsparseDestroyDnVec(vecX);
hipsparseDestroyDnVec(vecY);
hipsparseDestroy(handle);

hipFree(buffer);
hipFree(dcsrRowPtr);
hipFree(dcsrColInd);
hipFree(dcsrVal);
hipFree(dx);
hipFree(dy);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
vecX – [in] vector descriptor.
beta – [in] scalar $β$ .
vecY – [inout] vector descriptor.
computeType – [in] floating point precision for the SpMV computation.
alg – [in] SpMV algorithm for the SpMV computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, beta, y or externalBuffer pointer is invalid or if opA, computeType, alg is incorrect.
HIPSPARSE_STATUS_NOT_SUPPORTED – computeType or alg is currently not supported.

hipsparseSpMM_bufferSize()#

hipsparseStatus_t hipsparseSpMM_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const void *beta, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpMMAlg_t alg, size_t *pBufferSizeInBytes)#

Calculate the buffer size required for the sparse matrix multiplication with a dense matrix.

hipsparseSpMM_bufferSize computes the required user allocated buffer size needed when computing the sparse matrix multiplication with a dense matrix:

C := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

o p (A)

is a sparse

m \times k

matrix in CSR format,

B

is a dense matrix of size

k \times n

and

C

is a dense matrix of size

m \times n

.

hipsparseSpMM_bufferSize supports multiple combinations of data types and compute types. See hipsparseSpMM for a complete listing of all the data type and compute type combinations available.

See hipsparseSpMM for full code example.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
opB – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
matB – [in] matrix descriptor.
beta – [in] scalar $β$ .
matC – [in] matrix descriptor.
computeType – [in] floating point precision for the SpMM computation.
alg – [in] SpMM algorithm for the SpMM computation.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, beta, or pBufferSizeInBytes pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

hipsparseSpMM_preprocess()#

hipsparseStatus_t hipsparseSpMM_preprocess(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const void *beta, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpMMAlg_t alg, void *externalBuffer)#

Preprocess step of the sparse matrix multiplication with a dense matrix.

hipsparseSpMM_preprocess performs the required preprocessing used when computing the sparse matrix multiplication with a dense matrix:

C := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

o p (A)

is a sparse

m \times k

matrix in CSR format,

B

is a dense matrix of size

k \times n

and

C

is a dense matrix of size

m \times n

.

hipsparseSpMM_preprocess supports multiple combinations of data types and compute types. See hipsparseSpMM for a complete listing of all the data type and compute type combinations available.

See hipsparseSpMM for full code example.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
opB – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
matB – [in] matrix descriptor.
beta – [in] scalar $β$ .
matC – [in] matrix descriptor.
computeType – [in] floating point precision for the SpMM computation.
alg – [in] SpMM algorithm for the SpMM computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, beta, or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

hipsparseSpMM()#

hipsparseStatus_t hipsparseSpMM(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const void *beta, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpMMAlg_t alg, void *externalBuffer)#

Compute the sparse matrix multiplication with a dense matrix.

hipsparseSpMM computes sparse matrix multiplication with a dense matrix:

C := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

o p (A)

is a sparse

m \times k

matrix in CSR format,

B

is a dense matrix of size

k \times n

and

C

is a dense matrix of size

m \times n

.

hipsparseSpMM supports multiple combinations of data types and compute types. The tables below indicate the currently supported different data types that can be used for for the sparse matrix A and the dense matrices B and C and the compute type for $α$ and $β$ . The advantage of using different data types is to save on memory bandwidth and storage when a user application allows while performing the actual computation in a higher precision.

Uniform Precisions:

A / B / C / compute_type
HIP_R_32F
HIP_R_64F
HIP_C_32F
HIP_C_64F

Mixed precisions:

A / B	C	compute_type
HIP_R_8I	HIP_R_32I	HIP_R_32I
HIP_R_8I	HIP_R_32F	HIP_R_32F

Example

// A, B, and C are m×k, k×n, and m×n
int m = 3, n = 5, k = 4;
int ldb = n, ldc = n;
int nnz_A = 8, nnz_B = 20, nnz_C = 15;
hipsparseOperation_t transA = HIPSPARSE_OPERATION_NON_TRANSPOSE;
hipsparseOperation_t transB = HIPSPARSE_OPERATION_NON_TRANSPOSE;
hipsparseOperation_t transC = HIPSPARSE_OPERATION_NON_TRANSPOSE;
hipsparseOrder_t order = HIPSPARSE_ORDER_ROW;

// alpha and beta
float alpha = 0.5f;
float beta  = 0.25f;

std::vector<int> hcsrRowPtr = {0, 3, 5, 8};
std::vector<int> hcsrColInd = {0, 1, 3, 1, 2, 0, 2, 3}; 
std::vector<float> hcsrVal     = {1, 2, 3, 4, 5, 6, 7, 8}; 

std::vector<float> hB(nnz_B, 1.0f);
std::vector<float> hC(nnz_C, 1.0f);

int *dcsrRowPtr;
int *dcsrColInd;
float *dcsrVal;
hipMalloc((void**)&dcsrRowPtr, sizeof(int) * (m + 1));
hipMalloc((void**)&dcsrColInd, sizeof(int) * nnz_A);
hipMalloc((void**)&dcsrVal, sizeof(float) * nnz_A);

hipMemcpy(dcsrRowPtr, hcsrRowPtr.data(), sizeof(int) * (m + 1), hipMemcpyHostToDevice);
hipMemcpy(dcsrColInd, hcsrColInd.data(), sizeof(int) * nnz_A, hipMemcpyHostToDevice);
hipMemcpy(dcsrVal, hcsrVal.data(), sizeof(float) * nnz_A, hipMemcpyHostToDevice);

hipsparseHandle_t handle;
hipsparseCreate(&handle);

hipsparseSpMatDescr_t matA;
hipsparseCreateCsr(&matA, m, k, nnz_A,
                    dcsrRowPtr, dcsrColInd, dcsrVal,
                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);

// Allocate memory for the matrix B
float* dB;
hipMalloc((void**)&dB, sizeof(float) * nnz_B);
hipMemcpy(dB, hB.data(), sizeof(float) * nnz_B, hipMemcpyHostToDevice);

hipsparseDnMatDescr_t matB;
hipsparseCreateDnMat(&matB, k, n, ldb, dB, HIP_R_32F, order);

// Allocate memory for the resulting matrix C
float* dC;
hipMalloc((void**)&dC, sizeof(float) * nnz_C);
hipMemcpy(dC, hC.data(), sizeof(float) * nnz_C, hipMemcpyHostToDevice);

hipsparseDnMatDescr_t matC;
hipsparseCreateDnMat(&matC, m, n, ldc, dC, HIP_R_32F, HIPSPARSE_ORDER_ROW);

// Compute buffersize
size_t bufferSize;
hipsparseSpMM_bufferSize(handle,
                         transA,
                         transB,
                         &alpha,
                         matA,
                         matB,
                         &beta,
                         matC,
                         HIP_R_32F,
                         HIPSPARSE_MM_ALG_DEFAULT,
                         &bufferSize);

void* buffer;
hipMalloc(&buffer, bufferSize);

// Preprocess operation (Optional)
hipsparseSpMM_preprocess(handle,
                        transA,
                        transB,
                        &alpha,
                        matA,
                        matB,
                        &beta,
                        matC,
                        HIP_R_32F,
                        HIPSPARSE_MM_ALG_DEFAULT,
                        &buffer);

// Perform operation
hipsparseSpMM(handle,
             transA,
             transB,
             &alpha,
             matA,
             matB,
             &beta,
             matC,
             HIP_R_32F,
             HIPSPARSE_MM_ALG_DEFAULT,
             &buffer);

// Copy device to host
hipMemcpy(hC.data(), dC, sizeof(float) * nnz_C, hipMemcpyDeviceToHost);

// Destroy matrix descriptors and handles
hipsparseDestroySpMat(matA);
hipsparseDestroyDnMat(matB);
hipsparseDestroyDnMat(matC);
hipsparseDestroy(handle);

hipFree(buffer);
hipFree(dcsrRowPtr);
hipFree(dcsrColInd);
hipFree(dcsrVal);
hipFree(dB);
hipFree(dC);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
opB – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
matB – [in] matrix descriptor.
beta – [in] scalar $β$ .
matC – [in] matrix descriptor.
computeType – [in] floating point precision for the SpMM computation.
alg – [in] SpMM algorithm for the SpMM computation.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, beta, or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

hipsparseSpGEMM_createDescr()#

hipsparseStatus_t hipsparseSpGEMM_createDescr(hipsparseSpGEMMDescr_t *descr)#

Create sparse matrix sparse matrix product descriptor.

hipsparseSpGEMM_createDescr creates a sparse matrix sparse matrix product descriptor. It should be destroyed at the end using hipsparseSpGEMM_destroyDescr().

hipsparseSpGEMM_destroyDescr()#

hipsparseStatus_t hipsparseSpGEMM_destroyDescr(hipsparseSpGEMMDescr_t descr)#

Destroy sparse matrix sparse matrix product descriptor.

hipsparseSpGEMM_destroyDescr destroys a sparse matrix sparse matrix product descriptor and releases all resources used by the descriptor.

hipsparseSpGEMM_workEstimation()#

hipsparseStatus_t hipsparseSpGEMM_workEstimation(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, const void *beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t *bufferSize1, void *externalBuffer1)#

Work estimation step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

hipsparseSpGEMM_workEstimation is called twice. We call it to compute the size of the first required user allocated buffer. After this buffer size is determined, the user allocates it and calls hipsparseSpGEMM_workEstimation a second time with the newly allocated buffer passed in. This second call inspects the matrices $A$ and $B$ to determine the number of intermediate products that will result from multipltying $A$ and $B$ together.

Example (See full example below)

void*  dBuffer1  = NULL; 
size_t bufferSize1 = 0;

hipsparseSpGEMMDescr_t spgemmDesc;
hipsparseSpGEMM_createDescr(&spgemmDesc);

size_t bufferSize1 = 0;
hipsparseSpGEMM_workEstimation(handle, opA, opB,
                              &alpha, matA, matB, &beta, matC,
                              computeType, HIPSPARSE_SPGEMM_DEFAULT,
                              spgemmDesc, &bufferSize1, NULL);
hipMalloc((void**) &dBuffer1, bufferSize1);

// Determine number of intermediate product when computing A * B
hipsparseSpGEMM_workEstimation(handle, opA, opB,
                                &alpha, matA, matB, &beta, matC,
                                computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                spgemmDesc, &bufferSize1, dBuffer1);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
alpha – [in] scalar $α$ .
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
beta – [in] scalar $β$ .
matC – [out] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SpGEMM computation.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.
bufferSize1 – [out] number of bytes of the temporary storage buffer.
externalBuffer1 – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, matA, matB, matC or bufferSize1 pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMM_compute()#

hipsparseStatus_t hipsparseSpGEMM_compute(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, const void *beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t *bufferSize2, void *externalBuffer2)#

Compute step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

hipsparseSpGEMM_compute is called twice. First to compute the size of the second required user allocated buffer. After this buffer size is determined, the user allocates it and calls hipsparseSpGEMM_compute a second time with the newly allocated buffer passed in. This second call performs the actual computation of $C^{'} = α \cdot A \cdot B$ (the result is stored in the temporary buffers).

Example (See full example below)

void*  dBuffer2  = NULL; 
size_t bufferSize2 = 0;

size_t bufferSize2 = 0;
hipsparseSpGEMM_compute(handle, opA, opB,
                        &alpha, matA, matB, &beta, matC,
                        computeType, HIPSPARSE_SPGEMM_DEFAULT,
                        spgemmDesc, &bufferSize2, NULL);
hipMalloc((void**) &dBuffer2, bufferSize2);

// compute the intermediate product of A * B
hipsparseSpGEMM_compute(handle, opA, opB,
                        &alpha, matA, matB, &beta, matC,
                        computeType, HIPSPARSE_SPGEMM_DEFAULT,
                        spgemmDesc, &bufferSize2, dBuffer2);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
alpha – [in] scalar $α$ .
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
beta – [in] scalar $β$ .
matC – [out] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SpGEMM computation.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.
bufferSize2 – [out] number of bytes of the temporary storage buffer.
externalBuffer2 – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, matA, matB, matC or bufferSize2 pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMM_copy()#

hipsparseStatus_t hipsparseSpGEMM_copy(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, const void *beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr)#

Copy step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

hipsparseSpGEMM_copy is called once to copy the results (that are currently stored in the temporary arrays) to the output sparse matrix. If $β! = 0$ , then the $b e t a \cdot C$ portion of the computation: $C^{'} = α \cdot A \cdot B + β * C$ is handled. This is possible because $C^{'}$ and $C$ must have the same sparsity pattern.

Example (Full example)

hipsparseHandle_t     handle = NULL;
hipsparseSpMatDescr_t matA, matB, matC;
void*  dBuffer1  = NULL; 
void*  dBuffer2  = NULL;
size_t bufferSize1 = 0;  
size_t bufferSize2 = 0;

hipsparseCreate(&handle);

// Create sparse matrix A in CSR format
hipsparseCreateCsr(&matA, m, k, nnzA,
                                    dcsrRowPtrA, dcsrColIndA, dcsrValA,
                                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);
hipsparseCreateCsr(&matB, k, n, nnzB,
                                    dcsrRowPtrB, dcsrColIndB, dcsrValB,
                                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);
hipsparseCreateCsr(&matC, m, n, 0,
                                    dcsrRowPtrC, NULL, NULL,
                                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);

hipsparseSpGEMMDescr_t spgemmDesc;
hipsparseSpGEMM_createDescr(&spgemmDesc);

// Determine size of first user allocated buffer
hipsparseSpGEMM_workEstimation(handle, opA, opB,
                                    &alpha, matA, matB, &beta, matC,
                                    computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                    spgemmDesc, &bufferSize1, NULL);
hipMalloc((void**) &dBuffer1, bufferSize1);

// Inspect the matrices A and B to determine the number of intermediate product in 
// C = alpha * A * B
hipsparseSpGEMM_workEstimation(handle, opA, opB,
                                    &alpha, matA, matB, &beta, matC,
                                    computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                    spgemmDesc, &bufferSize1, dBuffer1);

// Determine size of second user allocated buffer
hipsparseSpGEMM_compute(handle, opA, opB,
                            &alpha, matA, matB, &beta, matC,
                            computeType, HIPSPARSE_SPGEMM_DEFAULT,
                            spgemmDesc, &bufferSize2, NULL);
hipMalloc((void**) &dBuffer2, bufferSize2);

// Compute C = alpha * A * B and store result in temporary buffers
hipsparseSpGEMM_compute(handle, opA, opB,
                                    &alpha, matA, matB, &beta, matC,
                                    computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                    spgemmDesc, &bufferSize2, dBuffer2);

// Get matrix C non-zero entries C_nnz1
int64_t C_num_rows1, C_num_cols1, C_nnz1;
hipsparseSpMatGetSize(matC, &C_num_rows1, &C_num_cols1, &C_nnz1);

// Allocate the CSR structures for the matrix C
hipMalloc((void**) &dcsrColIndC, C_nnz1 * sizeof(int));
hipMalloc((void**) &dcsrValC,  C_nnz1 * sizeof(float));

// Update matC with the new pointers
hipsparseCsrSetPointers(matC, dcsrRowPtrC, dcsrColIndC, dcsrValC);

// Copy the final products to the matrix C
hipsparseSpGEMM_copy(handle, opA, opB,
                        &alpha, matA, matB, &beta, matC,
                        computeType, HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc);

// Destroy matrix descriptors and handles
hipsparseSpGEMM_destroyDescr(spgemmDesc);
hipsparseDestroySpMat(matA);
hipsparseDestroySpMat(matB);
hipsparseDestroySpMat(matC);
hipsparseDestroy(handle);

// Free device memory
hipFree(dBuffer1);
hipFree(dBuffer2);

Note

The two user allocated temporary buffers can only be freed after the call to hipsparseSpGEMM_copy

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
alpha – [in] scalar $α$ .
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
beta – [in] scalar $β$ .
matC – [out] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SpGEMM computation.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, matA, matB, matC pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMMreuse_workEstimation()#

hipsparseStatus_t hipsparseSpGEMMreuse_workEstimation(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t *bufferSize1, void *externalBuffer1)#

Work estimation step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

hipsparseSpGEMMreuse_workEstimation is called twice. We call it to compute the size of the first required user allocated buffer. After this buffer size is determined, the user allocates it and calls hipsparseSpGEMMreuse_workEstimation a second time with the newly allocated buffer passed in. This second call inspects the matrices $A$ and $B$ to determine the number of intermediate products that will result from multipltying $A$ and $B$ together.

Example (See full example below)

void*  dBuffer1  = NULL; 
size_t bufferSize1 = 0;

hipsparseSpGEMMDescr_t spgemmDesc;
hipsparseSpGEMM_createDescr(&spgemmDesc);

size_t bufferSize1 = 0;
hipsparseSpGEMMreuse_workEstimation(handle, opA, opB, matA, matB, matC,
                                    HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc, 
                                    &bufferSize1, NULL);
hipMalloc((void**) &dBuffer1, bufferSize1);

// Determine number of intermediate product when computing A * B
hipsparseSpGEMMreuse_workEstimation(handle, opA, opB, matA, matB, matC,
                                    HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc, 
                                    &bufferSize1, dBuffer1);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
matC – [out] sparse matrix $C$ descriptor.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.
bufferSize1 – [out] number of bytes of the temporary storage buffer.
externalBuffer1 – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, matC or bufferSize1 pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMMreuse_nnz()#

hipsparseStatus_t hipsparseSpGEMMreuse_nnz(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t *bufferSize2, void *externalBuffer2, size_t *bufferSize3, void *externalBuffer3, size_t *bufferSize4, void *externalBuffer4)#

Nnz calculation step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

Example (See full example below)

// Determine size of second, third, and fourth user allocated buffer
hipsparseSpGEMMreuse_nnz(handle, opA, opB, matA, matB,
                            matC, HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                            &bufferSize2, NULL, &bufferSize3, NULL,
                            &bufferSize4, NULL);

hipMalloc((void**) &dBuffer2, bufferSize2);
hipMalloc((void**) &dBuffer3, bufferSize3);
hipMalloc((void**) &dBuffer4, bufferSize4);

// COmpute sparsity pattern of C matrix and store in temporary buffers
hipsparseSpGEMMreuse_nnz(handle, opA, opB, matA, matB,
                            matC, HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                            &bufferSize2, dBuffer2, &bufferSize3, dBuffer3,
                            &bufferSize4, dBuffer4);

// We can now free buffer 1 and 2
hipFree(dBuffer1);
hipFree(dBuffer2);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
matC – [out] sparse matrix $C$ descriptor.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.
bufferSize2 – [out] number of bytes of the temporary storage externalBuffer2.
externalBuffer2 – [in] temporary storage buffer allocated by the user.
bufferSize3 – [out] number of bytes of the temporary storage externalBuffer3.
externalBuffer3 – [in] temporary storage buffer allocated by the user.
bufferSize4 – [out] number of bytes of the temporary storage externalBuffer4.
externalBuffer4 – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, matC, bufferSize2, bufferSize3 or bufferSize4 pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMMreuse_copy()#

hipsparseStatus_t hipsparseSpGEMMreuse_copy(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, hipsparseSpMatDescr_t matC, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr, size_t *bufferSize5, void *externalBuffer5)#

Copy step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

Example (See full example below)

// Get matrix C non-zero entries nnzC
int64_t rowsC, colsC, nnzC;
hipsparseSpMatGetSize(matC, &rowsC, &colsC, &nnzC);

// Allocate matrix C
hipMalloc((void**) &dcsrColIndC, sizeof(int) * nnzC);
hipMalloc((void**) &dcsrValC,  sizeof(float) * nnzC);

// Update matC with the new pointers. The C values array can be filled with data here
// which is used if beta != 0.
hipsparseCsrSetPointers(matC, dcsrRowPtrC, dcsrColIndC, dcsrValC);

// Determine size of fifth user allocated buffer
hipsparseSpGEMMreuse_copy(handle, opA, opB, matA, matB, matC,
                             HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                             &bufferSize5, NULL);

hipMalloc((void**) &dBuffer5, bufferSize5);

// Copy data from temporary buffers to the newly allocated C matrix
hipsparseSpGEMMreuse_copy(handle, opA, opB, matA, matB, matC,
                             HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                             &bufferSize5, dBuffer5);

// We can now free buffer 3
hipFree(dBuffer3);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
matC – [out] sparse matrix $C$ descriptor.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.
bufferSize5 – [out] number of bytes of the temporary storage externalBuffer5.
externalBuffer5 – [in] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, matA, matB, matC, or bufferSize5 pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSpGEMMreuse_compute()#

hipsparseStatus_t hipsparseSpGEMMreuse_compute(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstSpMatDescr_t matB, const void *beta, hipsparseSpMatDescr_t matC, hipDataType computeType, hipsparseSpGEMMAlg_t alg, hipsparseSpGEMMDescr_t spgemmDescr)#

Copy step of the sparse matrix sparse matrix product:

C^{'} := α \cdot o p (A) \cdot o p (B) + β \cdot C,

where

C^{'}

,

A

,

B

,

C

are sparse matrices and

C^{'}

and

C

have the same sparsity pattern.

Full example

int m = 2;
int k = 2;
int n = 3;
int nnzA = 4;
int nnzB = 4;

float alpha{1.0f};
float beta{0.0f};

hipsparseOperation_t opA        = HIPSPARSE_OPERATION_NON_TRANSPOSE;
hipsparseOperation_t opB        = HIPSPARSE_OPERATION_NON_TRANSPOSE;
hipDataType computeType         = HIP_R_32F;

// A, B, and C are m×k, k×n, and m×n

// A
std::vector<int> hcsrRowPtrA = {0, 2, 4};
std::vector<int> hcsrColIndA = {0, 1, 0, 1};
std::vector<float> hcsrValA = {1.0f, 2.0f, 3.0f, 4.0f};

// B
std::vector<int> hcsrRowPtrB = {0, 2, 4};
std::vector<int> hcsrColIndB = {1, 2, 0, 2};
std::vector<float> hcsrValB = {5.0f , 6.0f, 7.0f, 8.0f};

// Device memory management: Allocate and copy A, B
int* dcsrRowPtrA;
int* dcsrColIndA;
float* dcsrValA;
int* dcsrRowPtrB;
int* dcsrColIndB;
float* dcsrValB;
int* dcsrRowPtrC;
int* dcsrColIndC;
float* dcsrValC;
hipMalloc((void**)&dcsrRowPtrA, (m + 1) * sizeof(int));
hipMalloc((void**)&dcsrColIndA, nnzA * sizeof(int));
hipMalloc((void**)&dcsrValA, nnzA * sizeof(float));
hipMalloc((void**)&dcsrRowPtrB, (k + 1) * sizeof(int));
hipMalloc((void**)&dcsrColIndB, nnzB * sizeof(int));
hipMalloc((void**)&dcsrValB, nnzB * sizeof(float));
hipMalloc((void**)&dcsrRowPtrC, (m + 1) * sizeof(int));

hipMemcpy(dcsrRowPtrA, hcsrRowPtrA.data(), (m + 1) * sizeof(int), hipMemcpyHostToDevice);
hipMemcpy(dcsrColIndA, hcsrColIndA.data(), nnzA * sizeof(int), hipMemcpyHostToDevice);
hipMemcpy(dcsrValA, hcsrValA.data(), nnzA * sizeof(float), hipMemcpyHostToDevice);
hipMemcpy(dcsrRowPtrB, hcsrRowPtrB.data(), (k + 1) * sizeof(int), hipMemcpyHostToDevice);
hipMemcpy(dcsrColIndB, hcsrColIndB.data(), nnzB * sizeof(int), hipMemcpyHostToDevice);
hipMemcpy(dcsrValB, hcsrValB.data(), nnzB * sizeof(float), hipMemcpyHostToDevice);

hipsparseHandle_t     handle = NULL;
hipsparseSpMatDescr_t matA, matB, matC;
void*  dBuffer1  = NULL; 
void*  dBuffer2  = NULL;
void*  dBuffer3  = NULL;
void*  dBuffer4  = NULL;
void*  dBuffer5  = NULL;
size_t bufferSize1 = 0;  
size_t bufferSize2 = 0;
size_t bufferSize3 = 0;
size_t bufferSize4 = 0;
size_t bufferSize5 = 0;

hipsparseCreate(&handle);

// Create sparse matrix A in CSR format
hipsparseCreateCsr(&matA, m, k, nnzA,
                    dcsrRowPtrA, dcsrColIndA, dcsrValA,
                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);
hipsparseCreateCsr(&matB, k, n, nnzB,
                    dcsrRowPtrB, dcsrColIndB, dcsrValB,
                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);
hipsparseCreateCsr(&matC, m, n, 0,
                    dcsrRowPtrC, NULL, NULL,
                    HIPSPARSE_INDEX_32I, HIPSPARSE_INDEX_32I,
                    HIPSPARSE_INDEX_BASE_ZERO, HIP_R_32F);

hipsparseSpGEMMDescr_t spgemmDesc;
hipsparseSpGEMM_createDescr(&spgemmDesc);

// Determine size of first user allocated buffer
hipsparseSpGEMMreuse_workEstimation(handle, opA, opB, matA, matB, matC,
                                    HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc, 
                                    &bufferSize1, NULL);

hipMalloc((void**) &dBuffer1, bufferSize1);

// Inspect the matrices A and B to determine the number of intermediate product in 
// C = alpha * A * B
hipsparseSpGEMMreuse_workEstimation(handle, opA, opB, matA, matB, matC,
                                    HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc, 
                                    &bufferSize1, dBuffer1);

// Determine size of second, third, and fourth user allocated buffer
hipsparseSpGEMMreuse_nnz(handle, opA, opB, matA, matB,
                            matC, HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                            &bufferSize2, NULL, &bufferSize3, NULL,
                            &bufferSize4, NULL);

hipMalloc((void**) &dBuffer2, bufferSize2);
hipMalloc((void**) &dBuffer3, bufferSize3);
hipMalloc((void**) &dBuffer4, bufferSize4);

// COmpute sparsity pattern of C matrix and store in temporary buffers
hipsparseSpGEMMreuse_nnz(handle, opA, opB, matA, matB,
                            matC, HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                            &bufferSize2, dBuffer2, &bufferSize3, dBuffer3,
                            &bufferSize4, dBuffer4);

// We can now free buffer 1 and 2
hipFree(dBuffer1);
hipFree(dBuffer2);

// Get matrix C non-zero entries nnzC
int64_t rowsC, colsC, nnzC;
hipsparseSpMatGetSize(matC, &rowsC, &colsC, &nnzC);

// Allocate matrix C
hipMalloc((void**) &dcsrColIndC, sizeof(int) * nnzC);
hipMalloc((void**) &dcsrValC,  sizeof(float) * nnzC);

// Update matC with the new pointers. The C values array can be filled with data here
// which is used if beta != 0.
hipsparseCsrSetPointers(matC, dcsrRowPtrC, dcsrColIndC, dcsrValC);

// Determine size of fifth user allocated buffer
hipsparseSpGEMMreuse_copy(handle, opA, opB, matA, matB, matC,
                             HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                             &bufferSize5, NULL);

hipMalloc((void**) &dBuffer5, bufferSize5);

// Copy data from temporary buffers to the newly allocated C matrix
hipsparseSpGEMMreuse_copy(handle, opA, opB, matA, matB, matC,
                             HIPSPARSE_SPGEMM_DEFAULT, spgemmDesc,
                             &bufferSize5, dBuffer5);

// We can now free buffer 3
hipFree(dBuffer3);

// Compute C' = alpha * A * B + beta * C
hipsparseSpGEMMreuse_compute(handle, opA, opB, &alpha, matA, matB, &beta,
                                matC, computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                spgemmDesc);

// Copy results back to host if required using hipsparseCsrGet...

// Update dcsrValA, dcsrValB with new values
for(size_t i = 0; i < hcsrValA.size(); i++){ hcsrValA[i] = 1.0f; }
for(size_t i = 0; i < hcsrValB.size(); i++){ hcsrValB[i] = 2.0f; }

hipMemcpy(dcsrValA, hcsrValA.data(), sizeof(float) * nnzA, hipMemcpyHostToDevice);
hipMemcpy(dcsrValB, hcsrValB.data(), sizeof(float) * nnzB, hipMemcpyHostToDevice);

// Compute C' = alpha * A * B + beta * C again with the new A and B values
hipsparseSpGEMMreuse_compute(handle, opA, opB, &alpha, matA, matB, &beta,
                                matC, computeType, HIPSPARSE_SPGEMM_DEFAULT,
                                spgemmDesc);

// Copy results back to host if required using hipsparseCsrGet...

// Destroy matrix descriptors and handles
hipsparseSpGEMM_destroyDescr(spgemmDesc);
hipsparseDestroySpMat(matA);
hipsparseDestroySpMat(matB);
hipsparseDestroySpMat(matC);
hipsparseDestroy(handle);

// Free device memory
hipFree(dBuffer4);
hipFree(dBuffer5);
hipFree(dcsrRowPtrA);
hipFree(dcsrColIndA);
hipFree(dcsrValA);
hipFree(dcsrRowPtrB);
hipFree(dcsrColIndB);
hipFree(dcsrValB);
hipFree(dcsrRowPtrC);
hipFree(dcsrColIndC);
hipFree(dcsrValC);

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] sparse matrix $A$ operation type.
opB – [in] sparse matrix $B$ operation type.
alpha – [in] scalar $α$ .
matA – [in] sparse matrix $A$ descriptor.
matB – [in] sparse matrix $B$ descriptor.
beta – [in] scalar $β$ .
matC – [out] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SpGEMM computation.
alg – [in] SpGEMM algorithm for the SpGEMM computation.
spgemmDescr – [in] SpGEMM descriptor.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, matA, matB, or matC pointer is invalid.
HIPSPARSE_STATUS_ALLOC_FAILED – additional buffer for long rows could not be allocated.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA != HIPSPARSE_OPERATION_NON_TRANSPOSE or opB != HIPSPARSE_OPERATION_NON_TRANSPOSE.

hipsparseSDDMM_bufferSize()#

hipsparseStatus_t hipsparseSDDMM_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstDnMatDescr_t A, hipsparseConstDnMatDescr_t B, const void *beta, hipsparseSpMatDescr_t C, hipDataType computeType, hipsparseSDDMMAlg_t alg, size_t *pBufferSizeInBytes)#

Calculate the buffer size required for the sampled dense dense matrix multiplication:

C := α (o p (A) \cdot o p (B)) \circ s p y (C) + β \cdot C,

where

C

is a sparse matrix and

A

and

B

are dense matrices.

hipsparseSDDMM_bufferSize computes the required user allocated buffer size needed when computing the sampled dense dense matrix multiplication

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] dense matrix $A$ operation type.
opB – [in] dense matrix $B$ operation type.
alpha – [in] scalar $α$ .
A – [in] dense matrix $A$ descriptor.
B – [in] dense matrix $B$ descriptor.
beta – [in] scalar $β$ .
C – [inout] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SDDMM computation.
alg – [in] specification of the algorithm to use.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, A, B, D, C or pBufferSizeInBytes pointer is invalid or the value of opA or opB is incorrect
HIPSPARSE_STATUS_NOT_SUPPORTED – opA == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE or opB == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE.

hipsparseSDDMM_preprocess()#

hipsparseStatus_t hipsparseSDDMM_preprocess(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstDnMatDescr_t A, hipsparseConstDnMatDescr_t B, const void *beta, hipsparseSpMatDescr_t C, hipDataType computeType, hipsparseSDDMMAlg_t alg, void *tempBuffer)#

Preprocess step of the sampled dense dense matrix multiplication:

C := α (o p (A) \cdot o p (B)) \circ s p y (C) + β \cdot C,

where

C

is a sparse matrix and

A

and

B

are dense matrices.

hipsparseSDDMM_preprocess performs the required preprocessing used when computing the sampled dense dense matrix multiplication

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] dense matrix $A$ operation type.
opB – [in] dense matrix $B$ operation type.
alpha – [in] scalar $α$ .
A – [in] dense matrix $A$ descriptor.
B – [in] dense matrix $B$ descriptor.
beta – [in] scalar $β$ .
C – [inout] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SDDMM computation.
alg – [in] specification of the algorithm to use.
tempBuffer – [in] temporary storage buffer allocated by the user. The size must be greater or equal to the size obtained with hipsparseSDDMM_bufferSize.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, A, B, C or tempBuffer pointer is invalid or the value of opA or opB is incorrect.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE or opB == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE.

hipsparseSDDMM()#

hipsparseStatus_t hipsparseSDDMM(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstDnMatDescr_t A, hipsparseConstDnMatDescr_t B, const void *beta, hipsparseSpMatDescr_t C, hipDataType computeType, hipsparseSDDMMAlg_t alg, void *tempBuffer)#

Description: Sampled Dense-Dense Matrix Multiplication.

hipsparseSDDMM multiplies the scalar $α$ with the dense $m \times k$ matrix $A$ , the dense $k \times n$ matrix $B$ , filtered by the sparsity pattern of the $m \times n$ sparse matrix $C$ and adds the result to $C$ scaled by $β$ . The final result is stored in the sparse $m \times n$ matrix $C$ , such that

C := α (o p (A) \cdot o p (B)) \circ s p y (C) + β C,

with

\begin{array}{r} o p (A) = {\begin{cases} A, & if opA == HIPSPARSE_OPERATION_NON_TRANSPOSE \\ A^{T}, & if opA == HIPSPARSE_OPERATION_TRANSPOSE \end{cases} \end{array}

,

\begin{array}{r} o p (B) = {\begin{cases} B, & if opB == HIPSPARSE_OPERATION_NON_TRANSPOSE \\ B^{T}, & if opB == HIPSPARSE_OPERATION_TRANSPOSE \end{cases} \end{array}

and

\begin{array}{r} s p y (C)_{i j} = {\begin{cases} 1 if i == j, & 0 if i != j \end{cases} \end{array}

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] dense matrix $A$ operation type.
opB – [in] dense matrix $B$ operation type.
alpha – [in] scalar $α$ .
A – [in] dense matrix $A$ descriptor.
B – [in] dense matrix $B$ descriptor.
beta – [in] scalar $β$ .
C – [inout] sparse matrix $C$ descriptor.
computeType – [in] floating point precision for the SDDMM computation.
alg – [in] specification of the algorithm to use.
tempBuffer – [in] temporary storage buffer allocated by the user. The size must be greater or equal to the size obtained with hipsparseSDDMM_bufferSize.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, beta, A, B, C or tempBuffer pointer is invalid or the value of opA or opB is incorrect.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE or opB == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE.

hipsparseSpSV_createDescr()#

hipsparseStatus_t hipsparseSpSV_createDescr(hipsparseSpSVDescr_t *descr)#

Create sparse matrix triangular solve descriptor.

hipsparseSpSV_createDescr creates a sparse matrix triangular solve descriptor. It should be destroyed at the end using hipsparseSpSV_destroyDescr().

hipsparseSpSV_destroyDescr()#

hipsparseStatus_t hipsparseSpSV_destroyDescr(hipsparseSpSVDescr_t descr)#

Destroy sparse matrix triangular solve descriptor.

hipsparseSpSV_destroyDescr destroys a sparse matrix triangular solve descriptor and releases all resources used by the descriptor.

hipsparseSpSV_bufferSize()#

hipsparseStatus_t hipsparseSpSV_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t x, const hipsparseDnVecDescr_t y, hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr, size_t *pBufferSizeInBytes)#

Buffer size step of solution of triangular linear system:

o p (A) \cdot y := α \cdot x,

where

A

is a sparse matrix in CSR storage format,

x

and

y

are dense vectors.

hipsparseSpSV_bufferSize computes the required user allocated buffer size needed when computing the solution of triangular linear system $o p (A) \cdot y = α \cdot x$ , where $A$ is a sparse matrix in CSR storage format, $x$ and $y$ are dense vectors.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
x – [in] vector descriptor.
y – [inout] vector descriptor.
computeType – [in] floating point precision for the SpSV computation.
alg – [in] SpSV algorithm for the SpSV computation.
spsvDescr – [in] SpSV descriptor.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, y, spsvDescr or pBufferSizeInBytes pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, computeType or alg is currently not supported.

hipsparseSpSV_analysis()#

hipsparseStatus_t hipsparseSpSV_analysis(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t x, const hipsparseDnVecDescr_t y, hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr, void *externalBuffer)#

Analysis step of solution of triangular linear system:

o p (A) \cdot y := α \cdot x,

where

A

is a sparse matrix in CSR storage format,

x

and

y

are dense vectors.

hipsparseSpSV_analysis performs the required analysis used when computing the solution of triangular linear system $o p (A) \cdot y = α \cdot x$ , where $A$ is a sparse matrix in CSR storage format, $x$ and $y$ are dense vectors.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
x – [in] vector descriptor.
y – [inout] vector descriptor.
computeType – [in] floating point precision for the SpSV computation.
alg – [in] SpSV algorithm for the SpSV computation.
spsvDescr – [in] SpSV descriptor.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, y, spsvDescr or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, computeType or alg is currently not supported.

hipsparseSpSV_solve()#

hipsparseStatus_t hipsparseSpSV_solve(hipsparseHandle_t handle, hipsparseOperation_t opA, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnVecDescr_t x, const hipsparseDnVecDescr_t y, hipDataType computeType, hipsparseSpSVAlg_t alg, hipsparseSpSVDescr_t spsvDescr)#

Sparse triangular solve.

hipsparseSpSV_solve solves a sparse triangular linear system of a sparse $m \times m$ matrix, defined in CSR or COO storage format, a dense solution vector $y$ and the right-hand side $x$ that is multiplied by $α$ , such that

o p (A) \cdot y = α \cdot x,

with

\begin{array}{r} o p (A) = {\begin{cases} A, & if trans == HIPSPARSE_OPERATION_NON_TRANSPOSE \\ A^{T}, & if trans == HIPSPARSE_OPERATION_TRANSPOSE \\ A^{H}, & if trans == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE \end{cases} \end{array}

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type.
alpha – [in] scalar $α$ .
matA – [in] matrix descriptor.
x – [in] vector descriptor.
y – [inout] vector descriptor.
computeType – [in] floating point precision for the SpSV computation.
alg – [in] SpSV algorithm for the SpSV computation.
spsvDescr – [in] SpSV descriptor.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, x, y, or spsvDescr pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, computeType or alg is currently not supported.

hipsparseSpSM_createDescr()#

hipsparseStatus_t hipsparseSpSM_createDescr(hipsparseSpSMDescr_t *descr)#

Create sparse matrix triangular solve with multiple rhs descriptor.

hipsparseSpSM_createDescr creates a sparse matrix triangular solve with multiple rhs descriptor. It should be destroyed at the end using hipsparseSpSM_destroyDescr().

hipsparseSpSM_destroyDescr()#

hipsparseStatus_t hipsparseSpSM_destroyDescr(hipsparseSpSMDescr_t descr)#

Destroy sparse matrix triangular solve with multiple rhs descriptor.

hipsparseSpSM_destroyDescr destroys a sparse matrix triangular solve with multiple rhs descriptor and releases all resources used by the descriptor.

hipsparseSpSM_bufferSize()#

hipsparseStatus_t hipsparseSpSM_bufferSize(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpSMAlg_t alg, hipsparseSpSMDescr_t spsmDescr, size_t *pBufferSizeInBytes)#

Buffer size step of solution of triangular linear system:

o p (A) \cdot C := α \cdot o p (B),

where

A

is a sparse matrix in CSR storage format,

B

and

C

are dense matrices.

hipsparseSpSM_bufferSize computes the required user allocated buffer size needed when computing the solution of triangular linear system $o p (A) \cdot C = α \cdot o p (B)$ , where $A$ is a sparse matrix in CSR storage format, $B$ and $C$ are dense matrices.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type for the sparse matrix $A$ .
opB – [in] matrix operation type for the dense matrix $B$ .
alpha – [in] scalar $α$ .
matA – [in] sparse matrix descriptor.
matB – [in] dense matrix descriptor.
matC – [inout] dense matrix descriptor.
computeType – [in] floating point precision for the SpSM computation.
alg – [in] SpSM algorithm for the SpSM computation.
spsmDescr – [in] SpSM descriptor.
pBufferSizeInBytes – [out] number of bytes of the temporary storage buffer.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, spsmDescr or pBufferSizeInBytes pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

hipsparseSpSM_analysis()#

hipsparseStatus_t hipsparseSpSM_analysis(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpSMAlg_t alg, hipsparseSpSMDescr_t spsmDescr, void *externalBuffer)#

Analysis step of solution of triangular linear system:

o p (A) \cdot C := α \cdot o p (B),

where

A

is a sparse matrix in CSR storage format,

B

and

C

are dense vectors.

hipsparseSpSM_analysis performs the required analysis used when computing the solution of triangular linear system $o p (A) \cdot C = α \cdot o p (B)$ , where $A$ is a sparse matrix in CSR storage format, $B$ and $C$ are dense vectors.

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type for the sparse matrix $A$ .
opB – [in] matrix operation type for the dense matrix $B$ .
alpha – [in] scalar $α$ .
matA – [in] sparse matrix descriptor.
matB – [in] dense matrix descriptor.
matC – [inout] dense matrix descriptor.
computeType – [in] floating point precision for the SpSM computation.
alg – [in] SpSM algorithm for the SpSM computation.
spsmDescr – [in] SpSM descriptor.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, spsmDescr or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

hipsparseSpSM_solve()#

hipsparseStatus_t hipsparseSpSM_solve(hipsparseHandle_t handle, hipsparseOperation_t opA, hipsparseOperation_t opB, const void *alpha, hipsparseConstSpMatDescr_t matA, hipsparseConstDnMatDescr_t matB, const hipsparseDnMatDescr_t matC, hipDataType computeType, hipsparseSpSMAlg_t alg, hipsparseSpSMDescr_t spsmDescr, void *externalBuffer)#

Sparse triangular system solve.

hipsparseSpSM_solve solves a sparse triangular linear system of a sparse $m \times m$ matrix, defined in CSR or COO storage format, a dense solution matrix $C$ and the right-hand side $B$ that is multiplied by $α$ , such that

o p (A) \cdot C = α \cdot o p (B),

with

\begin{array}{r} o p (A) = {\begin{cases} A, & if trans == HIPSPARSE_OPERATION_NON_TRANSPOSE \\ A^{T}, & if trans == HIPSPARSE_OPERATION_TRANSPOSE \\ A^{H}, & if trans == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE \end{cases} \end{array}

and

\begin{array}{r} o p (B) = {\begin{cases} B, & if transB == HIPSPARSE_OPERATION_NON_TRANSPOSE \\ B^{T}, & if transB == HIPSPARSE_OPERATION_TRANSPOSE \\ B^{H}, & if transB == HIPSPARSE_OPERATION_CONJUGATE_TRANSPOSE \end{cases} \end{array}

Parameters:

handle – [in] handle to the hipsparse library context queue.
opA – [in] matrix operation type for the sparse matrix $A$ .
opB – [in] matrix operation type for the dense matrix $B$ .
alpha – [in] scalar $α$ .
matA – [in] sparse matrix descriptor.
matB – [in] dense matrix descriptor.
matC – [inout] dense matrix descriptor.
computeType – [in] floating point precision for the SpSM computation.
alg – [in] SpSM algorithm for the SpSM computation.
spsmDescr – [in] SpSM descriptor.
externalBuffer – [out] temporary storage buffer allocated by the user.

Return values:

HIPSPARSE_STATUS_SUCCESS – the operation completed successfully.
HIPSPARSE_STATUS_INVALID_VALUE – handle, alpha, matA, matB, matC, spsmDescr or externalBuffer pointer is invalid.
HIPSPARSE_STATUS_NOT_SUPPORTED – opA, opB, computeType or alg is currently not supported.

Sparse Generic Functions

Contents

Sparse Generic Functions#

hipsparseAxpby()#

hipsparseGather()#

hipsparseScatter()#

hipsparseRot()#

hipsparseSparseToDense_bufferSize()#

hipsparseSparseToDense()#

hipsparseDenseToSparse_bufferSize()#

hipsparseDenseToSparse_analysis()#

hipsparseDenseToSparse_convert()#

hipsparseSpVV_bufferSize()#

hipsparseSpVV()#

hipsparseSpMV_bufferSize()#

hipsparseSpMV_preprocess()#

hipsparseSpMV()#

hipsparseSpMM_bufferSize()#

hipsparseSpMM_preprocess()#

hipsparseSpMM()#

hipsparseSpGEMM_createDescr()#

hipsparseSpGEMM_destroyDescr()#

hipsparseSpGEMM_workEstimation()#

hipsparseSpGEMM_compute()#

hipsparseSpGEMM_copy()#

hipsparseSpGEMMreuse_workEstimation()#

hipsparseSpGEMMreuse_nnz()#

hipsparseSpGEMMreuse_copy()#

hipsparseSpGEMMreuse_compute()#

hipsparseSDDMM_bufferSize()#

hipsparseSDDMM_preprocess()#

hipsparseSDDMM()#

hipsparseSpSV_createDescr()#

hipsparseSpSV_destroyDescr()#

hipsparseSpSV_bufferSize()#

hipsparseSpSV_analysis()#

hipsparseSpSV_solve()#

hipsparseSpSM_createDescr()#

hipsparseSpSM_destroyDescr()#

hipsparseSpSM_bufferSize()#

hipsparseSpSM_analysis()#

hipsparseSpSM_solve()#