PaStiX Handbook  6.3.2
pastix_cuda.h File Reference

Go to the source code of this file.

Data Structures

struct  gemm_param_s
 
struct  gemm_params_s
 

Macros

#define MAX_BATCH_COUNT   16
 

Typedefs

typedef struct gemm_param_s gemm_param_t
 
typedef struct gemm_params_s gemm_params_t
 

Functions

void pastix_zgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, cuDoubleComplex alpha, const cuDoubleComplex *dB, pastix_int_t lddb, cuDoubleComplex beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params)
 
void pastix_cgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, cuFloatComplex alpha, const cuFloatComplex *dB, pastix_int_t lddb, cuFloatComplex beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params)
 
void pastix_dgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, double alpha, const double *dB, pastix_int_t lddb, double beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params)
 
void pastix_sgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, float alpha, const float *dB, pastix_int_t lddb, float beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params)
 
void pastix_fermi_zgemmsp (char TRANSA, char TRANSB, int m, int n, int k, cuDoubleComplex alpha, const cuDoubleComplex *gpu_A, int lda, const cuDoubleComplex *gpu_B, int ldb, cuDoubleComplex beta, cuDoubleComplex *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream)
 
void pastix_fermi_cgemmsp (char TRANSA, char TRANSB, int m, int n, int k, cuFloatComplex alpha, const cuFloatComplex *gpu_A, int lda, const cuFloatComplex *gpu_B, int ldb, cuFloatComplex beta, cuFloatComplex *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream)
 
void pastix_fermi_dgemmsp (char TRANSA, char TRANSB, int m, int n, int k, double alpha, const double *gpu_A, int lda, const double *gpu_B, int ldb, double beta, double *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream)
 
void pastix_fermi_sgemmsp (char TRANSA, char TRANSB, int m, int n, int k, float alpha, const float *gpu_A, int lda, const float *gpu_B, int ldb, float beta, float *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream)
 

Detailed Description

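PaStiX GPU kernel header. It declares the pastix_{s,d,c,z}gemm_vbatched_nt and pastix_fermi_{s,d,c,z}gemmsp CUDA routines (float, double, cuFloatComplex and cuDoubleComplex variants), together with the gemm_param_t / gemm_params_t structures; a gemm_params_t holds up to MAX_BATCH_COUNT (16) gemm_param_t entries and is the last argument of the vbatched routines.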

Version
6.3.2
Author
Mathieu Faverge
Date
2023-07-21

Definition in file pastix_cuda.h.


Data Type Documentation

◆ gemm_param_s

struct gemm_param_s

Definition at line 23 of file pastix_cuda.h.

Data Fields
const void * Aptr
void * Cptr
pastix_int_t M
pastix_int_t lda
pastix_int_t ldc

◆ gemm_params_s

struct gemm_params_s

Definition at line 31 of file pastix_cuda.h.

Data Fields
gemm_param_t p[MAX_BATCH_COUNT]