|
void | pastix_zgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, cuDoubleComplex alpha, const cuDoubleComplex *dB, pastix_int_t lddb, cuDoubleComplex beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params) |
|
void | pastix_cgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, cuFloatComplex alpha, const cuFloatComplex *dB, pastix_int_t lddb, cuFloatComplex beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params) |
|
void | pastix_dgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, double alpha, const double *dB, pastix_int_t lddb, double beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params) |
|
void | pastix_sgemm_vbatched_nt (pastix_trans_t transB, pastix_int_t n, pastix_int_t k, float alpha, const float *dB, pastix_int_t lddb, float beta, pastix_int_t max_m, pastix_int_t batchCount, cudaStream_t stream, gemm_params_t params) |
|
void | pastix_fermi_zgemmsp (char TRANSA, char TRANSB, int m, int n, int k, cuDoubleComplex alpha, const cuDoubleComplex *gpu_A, int lda, const cuDoubleComplex *gpu_B, int ldb, cuDoubleComplex beta, cuDoubleComplex *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream) |
|
void | pastix_fermi_cgemmsp (char TRANSA, char TRANSB, int m, int n, int k, cuFloatComplex alpha, const cuFloatComplex *gpu_A, int lda, const cuFloatComplex *gpu_B, int ldb, cuFloatComplex beta, cuFloatComplex *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream) |
|
void | pastix_fermi_dgemmsp (char TRANSA, char TRANSB, int m, int n, int k, double alpha, const double *gpu_A, int lda, const double *gpu_B, int ldb, double beta, double *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream) |
|
void | pastix_fermi_sgemmsp (char TRANSA, char TRANSB, int m, int n, int k, float alpha, const float *gpu_A, int lda, const float *gpu_B, int ldb, float beta, float *gpu_C, int ldc, int blocknbr, const int *blocktab, int fblocknbr, const int *fblocktab, cudaStream_t stream) |
|
PaStiX GPU kernel header.
- Copyright: 2016-2024 Bordeaux INP, CNRS (LaBRI UMR 5800), Inria, Univ. Bordeaux. All rights reserved.
- Version: 6.4.0
- Author: Mathieu Faverge
- Date: 2024-07-05
Definition in file pastix_cuda.h.