34 scalar_t alpha_ = scalar_t(alpha);
35 scalar_t beta_ = scalar_t(beta);
37 gemm_cuda(handle, gemmTrA ? CUBLAS_OP_T : CUBLAS_OP_N,
38 gemmTrB ? CUBLAS_OP_T : CUBLAS_OP_N, m, n, k, &alpha_,
39 static_cast<const scalar_t*
>(A_data), lda,
40 static_cast<const scalar_t*
>(B_data), ldb, &beta_,
41 static_cast<scalar_t*
>(C_data), ldc),
#define DISPATCH_LINALG_DTYPE_TO_TEMPLATE(DTYPE,...)
ccGuiPythonInstance * GetInstance() noexcept
void AddMMCUDA(void *A_data, void *B_data, void *C_data, int64_t m, int64_t k, int64_t n, double alpha, double beta, bool gemmTrA, bool gemmTrB, int lda, int ldb, int ldc, Dtype dtype, const Device &device)
Generic file read and write utility for the Python interface.