#pragma once #include #include #include #include #if !AT_MKL_ENABLED() #define MKL_INT int #else #include #endif namespace at { namespace native { void mkl_gemm_batched( TransposeType trans_A, TransposeType trans_B, MKL_INT batch_size, MKL_INT M, MKL_INT N, MKL_INT K, float alpha, const float** A, MKL_INT lda, const float** B, MKL_INT ldb, float beta, float** C, MKL_INT ldc); void mkl_gemm_batched( TransposeType trans_A, TransposeType trans_B, MKL_INT batch_size, MKL_INT M, MKL_INT N, MKL_INT K, double alpha, const double** A, MKL_INT lda, const double** B, MKL_INT ldb, double beta, double** C, MKL_INT ldc); void mkl_gemm_batched( TransposeType trans_A, TransposeType trans_B, MKL_INT batch_size, MKL_INT M, MKL_INT N, MKL_INT K, c10::complex alpha, const c10::complex** A, MKL_INT lda, const c10::complex** B, MKL_INT ldb, c10::complex beta, c10::complex** C, MKL_INT ldc); void mkl_gemm_batched( TransposeType trans_A, TransposeType trans_B, MKL_INT batch_size, MKL_INT M, MKL_INT N, MKL_INT K, c10::complex alpha, const c10::complex** A, MKL_INT lda, const c10::complex** B, MKL_INT ldb, c10::complex beta, c10::complex** C, MKL_INT ldc); void mkl_gemm_bf16bf16f32( TransposeType trans_A, TransposeType trans_B, MKL_INT M, MKL_INT N, MKL_INT K, const float alpha, const c10::BFloat16* A, MKL_INT lda, const c10::BFloat16* B, MKL_INT ldb, const float beta, float* C, MKL_INT ldc); void mkl_gemm_f16f16f32( TransposeType trans_A, TransposeType trans_B, int M, int N, int K, const float alpha, const c10::Half* A, int lda, const c10::Half* B, int ldb, const float beta, float* C, int ldc); }} // namespace at::native