11#ifndef TLAPACK_BLAS_HEMM_HH
12#define TLAPACK_BLAS_HEMM_HH
57 class T = type_t<matrixC_t>,
58 disable_if_allow_optblas_t<pair<matrixA_t, T>,
62 pair<beta_t, T> > = 0>
77 const idx_t m = nrows(
B);
78 const idx_t n = ncols(
B);
83 uplo != Uplo::General);
89 if (
side == Side::Left) {
90 if (
uplo != Uplo::Lower) {
92 for (idx_t j = 0; j < n; ++j) {
93 for (idx_t i = 0; i < m; ++i) {
98 for (idx_t
k = 0;
k < i; ++
k) {
109 for (idx_t j = 0; j < n; ++j) {
110 for (idx_t i = m - 1; i != idx_t(-1); --i) {
115 for (idx_t
k = i + 1;
k < m; ++
k) {
129 if (
uplo != Uplo::Lower) {
131 for (idx_t j = 0; j < n; ++j) {
134 for (idx_t i = 0; i < m; ++i)
138 for (idx_t
k = 0;
k < j; ++
k) {
140 for (idx_t i = 0; i < m; ++i)
144 for (idx_t
k = j + 1;
k < n; ++
k) {
146 for (idx_t i = 0; i < m; ++i)
153 for (idx_t j = 0; j < n; ++j) {
156 for (idx_t i = 0; i < m; ++i)
160 for (idx_t
k = 0;
k < j; ++
k) {
162 for (idx_t i = 0; i < m; ++i)
166 for (idx_t
k = j + 1;
k < n; ++
k) {
168 for (idx_t i = 0; i < m; ++i)
176#ifdef TLAPACK_USE_LAPACKPP
196 class T = type_t<matrixC_t>,
197 enable_if_allow_optblas_t<pair<matrixA_t, T>,
201 pair<beta_t, T> > = 0>
211 auto A_ = legacy_matrix(A);
212 auto B_ = legacy_matrix(B);
213 auto C_ = legacy_matrix(C);
216 constexpr Layout L = layout<matrixC_t>;
217 const auto& m = C_.m;
218 const auto& n = C_.n;
221 if (alpha == alpha_t(0))
223 -3,
"Infs and NaNs in A or B will not propagate to C on output");
224 if (beta == beta_t(0) && !is_same_v<beta_t, StrongZero>)
227 "Infs and NaNs in C on input will not propagate to C on output");
229 return ::blas::hemm((::blas::Layout)L, (::blas::Side)side,
230 (::blas::Uplo)uplo, m, n, alpha, A_.ptr, A_.ldim,
231 B_.ptr, B_.ldim, (T)beta, C_.ptr, C_.ldim);
Side
Definition types.hpp:271
Uplo
Definition types.hpp:50
constexpr real_type< T > real(const T &x) noexcept
Extends std::real() to real datatypes.
Definition utils.hpp:71
constexpr T conj(const T &x) noexcept
Extends std::conj() to real datatypes.
Definition utils.hpp:100
#define TLAPACK_SCALAR
Macro for tlapack::concepts::Scalar compatible with C++17.
Definition concepts.hpp:915
#define TLAPACK_LEGACY_MATRIX
Macro for tlapack::concepts::LegacyMatrix compatible with C++17.
Definition concepts.hpp:951
#define TLAPACK_MATRIX
Macro for tlapack::concepts::Matrix compatible with C++17.
Definition concepts.hpp:896
void hemm(Side side, Uplo uplo, const alpha_t &alpha, const matrixA_t &A, const matrixB_t &B, const beta_t &beta, matrixC_t &C)
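Hermitian matrix-matrix multiply: $C := \alpha A B + \beta C$ (side = Left) or $C := \alpha B A + \beta C$ (side = Right), where $\alpha$ and $\beta$ are scalars, $A$ is a Hermitian matrix, and $B$ and $C$ are m-by-n matrices.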
Definition hemm.hpp:63
#define tlapack_check_false(cond)
Throw an error if cond is true.
Definition exceptionHandling.hpp:113
#define tlapack_warning(info, detailedInfo)
Warning handler.
Definition exceptionHandling.hpp:156
Concept for types that represent tlapack::Side.
Concept for types that represent tlapack::Uplo.
typename traits::real_type_traits< Types..., int >::type real_type
The common real type of the list of types.
Definition scalar_type_traits.hpp:113
Strong zero type.
Definition StrongZero.hpp:43