<T>LAPACK 0.1.1
C++ Template Linear Algebra PACKage
Loading...
Searching...
No Matches
potrf_blocked_right_looking.hpp
Go to the documentation of this file.
1
5//
6// Copyright (c) 2025, University of Colorado Denver. All rights reserved.
7//
8// This file is part of <T>LAPACK.
9// <T>LAPACK is free software: you can redistribute it and/or modify it under
10// the terms of the BSD 3-Clause license. See the accompanying LICENSE file.
11
12#ifndef TLAPACK_POTRF_BLOCKED_RL_HH
13#define TLAPACK_POTRF_BLOCKED_RL_HH
14
16#include "tlapack/blas/herk.hpp"
17#include "tlapack/blas/trsm.hpp"
20
21namespace tlapack {
22
60template <TLAPACK_UPLO uplo_t, TLAPACK_SMATRIX matrix_t>
62{
63 using T = type_t<matrix_t>;
64 using real_t = real_type<T>;
65 using idx_t = size_type<matrix_t>;
66 using range = pair<idx_t, idx_t>;
67
68 // Constants
69 const real_t one(1);
70 const idx_t n = nrows(A);
71 const idx_t nb = opts.nb;
72
73 // check arguments
74 tlapack_check(uplo == Uplo::Lower || uplo == Uplo::Upper);
75 tlapack_check(nrows(A) == ncols(A));
76
77 // Quick return
78 if (n <= 0) return 0;
79
80 // Unblocked code
81 else if (nb >= n)
82 return potf2(uplo, A);
83
84 // Blocked code
85 else {
86 if (uplo == Uplo::Upper) {
87 for (idx_t j = 0; j < n; j += nb) {
88 idx_t jb = min(nb, n - j);
89
90 // Define AJJ
91 auto AJJ = slice(A, range{j, j + jb}, range{j, j + jb});
92
93 int info = potf2(UPPER_TRIANGLE, AJJ);
94 if (info != 0) {
96 info + j,
97 "The leading minor of the reported order is not "
98 "positive definite,"
99 " and the factorization could not be completed.");
100 return info + j;
101 }
102
103 if (j + jb < n) {
104 auto B = slice(A, range{j, j + jb}, range{j + jb, n});
105 auto C = slice(A, range{j + jb, n}, range{j + jb, n});
106
107 trsm(LEFT_SIDE, UPPER_TRIANGLE, CONJ_TRANS, NON_UNIT_DIAG,
108 one, AJJ, B);
109 herk(UPPER_TRIANGLE, CONJ_TRANS, -one, B, one, C);
110 }
111 }
112 }
113 else {
114 for (idx_t j = 0; j < n; j += nb) {
115 idx_t jb = min(nb, n - j);
116
117 // Define AJJ
118 auto AJJ = slice(A, range{j, j + jb}, range{j, j + jb});
119
120 int info = potf2(LOWER_TRIANGLE, AJJ);
121 if (info != 0) {
123 info + j,
124 "The leading minor of the reported order is not "
125 "positive definite,"
126 " and the factorization could not be completed.");
127 return info + j;
128 }
129
130 if (j + jb < n) {
131 auto B = slice(A, range{j + jb, n}, range{j, j + jb});
132 auto C = slice(A, range{j + jb, n}, range{j + jb, n});
133
134 trsm(RIGHT_SIDE, LOWER_TRIANGLE, CONJ_TRANS, NON_UNIT_DIAG,
135 one, AJJ, B);
136 herk(LOWER_TRIANGLE, NO_TRANS, -one, B, one, C);
137 }
138 }
139 }
140
141 return 0;
142 }
143}
144
145} // namespace tlapack
146
147#endif // TLAPACK_POTRF_BLOCKED_RL_HH
void herk(Uplo uplo, Op trans, const alpha_t &alpha, const matrixA_t &A, const beta_t &beta, matrixC_t &C)
Hermitian rank-k update:
Definition herk.hpp:68
void trsm(Side side, Uplo uplo, Op trans, Diag diag, const alpha_t &alpha, const matrixA_t &A, matrixB_t &B)
Solve the triangular matrix-vector equation.
Definition trsm.hpp:76
int potrf_rl(uplo_t uplo, matrix_t &A, const BlockedCholeskyOpts &opts={})
Computes the Cholesky factorization of a Hermitian positive definite matrix A using a blocked algorit...
Definition potrf_blocked_right_looking.hpp:61
int potf2(uplo_t uplo, matrix_t &A)
Computes the Cholesky factorization of a Hermitian positive definite matrix A using a level-2 algorit...
Definition potf2.hpp:58
#define tlapack_check(cond)
Throw an error if cond is false.
Definition exceptionHandling.hpp:98
#define tlapack_error(info, detailedInfo)
Error handler.
Definition exceptionHandling.hpp:142
Computes the Cholesky factorization of a Hermitian positive definite matrix A using a level-2 algorit...
Computes the Cholesky factorization of a Hermitian positive definite matrix A using a blocked algorit...
typename traits::real_type_traits< Types..., int >::type real_type
The common real type of the list of types.
Definition scalar_type_traits.hpp:113
Definition potrf_blocked.hpp:22