tlapack/svd__qr_8hpp_source.html

//

// Copyright (c) 2025, University of Colorado Denver. All rights reserved.

//

// This file is part of <T>LAPACK.

// <T>LAPACK is free software: you can redistribute it and/or modify it under

// the terms of the BSD 3-Clause license. See the accompanying LICENSE file.


#ifndef TLAPACK_SVD_QR_HH

#define TLAPACK_SVD_QR_HH


#include "tlapack/base/utils.hpp"

#include "tlapack/blas/iamax.hpp"

#include "tlapack/blas/lartg.hpp"

#include "tlapack/blas/rot.hpp"

#include "tlapack/blas/swap.hpp"

#include "tlapack/lapack/gebrd.hpp"

#include "tlapack/lapack/singularvalues22.hpp"

#include "tlapack/lapack/svd22.hpp"


namespace tlapack {


/**
 * Computes the singular values and, optionally, the singular vectors of a
 * real bidiagonal matrix with the implicit QR algorithm (shifted sweeps, with
 * a zero-shift variant when shifting would harm relative accuracy).
 *
 * The bidiagonal matrix is given by its diagonal `d` and off-diagonal `e`.
 * All plane rotations used by the algorithm are applied to the columns of `U`
 * (if `want_u`) and to the rows of `Vt` (if `want_vt`), so the caller decides
 * what those matrices contain on entry.
 *
 * @param[in] uplo
 *      If Uplo::Lower, the input is treated as lower bidiagonal and is first
 *      rotated into upper bidiagonal form. Any other value is treated as
 *      upper bidiagonal.
 * @param[in] want_u   If true, rotations are accumulated into columns of U.
 * @param[in] want_vt  If true, rotations are accumulated into rows of Vt.
 * @param[in,out] d
 *      Real vector of size n. On entry, the diagonal of the bidiagonal
 *      matrix. On a successful return, the singular values, non-negative and
 *      sorted in decreasing order.
 * @param[in,out] e
 *      Real vector; entries e[0] .. e[n-2] are read and overwritten. On
 *      entry, the off-diagonal of the bidiagonal matrix.
 * @param[in,out] U
 *      Matrix whose columns 0 .. n-1 are updated when `want_u` is true.
 *      NOTE(review): presumably needs at least n columns - confirm with
 *      callers.
 * @param[in,out] Vt
 *      Matrix whose rows 0 .. n-1 are updated when `want_vt` is true.
 *      NOTE(review): presumably needs at least n rows - confirm with callers.
 *
 * @return 0 if all singular values were found (also for n == 0).
 * @return istop > 1 if the iteration did not converge within 30*n passes of
 *      the main loop; istop is the end (exclusive) of the block that was
 *      still active. In that case `d` is neither sign-corrected nor sorted.
 */
template <class matrix_t,
          class d_t,
          class e_t,
          enable_if_t<is_same_v<type_t<d_t>, real_type<type_t<d_t>>>, int> = 0,
          enable_if_t<is_same_v<type_t<e_t>, real_type<type_t<e_t>>>, int> = 0>

int svd_qr(Uplo uplo,
           bool want_u,
           bool want_vt,
           d_t& d,
           e_t& e,
           matrix_t& U,
           matrix_t& Vt)
{
    using idx_t = size_type<matrix_t>;
    using range = pair<idx_t, idx_t>;
    using T = type_t<matrix_t>;
    using real_t = real_type<T>;

    // constants
    const real_t one(1);
    const real_t zero(0);
    const idx_t n = size(d);
    const real_t eps = ulp<real_t>();
    const real_t unfl = safe_min<real_t>();
    // Relative tolerance multiplier: eps^(-1/8), clamped to [10, 100]
    const real_t tolmul =
        max(real_t(10.0), min(real_t(100.0), one / sqrt(sqrt(sqrt(eps)))));
    const real_t tol = tolmul * eps;

    // Quick return (this also guarantees n >= 1 for the `n - 1` bounds below)
    if (n == 0) return 0;

    // If the matrix is lower bidiagonal, apply a sequence of rotations
    // to make it upper bidiagonal.
    if (uplo == Uplo::Lower) {
        real_t c, s, r;

        for (idx_t i = 0; i < n - 1; ++i) {
            lartg(d[i], e[i], c, s, r);
            d[i] = r;
            e[i] = s * d[i + 1];
            d[i + 1] = c * d[i + 1];

            // Update singular vectors if desired
            if (want_u) {
                auto u1 = col(U, i);
                auto u2 = col(U, i + 1);
                rot(u1, u2, c, s);
            }
        }
    }

    // Upper bound on the number of passes through the main loop; deflation
    // steps count as passes too.
    idx_t itmax = 30 * n;

    //
    // Determine threshold
    //
    // sminoa is a lower-bound estimate for the smallest singular value,
    // obtained from a recurrence over the whole matrix.
    real_t sminoa = abs(d[0]);
    if (sminoa != zero) {
        auto mu = sminoa;
        for (idx_t i = 1; i < n; ++i) {
            mu = abs(d[i]) * (mu / (mu + abs(e[i - 1])));
            sminoa = min(sminoa, mu);
            if (sminoa == zero) break;
        }
    }
    sminoa = sminoa / sqrt(real_t(n));
    // Off-diagonal entries at or below thresh are set to zero (deflation)
    real_t thresh = max(tol * sminoa, (real_t(n) * unfl));

    // istart and istop determine the active block [istart, istop)
    idx_t istart = 0;
    idx_t istop = n;

    // Keep track of previous istart and istop to know when to change direction.
    // The -1 sentinels make the direction test below fire for the first block
    // (for unsigned idx_t they wrap to the largest value, which also works).
    idx_t istart_old = -1;
    idx_t istop_old = -1;

    // If true, chase bulges from top to bottom
    // If false chase bulges from bottom to top
    // This variable is reevaluated for every new subblock
    bool forwarddirection = true;

    //
    // Main loop
    //
    for (idx_t iter = 0; iter <= itmax; ++iter) {
        // Test for convergence BEFORE testing the iteration limit, so that a
        // run whose last deflation happened on pass itmax - 1 is still
        // post-processed and reported as a success.
        if (istop <= 1) {
            // All singular values have been found, exit and return 0.
            break;
        }

        if (iter == itmax) {
            // The QR algorithm failed to converge, return with error.
            return istop;
        }

        // Find active block: scan upwards from the bottom for a negligible
        // off-diagonal entry. smax collects the largest magnitude of the
        // entries that belong to the active block only, so the split test
        // comes before the update (entries d[i - 1], e[i - 1] at a split
        // lie outside the block).
        auto smax = abs(d[istop - 1]);
        for (idx_t i = istop - 1; i > istart; --i) {
            if (abs(e[i - 1]) <= thresh) {
                e[i - 1] = zero;
                istart = i;
                break;
            }
            smax = max(smax, abs(d[i - 1]));
            smax = max(smax, abs(e[i - 1]));
        }

        // A singular value has split off, reduce istop and start the loop again
        if (istart == istop - 1) {
            istop = istop - 1;
            istart = 0;
            continue;
        }

        // A 2x2 block has split off, handle separately
        if (istart + 1 == istop - 1) {
            real_t csl, snl, csr, snr, sigmn, sigmx;
            svd22(d[istart], e[istart], d[istart + 1], sigmn, sigmx, csl, snl,
                  csr, snr);
            d[istart] = sigmx;
            d[istart + 1] = sigmn;
            e[istart] = zero;

            // Update singular vectors if desired
            if (want_u) {
                auto u1 = col(U, istart);
                auto u2 = col(U, istart + 1);
                rot(u1, u2, csl, snl);
            }
            if (want_vt) {
                auto vt1 = row(Vt, istart);
                auto vt2 = row(Vt, istart + 1);
                rot(vt1, vt2, csr, snr);
            }

            istop = istop - 2;
            istart = 0;
            continue;
        }

        // Only pick a new chase direction when the active block is disjoint
        // from the previous one; chase from the larger end to the smaller.
        if (istart >= istop_old or istop <= istart_old) {
            forwarddirection = abs(d[istart]) > abs(d[istop - 1]);
        }
        istart_old = istart;
        istop_old = istop;

        //
        // Extra convergence checks
        //

        // sminl: lower-bound estimate of the smallest singular value of the
        // active block, set by the recurrence in either branch below.
        real_t sminl;
        if (forwarddirection) {
            // First apply standard test to bottom of matrix
            if (abs(e[istop - 2]) <= tol * abs(d[istop - 1])) {
                e[istop - 2] = zero;
                istop = istop - 1;
                continue;
            }
            // Now apply fancy convergence criterion using recurrence
            // relation for minimal singular value estimate
            auto mu = abs(d[istart]);
            sminl = mu;
            bool found_zero = false;
            for (idx_t i = istart; i + 1 < istop; ++i) {
                if (abs(e[i]) < tol * mu) {
                    found_zero = true;
                    e[i] = zero;
                    break;
                }
                mu = abs(d[i + 1]) * (mu / (mu + abs(e[i])));
                sminl = min(sminl, mu);
            }
            // The zeroed entry is picked up by the block search on the next
            // pass.
            if (found_zero) continue;
        }
        else {
            // First apply standard test to top of matrix
            if (abs(e[istart]) <= tol * abs(d[istart])) {
                e[istart] = zero;
                istart = istart + 1;
                continue;
            }
            // Now apply fancy convergence criterion using recurrence
            // relation for minimal singular value estimate
            auto mu = abs(d[istop - 1]);
            sminl = mu;
            bool found_zero = false;
            // i2 counts upwards so the loop is safe for unsigned idx_t;
            // i runs from istop - 2 down to istart.
            for (idx_t i2 = istart; i2 + 1 < istop; ++i2) {
                idx_t i = istop - 2 - (i2 - istart);
                if (abs(e[i]) < tol * mu) {
                    found_zero = true;
                    e[i] = zero;
                    break;
                }
                mu = abs(d[i]) * (mu / (mu + abs(e[i])));
                sminl = min(sminl, mu);
            }
            if (found_zero) continue;
        }

        // Compute shift.  First, test if shifting would ruin relative
        // accuracy, and if so set the shift to zero.
        real_t shift;
        if (real_t(n) * tol * (sminl / smax) <= max(eps, real_t(0.01) * tol)) {
            shift = zero;
        }
        else {
            real_t sstart, temp;
            if (forwarddirection) {
                // Compute the shift from 2-by-2 block at end of matrix
                sstart = abs(d[istart]);
                singularvalues22(d[istop - 2], e[istop - 2], d[istop - 1],
                                 shift, temp);
            }
            else {
                // Compute the shift from 2-by-2 block at start of matrix
                sstart = abs(d[istop - 1]);
                singularvalues22(d[istart], e[istart], d[istart + 1], shift,
                                 temp);
            }

            // Test if shift negligible, and if so set to zero
            if (sstart > zero and square(shift / sstart) < eps) shift = zero;
        }

        if (shift == zero) {
            // If shift = 0, do simplified QR iteration, this is better for the
            // relative accuracy of small singular values
            if (forwarddirection) {
                real_t r, cs, sn, oldcs, oldsn;
                cs = one;
                sn = zero;
                oldcs = one;
                oldsn = zero;
                for (idx_t i = istart; i < istop - 1; ++i) {
                    lartg(d[i] * cs, e[i], cs, sn, r);
                    if (i > istart) e[i - 1] = oldsn * r;
                    lartg(oldcs * r, d[i + 1] * sn, oldcs, oldsn, d[i]);

                    // Update singular vectors if desired
                    if (want_u) {
                        auto u1 = col(U, i);
                        auto u2 = col(U, i + 1);
                        rot(u1, u2, oldcs, oldsn);
                    }
                    if (want_vt) {
                        auto vt1 = row(Vt, i);
                        auto vt2 = row(Vt, i + 1);
                        rot(vt1, vt2, cs, sn);
                    }
                }
                real_t h = d[istop - 1] * cs;
                d[istop - 1] = h * oldcs;
                e[istop - 2] = h * oldsn;
            }
            else {
                real_t r, cs, sn, oldcs, oldsn;
                cs = one;
                sn = zero;
                oldcs = one;
                oldsn = zero;
                for (idx_t i = istop - 1; i > istart; --i) {
                    lartg(d[i] * cs, e[i - 1], cs, sn, r);
                    if (i < istop - 1) e[i] = oldsn * r;
                    lartg(oldcs * r, d[i - 1] * sn, oldcs, oldsn, d[i]);

                    // Update singular vectors if desired
                    // (roles of the two rotations are exchanged with respect
                    // to the forward sweep, and the sines change sign)
                    if (want_u) {
                        auto u1 = col(U, i - 1);
                        auto u2 = col(U, i);
                        rot(u1, u2, cs, -sn);
                    }
                    if (want_vt) {
                        auto vt1 = row(Vt, i - 1);
                        auto vt2 = row(Vt, i);
                        rot(vt1, vt2, oldcs, -oldsn);
                    }
                }
                real_t h = d[istart] * cs;
                d[istart] = h * oldcs;
                e[istart] = h * oldsn;
            }
        }
        else {
            // Use nonzero shift

            if (forwarddirection) {
                // d[istart] is nonzero here: a zero would have given
                // sminl == 0 and therefore shift == 0 above.
                real_t f = (abs(d[istart]) - shift) *
                           (real_t(sgn(d[istart])) + shift / d[istart]);
                real_t g = e[istart];
                for (idx_t i = istart; i < istop - 1; ++i) {
                    real_t r, csl, snl, csr, snr;
                    // Right rotation: chase the bulge out of row i
                    lartg(f, g, csr, snr, r);
                    if (i > istart) e[i - 1] = r;
                    f = csr * d[i] + snr * e[i];
                    e[i] = csr * e[i] - snr * d[i];
                    g = snr * d[i + 1];
                    d[i + 1] = csr * d[i + 1];

                    // Left rotation: chase the bulge out of column i
                    lartg(f, g, csl, snl, r);
                    d[i] = r;
                    f = csl * e[i] + snl * d[i + 1];
                    d[i + 1] = csl * d[i + 1] - snl * e[i];
                    if (i + 1 < istop - 1) {
                        g = snl * e[i + 1];
                        e[i + 1] = csl * e[i + 1];
                    }

                    // Update singular vectors if desired
                    if (want_u) {
                        auto u1 = col(U, i);
                        auto u2 = col(U, i + 1);
                        rot(u1, u2, csl, snl);
                    }
                    if (want_vt) {
                        auto vt1 = row(Vt, i);
                        auto vt2 = row(Vt, i + 1);
                        rot(vt1, vt2, csr, snr);
                    }
                }
                e[istop - 2] = f;
            }
            else {
                // d[istop - 1] is nonzero here for the same reason as in the
                // forward sweep.
                real_t f = (abs(d[istop - 1]) - shift) *
                           (real_t(sgn(d[istop - 1])) + shift / d[istop - 1]);
                real_t g = e[istop - 2];
                for (idx_t i = istop - 1; i > istart; --i) {
                    real_t r, csl, snl, csr, snr;
                    lartg(f, g, csr, snr, r);
                    if (i < istop - 1) e[i] = r;
                    f = csr * d[i] + snr * e[i - 1];
                    e[i - 1] = csr * e[i - 1] - snr * d[i];
                    g = snr * d[i - 1];
                    d[i - 1] = csr * d[i - 1];

                    lartg(f, g, csl, snl, r);
                    d[i] = r;
                    f = csl * e[i - 1] + snl * d[i - 1];
                    d[i - 1] = csl * d[i - 1] - snl * e[i - 1];
                    if (i > istart + 1) {
                        g = snl * e[i - 2];
                        e[i - 2] = csl * e[i - 2];
                    }

                    // Update singular vectors if desired
                    if (want_u) {
                        auto u1 = col(U, i - 1);
                        auto u2 = col(U, i);
                        rot(u1, u2, csr, -snr);
                    }
                    if (want_vt) {
                        auto vt1 = row(Vt, i - 1);
                        auto vt2 = row(Vt, i);
                        rot(vt1, vt2, csl, -snl);
                    }
                }
                e[istart] = f;
            }
        }
    }

    // All singular values converged, so make them positive
    // (the sign is moved into the matching row of Vt)
    for (idx_t i = 0; i < n; ++i) {
        if (d[i] < zero) {
            d[i] = -d[i];
            if (want_vt) {
                auto vt1 = row(Vt, i);
                scal(-one, vt1);
            }
        }
    }

    // Sort the singular values into decreasing order.
    // Selection sort: move the largest remaining value to position i and
    // apply the same permutation to the columns of U and the rows of Vt.
    for (idx_t i = 0; i < n - 1; ++i) {
        auto d2 = slice(d, range{i, n});
        idx_t imax = i + iamax(d2);
        if (imax != i) {
            std::swap(d[imax], d[i]);

            if (want_u) {
                auto u1 = col(U, imax);
                auto u2 = col(U, i);
                tlapack::swap(u1, u2);
            }
            if (want_vt) {
                auto vt1 = row(Vt, imax);
                auto vt2 = row(Vt, i);
                tlapack::swap(vt1, vt2);
            }
        }
    }

    return 0;
}


}  // namespace tlapack


#endif  // TLAPACK_SVD_QR_HH

tlapack::Uplo
Uplo
Definition types.hpp:50

utils.hpp

tlapack::sgn
constexpr int sgn(const T &val)
Type-safe sgn function.
Definition utils.hpp:109

iamax.hpp

rot.hpp

swap.hpp

gebrd.hpp

tlapack::svd22
void svd22(const T &f, const T &g, const T &h, T &ssmin, T &ssmax, T &csl, T &snl, T &csr, T &snr)
Computes the singular value decomposition of a 2-by-2 real triangular matrix.
Definition svd22.hpp:55

tlapack::singularvalues22
void singularvalues22(const T &f, const T &g, const T &h, T &ssmin, T &ssmax)
Computes the singular values of a 2-by-2 real triangular matrix.
Definition singularvalues22.hpp:40

tlapack::rot
void rot(vectorX_t &x, vectorY_t &y, const c_type &c, const s_type &s)
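Apply plane rotation: $\begin{bmatrix} x^T \\ y^T \end{bmatrix} := \begin{bmatrix} c & s \\ -\bar{s} & c \end{bmatrix} \begin{bmatrix} x^T \\ y^T \end{bmatrix}$.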
Definition rot.hpp:44

tlapack::swap
void swap(vectorX_t &x, vectorY_t &y)
Swap vectors, $x \leftrightarrow y$.
Definition swap.hpp:31

tlapack::iamax
size_type< vector_t > iamax(const vector_t &x, const IamaxOpts< abs_f > &opts)
Return $\arg\max_{i=0}^{n-1} |x_i|$, the index of the entry of $x$ with the largest absolute value.
Definition iamax.hpp:234

tlapack::lartg
void lartg(const T &a, const T &b, real_type< T > &c, T &s, T &r)
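Construct plane rotation that eliminates b, such that: $\begin{bmatrix} c & s \\ -\bar{s} & c \end{bmatrix} \begin{bmatrix} a \\ b \end{bmatrix} = \begin{bmatrix} r \\ 0 \end{bmatrix}$.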
Definition lartg.hpp:38

tlapack::scal
void scal(const alpha_t &alpha, vector_t &x)
Scale vector by constant, $x := \alpha x$.
Definition scal.hpp:30

tlapack::svd_qr
int svd_qr(Uplo uplo, bool want_u, bool want_vt, d_t &d, e_t &e, matrix_t &U, matrix_t &Vt)
Computes the singular values and, optionally, the right and/or left singular vectors from the singular value decomposition (SVD) of a real bidiagonal matrix.
Definition svd_qr.hpp:85

lartg.hpp

tlapack::real_type
typename traits::real_type_traits< Types..., int >::type real_type
The common real type of the list of types.
Definition scalar_type_traits.hpp:113

singularvalues22.hpp

svd22.hpp