CubbyFlow/_s_v_d-_impl_8hpp_source.html

// This code is based on Jet framework.

// Copyright (c) 2018 Doyub Kim

// CubbyFlow is voxel-based fluid simulation engine for computer games.

// Copyright (c) 2020 CubbyFlow Team

// Core Part: Chris Ohk, Junwoo Hwang, Jihong Sin, Seungwoo Yoo

// AI Part: Dongheon Cho, Minseo Kim

// We are making our contributions/submissions to this project solely in our

// personal capacity and are not conveying any rights to any intellectual

// property of any third parties.


#ifndef CUBBYFLOW_SVD_IMPL_HPP

#define CUBBYFLOW_SVD_IMPL_HPP


#include <algorithm>
#include <cmath>
#include <limits>
#include <stdexcept>


namespace CubbyFlow

{

namespace Internal

{

// Transfers the sign of \p b onto the magnitude of \p a.
//
// Yields |a| when \p b (viewed as a double) compares greater than or equal to
// zero and -|a| in every other case.
template <typename T>
T Sign(T a, T b)
{
    const auto magnitude = std::fabs(a);

    if (static_cast<double>(b) >= 0.0)
    {
        return magnitude;
    }

    return -magnitude;
}


// Evaluates sqrt(a^2 + b^2) without squaring the larger operand.
//
// The larger magnitude is factored out so that only the ratio of the smaller
// to the larger magnitude gets squared. When neither magnitude is greater
// than zero the result is 0.
template <typename T>
T Pythag(T a, T b)
{
    const T absA = std::fabs(a);
    const T absB = std::fabs(b);

    if (absA > absB)
    {
        const T ratio = absB / absA;
        return absA * std::sqrt(1 + ratio * ratio);
    }

    if (absB > 0)
    {
        const T ratio = absA / absB;
        return absB * std::sqrt(1 + ratio * ratio);
    }

    return 0;
}


}  // namespace Internal


// Singular value decomposition (SVD) of a dynamically-sized matrix.
//
// The input is copied into \p u, reduced to bi-diagonal form with Householder
// reflections, and the bi-diagonal form is then diagonalized with shifted QR
// sweeps. The reflections and rotations are accumulated into \p u and \p v.
// NOTE(review): the outputs are expected to satisfy
// a = u * diag(w) * transpose(v); confirm against the declaration's docs.
//
// \param a Input matrix with m rows and n columns; m must be >= n.
// \param u Output. Overwritten with a copy of \p a and transformed in place.
// \param w Output. Resized to n entries and filled with the singular values.
//          Negative values are flipped to be non-negative; no ordering is
//          imposed.
// \param v Output. Resized to n x n.
//
// \throws std::invalid_argument when \p a has fewer rows than columns.
// \throws std::logic_error when a singular value has not converged by the
//         last allowed QR sweep.
//
// NOTE(review): all "is this zero?" decisions in this overload compare against
// the absolute value std::numeric_limits<double>::epsilon() regardless of T or
// of the magnitude of the matrix, whereas the fixed-size overload uses exact
// and norm-relative tests. Confirm that this difference is intended.
template <typename T>
void SVD(const MatrixMxN<T>& a, MatrixMxN<T>& u, VectorN<T>& w, MatrixMxN<T>& v)
{
    const int m = static_cast<int>(a.GetRows());
    const int n = static_cast<int>(a.GetCols());

    // Number of QR sweeps allowed per singular value.
    constexpr int maxIterations = 30;

    // True when |value| is at least the double machine epsilon.
    const auto isSignificant = [](T value) {
        return std::fabs(static_cast<double>(value)) >=
               std::numeric_limits<double>::epsilon();
    };

    // True when |value| is at most the double machine epsilon.
    const auto isNegligible = [](T value) {
        return std::fabs(static_cast<double>(value)) <=
               std::numeric_limits<double>::epsilon();
    };

    int i = 0, j = 0, jj = 0, k = 0, l = 0, nm = 0;
    T c = 0, f = 0, h = 0, s = 0, x = 0, y = 0, z = 0;
    T g = 0, scale = 0;

    if (m < n)
    {
        throw std::invalid_argument{
            "Number of rows of input matrix must greater than or equal to "
            "columns."
        };
    }

    // Prepare workspace. rv1 holds the off-diagonal of the bi-diagonal form.
    VectorN<T> rv1(n, T{});
    u = a;
    w.Resize(n, 0);
    v.Resize(n, n, 0);

    // Householder reduction to bi-diagonal form
    for (i = 0; i < n; i++)
    {
        // left-hand reduction
        l = i + 1;
        rv1[i] = scale * g;
        g = s = scale = 0;

        if (i < m)
        {
            for (k = i; k < m; k++)
            {
                scale += std::fabs(u(k, i));
            }

            if (isSignificant(scale))
            {
                // Normalize the column by its 1-norm before squaring.
                for (k = i; k < m; k++)
                {
                    u(k, i) /= scale;
                    s += u(k, i) * u(k, i);
                }

                f = u(i, i);
                g = -Internal::Sign(std::sqrt(s), f);
                h = f * g - s;
                u(i, i) = f - g;

                if (i != n - 1)
                {
                    // Apply the reflection to the remaining columns.
                    for (j = l; j < n; j++)
                    {
                        s = 0;

                        for (k = i; k < m; k++)
                        {
                            s += u(k, i) * u(k, j);
                        }

                        f = s / h;

                        for (k = i; k < m; k++)
                        {
                            u(k, j) += f * u(k, i);
                        }
                    }
                }

                // Undo the normalization.
                for (k = i; k < m; k++)
                {
                    u(k, i) *= scale;
                }
            }
        }

        w[i] = scale * g;

        // right-hand reduction
        g = s = scale = 0;

        if (i < m && i != n - 1)
        {
            for (k = l; k < n; k++)
            {
                scale += std::fabs(u(i, k));
            }

            if (isSignificant(scale))
            {
                for (k = l; k < n; k++)
                {
                    u(i, k) /= scale;
                    s += u(i, k) * u(i, k);
                }

                f = u(i, l);
                g = -Internal::Sign(std::sqrt(s), f);
                h = f * g - s;
                u(i, l) = f - g;

                // rv1[l..n) is used as scratch here; rv1[l] is overwritten
                // with its final value at the top of the next iteration.
                for (k = l; k < n; k++)
                {
                    rv1[k] = static_cast<T>(u(i, k)) / h;
                }

                if (i != m - 1)
                {
                    // Apply the reflection to the remaining rows.
                    for (j = l; j < m; j++)
                    {
                        s = 0;

                        for (k = l; k < n; k++)
                        {
                            s += u(j, k) * u(i, k);
                        }

                        for (k = l; k < n; k++)
                        {
                            u(j, k) += s * rv1[k];
                        }
                    }
                }

                for (k = l; k < n; k++)
                {
                    u(i, k) *= scale;
                }
            }
        }
    }

    // accumulate the right-hand transformation
    for (i = n - 1; i >= 0; i--)
    {
        if (i < n - 1)
        {
            if (isSignificant(g))
            {
                // Two separate divisions to avoid underflow of the product.
                for (j = l; j < n; j++)
                {
                    v(j, i) = ((u(i, j) / u(i, l)) / g);
                }

                for (j = l; j < n; j++)
                {
                    s = 0;

                    for (k = l; k < n; k++)
                    {
                        s += u(i, k) * v(k, j);
                    }

                    for (k = l; k < n; k++)
                    {
                        v(k, j) += s * v(k, i);
                    }
                }
            }

            for (j = l; j < n; j++)
            {
                v(i, j) = v(j, i) = 0;
            }
        }

        v(i, i) = 1;
        g = rv1[i];
        l = i;
    }

    // accumulate the left-hand transformation
    for (i = n - 1; i >= 0; i--)
    {
        l = i + 1;
        g = w[i];

        if (i < n - 1)
        {
            for (j = l; j < n; j++)
            {
                u(i, j) = 0;
            }
        }

        if (isSignificant(g))
        {
            g = 1 / g;

            if (i != n - 1)
            {
                for (j = l; j < n; j++)
                {
                    s = 0;

                    for (k = l; k < m; k++)
                    {
                        s += u(k, i) * u(k, j);
                    }

                    f = (s / u(i, i)) * g;

                    for (k = i; k < m; k++)
                    {
                        u(k, j) += f * u(k, i);
                    }
                }
            }

            for (j = i; j < m; j++)
            {
                u(j, i) = u(j, i) * g;
            }
        }
        else
        {
            for (j = i; j < m; j++)
            {
                u(j, i) = 0;
            }
        }

        ++u(i, i);
    }

    // diagonalize the bi-diagonal form
    for (k = n - 1; k >= 0; k--)
    {
        // loop over singular values
        for (int its = 0; its < maxIterations; its++)
        {
            // loop over allowed iterations
            int flag = 1;

            // rv1[0] is zero whenever this scan runs (it starts at zero and
            // rv1[l] is reset after every sweep), so the scan stops at l == 0
            // at the latest, before w[nm] would be read with nm == -1.
            for (l = k; l >= 0; l--)
            {
                // test for splitting
                nm = l - 1;

                if (isNegligible(rv1[l]))
                {
                    flag = 0;
                    break;
                }

                if (isNegligible(w[nm]))
                {
                    break;
                }
            }

            if (flag)
            {
                // cancellation of rv1[l] when l > 0
                c = 0;
                s = 1;

                for (i = l; i <= k; i++)
                {
                    f = s * rv1[i];

                    // Rotate only while f is still non-negligible. The
                    // previous test was inverted: it rotated when f was
                    // already ~0 (and could divide by h == 0) and skipped the
                    // rotation when it was needed.
                    if (!isNegligible(f))
                    {
                        g = w[i];
                        h = Internal::Pythag(f, g);
                        w[i] = static_cast<T>(h);
                        h = 1 / h;
                        c = g * h;
                        s = -f * h;

                        for (j = 0; j < m; j++)
                        {
                            y = u(j, nm);
                            z = u(j, i);
                            u(j, nm) = y * c + z * s;
                            u(j, i) = z * c - y * s;
                        }
                    }
                }
            }

            z = w[k];

            if (l == k)
            {
                // convergence
                if (z < 0)
                {
                    // make singular value nonnegative
                    w[k] = -z;

                    for (j = 0; j < n; j++)
                    {
                        v(j, k) = -v(j, k);
                    }
                }

                break;
            }

            // Still not converged on the last allowed sweep. The previous
            // test (its >= 30) could never be true inside this loop, so
            // non-convergence went unreported.
            if (its == maxIterations - 1)
            {
                throw std::logic_error{ "No convergence after 30 iterations" };
            }

            // shift from bottom 2 x 2 minor
            x = w[l];
            nm = k - 1;
            y = w[nm];
            g = rv1[nm];
            h = rv1[k];
            f = ((y - z) * (y + z) + (g - h) * (g + h)) / (2 * h * y);
            g = Internal::Pythag(f, static_cast<T>(1));
            f = ((x - z) * (x + z) +
                 h * ((y / (f + Internal::Sign(g, f))) - h)) /
                x;

            // next QR transformation
            c = s = 1;

            for (j = l; j <= nm; j++)
            {
                i = j + 1;
                g = rv1[i];
                y = w[i];
                h = s * g;
                g = c * g;
                z = Internal::Pythag(f, h);
                rv1[j] = z;
                c = f / z;
                s = h / z;
                f = x * c + g * s;
                g = g * c - x * s;
                h = y * s;
                y = y * c;

                // Rotate columns j and i of v.
                for (jj = 0; jj < n; jj++)
                {
                    x = v(jj, j);
                    z = v(jj, i);
                    v(jj, j) = x * c + z * s;
                    v(jj, i) = z * c - x * s;
                }

                z = Internal::Pythag(f, h);
                w[j] = z;

                // When z is negligible the previous c and s are reused.
                if (isSignificant(z))
                {
                    z = 1 / z;
                    c = f * z;
                    s = h * z;
                }

                f = (c * g) + (s * y);
                x = (c * y) - (s * g);

                // Rotate columns j and i of u.
                for (jj = 0; jj < m; jj++)
                {
                    y = u(jj, j);
                    z = u(jj, i);
                    u(jj, j) = y * c + z * s;
                    u(jj, i) = z * c - y * s;
                }
            }

            rv1[l] = 0;
            rv1[k] = f;
            w[k] = x;
        }
    }
}


// Singular value decomposition (SVD) of a fixed-size matrix.
//
// The input is copied into \p u, reduced to bi-diagonal form with Householder
// reflections, and the bi-diagonal form is then diagonalized with shifted QR
// sweeps. The reflections and rotations are accumulated into \p u and \p v.
// NOTE(review): the outputs are expected to satisfy
// a = u * diag(w) * transpose(v); confirm against the declaration's docs.
//
// \tparam T Element type.
// \tparam M Number of rows; must be >= N (checked at compile time).
// \tparam N Number of columns.
//
// \param a Input M x N matrix.
// \param u Output. Overwritten with a copy of \p a and transformed in place.
// \param w Output. Reset and filled with the N singular values. Negative
//          values are flipped to be non-negative; no ordering is imposed.
// \param v Output. Reset and filled as an N x N matrix.
//
// \throws std::logic_error when a singular value has not converged by the
//         last allowed QR sweep.
template <typename T, size_t M, size_t N>
void SVD(const Matrix<T, M, N>& a, Matrix<T, M, N>& u, Vector<T, N>& w,
         Matrix<T, N, N>& v)
{
    static_assert(M >= N,
                  "Number of rows of input matrix must greater than or equal "
                  "to columns.");

    const int m = static_cast<int>(M);
    const int n = static_cast<int>(N);

    // Number of QR sweeps allowed per singular value.
    constexpr int maxIterations = 30;

    int i = 0, its = 0, j = 0, jj = 0, k = 0, l = 0, nm = 0;
    T c = 0, f = 0, h = 0, s = 0, x = 0, y = 0, z = 0;
    // anorm tracks the largest |w[i]| + |rv1[i]| seen during the reduction and
    // is the reference magnitude for the "negligible" tests further down.
    T anorm = 0, g = 0, scale = 0;

    // Prepare workspace. rv1 holds the off-diagonal of the bi-diagonal form;
    // every entry is assigned in the reduction loop before it is read.
    Vector<T, N> rv1;
    u = a;
    w = Vector<T, N>{};
    v = Matrix<T, N, N>{};

    // Householder reduction to bi-diagonal form
    for (i = 0; i < n; i++)
    {
        // left-hand reduction
        l = i + 1;
        rv1[i] = scale * g;
        g = s = scale = 0;

        if (i < m)
        {
            for (k = i; k < m; k++)
            {
                scale += std::fabs(u(k, i));
            }

            if (scale)
            {
                // Normalize the column by its 1-norm before squaring.
                for (k = i; k < m; k++)
                {
                    u(k, i) /= scale;
                    s += u(k, i) * u(k, i);
                }

                f = u(i, i);
                g = -Internal::Sign(std::sqrt(s), f);
                h = f * g - s;
                u(i, i) = f - g;

                if (i != n - 1)
                {
                    // Apply the reflection to the remaining columns.
                    for (j = l; j < n; j++)
                    {
                        s = 0;

                        for (k = i; k < m; k++)
                        {
                            s += u(k, i) * u(k, j);
                        }

                        f = s / h;

                        for (k = i; k < m; k++)
                        {
                            u(k, j) += f * u(k, i);
                        }
                    }
                }

                // Undo the normalization.
                for (k = i; k < m; k++)
                {
                    u(k, i) *= scale;
                }
            }
        }

        w[i] = scale * g;

        // right-hand reduction
        g = s = scale = 0;

        if (i < m && i != n - 1)
        {
            for (k = l; k < n; k++)
            {
                scale += std::fabs(u(i, k));
            }

            if (scale)
            {
                for (k = l; k < n; k++)
                {
                    u(i, k) /= scale;
                    s += u(i, k) * u(i, k);
                }

                f = u(i, l);
                g = -Internal::Sign(std::sqrt(s), f);
                h = f * g - s;
                u(i, l) = f - g;

                // rv1[l..n) is used as scratch here; rv1[l] is overwritten
                // with its final value at the top of the next iteration.
                for (k = l; k < n; k++)
                {
                    rv1[k] = static_cast<T>(u(i, k)) / h;
                }

                if (i != m - 1)
                {
                    // Apply the reflection to the remaining rows.
                    for (j = l; j < m; j++)
                    {
                        s = 0;

                        for (k = l; k < n; k++)
                        {
                            s += u(j, k) * u(i, k);
                        }

                        for (k = l; k < n; k++)
                        {
                            u(j, k) += s * rv1[k];
                        }
                    }
                }

                for (k = l; k < n; k++)
                {
                    u(i, k) *= scale;
                }
            }
        }

        anorm = std::max(anorm,
                         (std::fabs(static_cast<T>(w[i])) + std::fabs(rv1[i])));
    }

    // accumulate the right-hand transformation
    for (i = n - 1; i >= 0; i--)
    {
        if (i < n - 1)
        {
            if (g)
            {
                // Two separate divisions to avoid underflow of the product.
                for (j = l; j < n; j++)
                {
                    v(j, i) = ((u(i, j) / u(i, l)) / g);
                }

                for (j = l; j < n; j++)
                {
                    s = 0;

                    for (k = l; k < n; k++)
                    {
                        s += u(i, k) * v(k, j);
                    }

                    for (k = l; k < n; k++)
                    {
                        v(k, j) += s * v(k, i);
                    }
                }
            }

            for (j = l; j < n; j++)
            {
                v(i, j) = v(j, i) = 0;
            }
        }

        v(i, i) = 1;
        g = rv1[i];
        l = i;
    }

    // accumulate the left-hand transformation
    for (i = n - 1; i >= 0; i--)
    {
        l = i + 1;
        g = w[i];

        if (i < n - 1)
        {
            for (j = l; j < n; j++)
            {
                u(i, j) = 0;
            }
        }

        if (g)
        {
            g = 1 / g;

            if (i != n - 1)
            {
                for (j = l; j < n; j++)
                {
                    s = 0;

                    for (k = l; k < m; k++)
                    {
                        s += u(k, i) * u(k, j);
                    }

                    f = (s / u(i, i)) * g;

                    for (k = i; k < m; k++)
                    {
                        u(k, j) += f * u(k, i);
                    }
                }
            }

            for (j = i; j < m; j++)
            {
                u(j, i) = u(j, i) * g;
            }
        }
        else
        {
            for (j = i; j < m; j++)
            {
                u(j, i) = 0;
            }
        }

        ++u(i, i);
    }

    // diagonalize the bi-diagonal form
    for (k = n - 1; k >= 0; k--)
    {
        // loop over singular values
        for (its = 0; its < maxIterations; its++)
        {
            // loop over allowed iterations
            int flag = 1;

            // "x + anorm == anorm" means x is lost to rounding next to anorm.
            // rv1[0] is zero whenever this scan runs (it is assigned zero in
            // the reduction and rv1[l] is reset after every sweep), so the
            // scan stops at l == 0 at the latest, before w[nm] would be read
            // with nm == -1.
            for (l = k; l >= 0; l--)
            {
                // test for splitting
                nm = l - 1;

                if (std::fabs(rv1[l]) + anorm == anorm)
                {
                    flag = 0;
                    break;
                }

                if (std::fabs(static_cast<T>(w[nm])) + anorm == anorm)
                {
                    break;
                }
            }

            if (flag)
            {
                // cancellation of rv1[l] when l > 0
                c = 0;
                s = 1;

                for (i = l; i <= k; i++)
                {
                    f = s * rv1[i];

                    // Rotate only while f is still non-negligible.
                    if (std::fabs(f) + anorm != anorm)
                    {
                        g = w[i];
                        h = Internal::Pythag(f, g);
                        w[i] = static_cast<T>(h);
                        h = 1 / h;
                        c = g * h;
                        s = -f * h;

                        for (j = 0; j < m; j++)
                        {
                            y = u(j, nm);
                            z = u(j, i);
                            u(j, nm) = y * c + z * s;
                            u(j, i) = z * c - y * s;
                        }
                    }
                }
            }

            z = w[k];

            if (l == k)
            {
                // convergence
                if (z < 0)
                {
                    // make singular value nonnegative
                    w[k] = -z;

                    for (j = 0; j < n; j++)
                    {
                        v(j, k) = -v(j, k);
                    }
                }

                break;
            }

            // Still not converged on the last allowed sweep. The previous
            // test (its >= 30) could never be true inside this loop, so
            // non-convergence went unreported.
            if (its == maxIterations - 1)
            {
                throw std::logic_error{ "No convergence after 30 iterations" };
            }

            // shift from bottom 2 x 2 minor
            x = w[l];
            nm = k - 1;
            y = w[nm];
            g = rv1[nm];
            h = rv1[k];
            f = ((y - z) * (y + z) + (g - h) * (g + h)) / (2 * h * y);
            g = Internal::Pythag(f, static_cast<T>(1));
            f = ((x - z) * (x + z) +
                 h * ((y / (f + Internal::Sign(g, f))) - h)) /
                x;

            // next QR transformation
            c = s = 1;

            for (j = l; j <= nm; j++)
            {
                i = j + 1;
                g = rv1[i];
                y = w[i];
                h = s * g;
                g = c * g;
                z = Internal::Pythag(f, h);
                rv1[j] = z;
                c = f / z;
                s = h / z;
                f = x * c + g * s;
                g = g * c - x * s;
                h = y * s;
                y = y * c;

                // Rotate columns j and i of v.
                for (jj = 0; jj < n; jj++)
                {
                    x = v(jj, j);
                    z = v(jj, i);
                    v(jj, j) = x * c + z * s;
                    v(jj, i) = z * c - x * s;
                }

                z = Internal::Pythag(f, h);
                w[j] = z;

                // When z is zero the previous c and s are reused.
                if (z)
                {
                    z = 1 / z;
                    c = f * z;
                    s = h * z;
                }

                f = (c * g) + (s * y);
                x = (c * y) - (s * g);

                // Rotate columns j and i of u.
                for (jj = 0; jj < m; jj++)
                {
                    y = u(jj, j);
                    z = u(jj, i);
                    u(jj, j) = y * c + z * s;
                    u(jj, i) = z * c - y * s;
                }
            }

            rv1[l] = 0;
            rv1[k] = f;
            w[k] = x;
        }
    }
}


}  // namespace CubbyFlow


#endif

CubbyFlow::Matrix
Definition Matrix.hpp:30

CubbyFlow::Matrix::GetCols
constexpr size_t GetCols() const
Definition Matrix-Impl.hpp:266

CubbyFlow::Matrix::GetRows
constexpr size_t GetRows() const
Definition Matrix-Impl.hpp:260

CubbyFlow::Internal::Pythag
T Pythag(T a, T b)
Definition SVD-Impl.hpp:27

CubbyFlow::Internal::Sign
T Sign(T a, T b)
Definition SVD-Impl.hpp:21

CubbyFlow
Definition pybind11Utils.hpp:21

CubbyFlow::SVD
void SVD(const MatrixMxN< T > &a, MatrixMxN< T > &u, VectorN< T > &w, MatrixMxN< T > &v)
Singular value decomposition (SVD).
Definition SVD-Impl.hpp:54

CubbyFlow::Vector
Matrix< T, Rows, 1 > Vector
Definition Matrix.hpp:738