CubbyFlow/_s_v_d-_impl_8hpp_source.html

 // This code is based on Jet framework.
 // Copyright (c) 2018 Doyub Kim
 // CubbyFlow is voxel-based fluid simulation engine for computer games.
 // Copyright (c) 2020 CubbyFlow Team
 // Core Part: Chris Ohk, Junwoo Hwang, Jihong Sin, Seungwoo Yoo
 // AI Part: Dongheon Cho, Minseo Kim
 // We are making my contributions/submissions to this project solely in our
 // personal capacity and are not conveying any rights to any intellectual
 // property of any third parties.

 #ifndef CUBBYFLOW_SVD_IMPL_HPP
 #define CUBBYFLOW_SVD_IMPL_HPP

 #include <stdexcept>

 namespace CubbyFlow
 {
 namespace Internal
 {
 // Transfers the sign of b onto the magnitude of a: the result is |a| when b
 // is zero or positive and -|a| otherwise.
 template <typename T>
 T Sign(T a, T b)
 {
     const auto magnitude = std::fabs(a);

     if (static_cast<double>(b) >= 0.0)
     {
         return magnitude;
     }

     return -magnitude;
 }

 // Evaluates sqrt(a^2 + b^2) by factoring out the larger magnitude, so that
 // only a ratio no greater than one is squared. Yields 0 when neither
 // magnitude is positive.
 template <typename T>
 T Pythag(T a, T b)
 {
     const T absA = std::fabs(a);
     const T absB = std::fabs(b);

     if (absA > absB)
     {
         const T ratio = absB / absA;
         return absA * std::sqrt(1 + ratio * ratio);
     }

     if (absB > 0)
     {
         const T ratio = absA / absB;
         return absB * std::sqrt(1 + ratio * ratio);
     }

     return 0;
 }
 }  // namespace Internal

 // Singular value decomposition of a dynamically sized matrix.
 //
 // Works in three stages: Householder reduction of a copy of \p a to
 // bi-diagonal form, accumulation of the right- and left-hand transformations,
 // and iterative diagonalization of the bi-diagonal form with shifted QR
 // sweeps.
 //
 // a : input matrix with m rows and n columns, m >= n.
 // u : output; overwritten with a copy of \p a and transformed in place.
 // w : output; resized to n entries, receives the singular values (made
 //     non-negative on convergence).
 // v : output; resized to n x n.
 // NOTE(review): the factors are presumably meant to satisfy
 // a ~= u * diag(w) * transpose(v) - confirm against the public SVD docs.
 //
 // Magnitudes are compared against the machine epsilon of double as an
 // absolute threshold, regardless of T.
 //
 // Throws std::invalid_argument when m < n and std::logic_error when a
 // singular value has not converged within 30 sweeps.
 template <typename T>
 void SVD(const MatrixMxN<T>& a, MatrixMxN<T>& u, VectorN<T>& w, MatrixMxN<T>& v)
 {
     const int m = static_cast<int>(a.GetRows());
     const int n = static_cast<int>(a.GetCols());

     // Absolute threshold separating negligible from significant magnitudes.
     constexpr double eps = std::numeric_limits<double>::epsilon();
     // Number of QR sweeps allowed per singular value.
     constexpr int maxIterations = 30;

     int i = 0, j = 0, jj = 0, k = 0, l = 0, nm = 0;
     T c = 0, f = 0, h = 0, s = 0, x = 0, y = 0, z = 0;
     T g = 0, scale = 0;

     if (m < n)
     {
         throw std::invalid_argument{
             "Number of rows of input matrix must greater than or equal to "
             "columns."
         };
     }

     // Prepare workspace (rv1 holds the off-diagonal of the bi-diagonal form)
     VectorN<T> rv1(n, T{});
     u = a;
     w.Resize(n, 0);
     v.Resize(n, n, 0);

     // Householder reduction to bi-diagonal form
     for (i = 0; i < n; i++)
     {
         // left-hand reduction
         l = i + 1;
         rv1[i] = scale * g;
         g = s = scale = 0;

         if (i < m)
         {
             for (k = i; k < m; k++)
             {
                 scale += std::fabs(u(k, i));
             }

             if (std::fabs(static_cast<double>(scale)) >= eps)
             {
                 // Normalize the column by its 1-norm before squaring
                 for (k = i; k < m; k++)
                 {
                     u(k, i) /= scale;
                     s += u(k, i) * u(k, i);
                 }

                 f = u(i, i);
                 g = -Internal::Sign(std::sqrt(s), f);
                 h = f * g - s;
                 u(i, i) = f - g;

                 if (i != n - 1)
                 {
                     for (j = l; j < n; j++)
                     {
                         s = 0;

                         for (k = i; k < m; k++)
                         {
                             s += u(k, i) * u(k, j);
                         }

                         f = s / h;

                         for (k = i; k < m; k++)
                         {
                             u(k, j) += f * u(k, i);
                         }
                     }
                 }

                 // Undo the normalization
                 for (k = i; k < m; k++)
                 {
                     u(k, i) *= scale;
                 }
             }
         }

         w[i] = scale * g;

         // right-hand reduction
         g = s = scale = 0;

         if (i < m && i != n - 1)
         {
             for (k = l; k < n; k++)
             {
                 scale += std::fabs(u(i, k));
             }

             if (std::fabs(static_cast<double>(scale)) >= eps)
             {
                 for (k = l; k < n; k++)
                 {
                     u(i, k) /= scale;
                     s += u(i, k) * u(i, k);
                 }

                 f = u(i, l);
                 g = -Internal::Sign(std::sqrt(s), f);
                 h = f * g - s;
                 u(i, l) = f - g;

                 for (k = l; k < n; k++)
                 {
                     rv1[k] = static_cast<T>(u(i, k)) / h;
                 }

                 if (i != m - 1)
                 {
                     for (j = l; j < m; j++)
                     {
                         s = 0;

                         for (k = l; k < n; k++)
                         {
                             s += u(j, k) * u(i, k);
                         }

                         for (k = l; k < n; k++)
                         {
                             u(j, k) += s * rv1[k];
                         }
                     }
                 }

                 for (k = l; k < n; k++)
                 {
                     u(i, k) *= scale;
                 }
             }
         }
     }

     // accumulate the right-hand transformation
     // (g and l enter this loop holding the values left by the last pass of
     // the reduction above; they are refreshed at the end of every pass)
     for (i = n - 1; i >= 0; i--)
     {
         if (i < n - 1)
         {
             if (std::fabs(static_cast<double>(g)) >= eps)
             {
                 // Two successive divisions instead of one division by the
                 // product u(i, l) * g, to avoid underflow
                 for (j = l; j < n; j++)
                 {
                     v(j, i) = ((u(i, j) / u(i, l)) / g);
                 }

                 for (j = l; j < n; j++)
                 {
                     s = 0;

                     for (k = l; k < n; k++)
                     {
                         s += u(i, k) * v(k, j);
                     }

                     for (k = l; k < n; k++)
                     {
                         v(k, j) += s * v(k, i);
                     }
                 }
             }

             for (j = l; j < n; j++)
             {
                 v(i, j) = v(j, i) = 0;
             }
         }

         v(i, i) = 1;
         g = rv1[i];
         l = i;
     }

     // accumulate the left-hand transformation
     for (i = n - 1; i >= 0; i--)
     {
         l = i + 1;
         g = w[i];

         if (i < n - 1)
         {
             for (j = l; j < n; j++)
             {
                 u(i, j) = 0;
             }
         }

         if (std::fabs(static_cast<double>(g)) >= eps)
         {
             g = 1 / g;

             if (i != n - 1)
             {
                 for (j = l; j < n; j++)
                 {
                     s = 0;

                     for (k = l; k < m; k++)
                     {
                         s += u(k, i) * u(k, j);
                     }

                     f = (s / u(i, i)) * g;

                     for (k = i; k < m; k++)
                     {
                         u(k, j) += f * u(k, i);
                     }
                 }
             }

             for (j = i; j < m; j++)
             {
                 u(j, i) = u(j, i) * g;
             }
         }
         else
         {
             for (j = i; j < m; j++)
             {
                 u(j, i) = 0;
             }
         }

         ++u(i, i);
     }

     // diagonalize the bi-diagonal form
     for (k = n - 1; k >= 0; k--)
     {
         // loop over singular values
         for (int its = 0; its < maxIterations; its++)
         {
             // loop over allowed iterations
             int flag = 1;

             for (l = k; l >= 0; l--)
             {
                 // test for splitting
                 // (rv1[0] is written as zero by the reduction and by every
                 // sweep that starts at l == 0, so the scan stops at l == 0
                 // before w[nm] could be read with nm == -1)
                 nm = l - 1;

                 if (std::fabs(static_cast<double>(rv1[l])) <= eps)
                 {
                     flag = 0;
                     break;
                 }

                 if (std::fabs(static_cast<double>(w[nm])) <= eps)
                 {
                     break;
                 }
             }

             if (flag)
             {
                 // cancellation of rv1[l], needed because w[nm] is negligible
                 c = 0;
                 s = 1;

                 for (i = l; i <= k; i++)
                 {
                     f = s * rv1[i];

                     // Rotate only while f is still significant: a negligible
                     // f leaves nothing to cancel, and with w[i] also zero
                     // the rotation below would divide by zero.
                     if (std::fabs(static_cast<double>(f)) > eps)
                     {
                         g = w[i];
                         h = Internal::Pythag(f, g);
                         w[i] = static_cast<T>(h);
                         h = 1 / h;
                         c = g * h;
                         s = -f * h;

                         for (j = 0; j < m; j++)
                         {
                             y = u(j, nm);
                             z = u(j, i);
                             u(j, nm) = y * c + z * s;
                             u(j, i) = z * c - y * s;
                         }
                     }
                 }
             }

             z = w[k];

             if (l == k)
             {
                 // convergence
                 if (z < 0)
                 {
                     // make singular value nonnegative
                     w[k] = -z;

                     for (j = 0; j < n; j++)
                     {
                         v(j, k) = -v(j, k);
                     }
                 }

                 break;
             }

             // Still not converged on the last allowed sweep: report it
             // instead of silently returning an unfinished decomposition.
             if (its == maxIterations - 1)
             {
                 throw std::logic_error{ "No convergence after 30 iterations" };
             }

             // shift from bottom 2 x 2 minor
             x = w[l];
             nm = k - 1;
             y = w[nm];
             g = rv1[nm];
             h = rv1[k];
             f = ((y - z) * (y + z) + (g - h) * (g + h)) / (2 * h * y);
             g = Internal::Pythag(f, static_cast<T>(1));
             f = ((x - z) * (x + z) +
                  h * ((y / (f + Internal::Sign(g, f))) - h)) /
                 x;

             // next QR transformation
             c = s = 1;

             for (j = l; j <= nm; j++)
             {
                 i = j + 1;
                 g = rv1[i];
                 y = w[i];
                 h = s * g;
                 g = c * g;
                 z = Internal::Pythag(f, h);
                 rv1[j] = z;
                 c = f / z;
                 s = h / z;
                 f = x * c + g * s;
                 g = g * c - x * s;
                 h = y * s;
                 y = y * c;

                 // Apply the rotation to columns j and i of v
                 for (jj = 0; jj < n; jj++)
                 {
                     x = v(jj, j);
                     z = v(jj, i);
                     v(jj, j) = x * c + z * s;
                     v(jj, i) = z * c - x * s;
                 }

                 z = Internal::Pythag(f, h);
                 w[j] = z;

                 // When z is negligible the previous c and s are reused
                 if (std::fabs(static_cast<double>(z)) >= eps)
                 {
                     z = 1 / z;
                     c = f * z;
                     s = h * z;
                 }

                 f = (c * g) + (s * y);
                 x = (c * y) - (s * g);

                 // Apply the rotation to columns j and i of u
                 for (jj = 0; jj < m; jj++)
                 {
                     y = u(jj, j);
                     z = u(jj, i);
                     u(jj, j) = y * c + z * s;
                     u(jj, i) = z * c - y * s;
                 }
             }

             rv1[l] = 0;
             rv1[k] = f;
             w[k] = x;
         }
     }
 }

 // Singular value decomposition of a fixed-size M x N matrix (M >= N,
 // enforced at compile time).
 //
 // Works in three stages: Householder reduction of a copy of \p a to
 // bi-diagonal form, accumulation of the right- and left-hand transformations,
 // and iterative diagonalization of the bi-diagonal form with shifted QR
 // sweeps.
 //
 // a : input matrix.
 // u : output; overwritten with a copy of \p a and transformed in place.
 // w : output; receives the singular values (made non-negative on
 //     convergence).
 // v : output N x N matrix.
 // NOTE(review): the factors are presumably meant to satisfy
 // a ~= u * diag(w) * transpose(v) - confirm against the public SVD docs.
 //
 // An off-diagonal or diagonal entry e is considered negligible when
 // |e| + anorm == anorm, where anorm is the largest |w[i]| + |rv1[i]| seen
 // during the reduction.
 //
 // Throws std::logic_error when a singular value has not converged within 30
 // sweeps.
 template <typename T, size_t M, size_t N>
 void SVD(const Matrix<T, M, N>& a, Matrix<T, M, N>& u, Vector<T, N>& w,
          Matrix<T, N, N>& v)
 {
     static_assert(M >= N,
                   "Number of rows of input matrix must greater than or equal "
                   "to columns.");

     const int m = static_cast<int>(M);
     const int n = static_cast<int>(N);

     // Number of QR sweeps allowed per singular value.
     constexpr int maxIterations = 30;

     int i = 0, j = 0, jj = 0, k = 0, l = 0, nm = 0;
     T c = 0, f = 0, h = 0, s = 0, x = 0, y = 0, z = 0;
     T anorm = 0, g = 0, scale = 0;

     // Prepare workspace (rv1 holds the off-diagonal of the bi-diagonal form;
     // every entry is written by the reduction loop before it is read)
     Vector<T, N> rv1;
     u = a;
     w = Vector<T, N>{};
     v = Matrix<T, N, N>{};

     // Householder reduction to bi-diagonal form
     for (i = 0; i < n; i++)
     {
         // left-hand reduction
         l = i + 1;
         rv1[i] = scale * g;
         g = s = scale = 0;

         if (i < m)
         {
             for (k = i; k < m; k++)
             {
                 scale += std::fabs(u(k, i));
             }

             if (scale)
             {
                 // Normalize the column by its 1-norm before squaring
                 for (k = i; k < m; k++)
                 {
                     u(k, i) /= scale;
                     s += u(k, i) * u(k, i);
                 }

                 f = u(i, i);
                 g = -Internal::Sign(std::sqrt(s), f);
                 h = f * g - s;
                 u(i, i) = f - g;

                 if (i != n - 1)
                 {
                     for (j = l; j < n; j++)
                     {
                         s = 0;

                         for (k = i; k < m; k++)
                         {
                             s += u(k, i) * u(k, j);
                         }

                         f = s / h;

                         for (k = i; k < m; k++)
                         {
                             u(k, j) += f * u(k, i);
                         }
                     }
                 }

                 // Undo the normalization
                 for (k = i; k < m; k++)
                 {
                     u(k, i) *= scale;
                 }
             }
         }

         w[i] = scale * g;

         // right-hand reduction
         g = s = scale = 0;

         if (i < m && i != n - 1)
         {
             for (k = l; k < n; k++)
             {
                 scale += std::fabs(u(i, k));
             }

             if (scale)
             {
                 for (k = l; k < n; k++)
                 {
                     u(i, k) /= scale;
                     s += u(i, k) * u(i, k);
                 }

                 f = u(i, l);
                 g = -Internal::Sign(std::sqrt(s), f);
                 h = f * g - s;
                 u(i, l) = f - g;

                 for (k = l; k < n; k++)
                 {
                     rv1[k] = static_cast<T>(u(i, k)) / h;
                 }

                 if (i != m - 1)
                 {
                     for (j = l; j < m; j++)
                     {
                         s = 0;

                         for (k = l; k < n; k++)
                         {
                             s += u(j, k) * u(i, k);
                         }

                         for (k = l; k < n; k++)
                         {
                             u(j, k) += s * rv1[k];
                         }
                     }
                 }

                 for (k = l; k < n; k++)
                 {
                     u(i, k) *= scale;
                 }
             }
         }

         // Track the magnitude later used as the reference for "negligible"
         anorm = std::max(anorm,
                          (std::fabs(static_cast<T>(w[i])) + std::fabs(rv1[i])));
     }

     // accumulate the right-hand transformation
     // (g and l enter this loop holding the values left by the last pass of
     // the reduction above; they are refreshed at the end of every pass)
     for (i = n - 1; i >= 0; i--)
     {
         if (i < n - 1)
         {
             if (g)
             {
                 // Two successive divisions instead of one division by the
                 // product u(i, l) * g, to avoid underflow
                 for (j = l; j < n; j++)
                 {
                     v(j, i) = ((u(i, j) / u(i, l)) / g);
                 }

                 for (j = l; j < n; j++)
                 {
                     s = 0;

                     for (k = l; k < n; k++)
                     {
                         s += u(i, k) * v(k, j);
                     }

                     for (k = l; k < n; k++)
                     {
                         v(k, j) += s * v(k, i);
                     }
                 }
             }

             for (j = l; j < n; j++)
             {
                 v(i, j) = v(j, i) = 0;
             }
         }

         v(i, i) = 1;
         g = rv1[i];
         l = i;
     }

     // accumulate the left-hand transformation
     for (i = n - 1; i >= 0; i--)
     {
         l = i + 1;
         g = w[i];

         if (i < n - 1)
         {
             for (j = l; j < n; j++)
             {
                 u(i, j) = 0;
             }
         }

         if (g)
         {
             g = 1 / g;

             if (i != n - 1)
             {
                 for (j = l; j < n; j++)
                 {
                     s = 0;

                     for (k = l; k < m; k++)
                     {
                         s += u(k, i) * u(k, j);
                     }

                     f = (s / u(i, i)) * g;

                     for (k = i; k < m; k++)
                     {
                         u(k, j) += f * u(k, i);
                     }
                 }
             }

             for (j = i; j < m; j++)
             {
                 u(j, i) = u(j, i) * g;
             }
         }
         else
         {
             for (j = i; j < m; j++)
             {
                 u(j, i) = 0;
             }
         }

         ++u(i, i);
     }

     // diagonalize the bi-diagonal form
     for (k = n - 1; k >= 0; k--)
     {
         // loop over singular values
         for (int its = 0; its < maxIterations; its++)
         {
             // loop over allowed iterations
             int flag = 1;

             for (l = k; l >= 0; l--)
             {
                 // test for splitting
                 // (rv1[0] is written as zero by the reduction and by every
                 // sweep that starts at l == 0, so the scan stops at l == 0
                 // before w[nm] could be read with nm == -1)
                 nm = l - 1;

                 if (std::fabs(rv1[l]) + anorm == anorm)
                 {
                     flag = 0;
                     break;
                 }

                 if (std::fabs(static_cast<T>(w[nm])) + anorm == anorm)
                 {
                     break;
                 }
             }

             if (flag)
             {
                 // cancellation of rv1[l], needed because w[nm] is negligible
                 c = 0;
                 s = 1;

                 for (i = l; i <= k; i++)
                 {
                     f = s * rv1[i];

                     // Rotate only while f is still significant
                     if (std::fabs(f) + anorm != anorm)
                     {
                         g = w[i];
                         h = Internal::Pythag(f, g);
                         w[i] = static_cast<T>(h);
                         h = 1 / h;
                         c = g * h;
                         s = -f * h;

                         for (j = 0; j < m; j++)
                         {
                             y = u(j, nm);
                             z = u(j, i);
                             u(j, nm) = y * c + z * s;
                             u(j, i) = z * c - y * s;
                         }
                     }
                 }
             }

             z = w[k];

             if (l == k)
             {
                 // convergence
                 if (z < 0)
                 {
                     // make singular value nonnegative
                     w[k] = -z;

                     for (j = 0; j < n; j++)
                     {
                         v(j, k) = -v(j, k);
                     }
                 }

                 break;
             }

             // Still not converged on the last allowed sweep: report it
             // instead of silently returning an unfinished decomposition.
             if (its == maxIterations - 1)
             {
                 throw std::logic_error{ "No convergence after 30 iterations" };
             }

             // shift from bottom 2 x 2 minor
             x = w[l];
             nm = k - 1;
             y = w[nm];
             g = rv1[nm];
             h = rv1[k];
             f = ((y - z) * (y + z) + (g - h) * (g + h)) / (2 * h * y);
             g = Internal::Pythag(f, static_cast<T>(1));
             f = ((x - z) * (x + z) +
                  h * ((y / (f + Internal::Sign(g, f))) - h)) /
                 x;

             // next QR transformation
             c = s = 1;

             for (j = l; j <= nm; j++)
             {
                 i = j + 1;
                 g = rv1[i];
                 y = w[i];
                 h = s * g;
                 g = c * g;
                 z = Internal::Pythag(f, h);
                 rv1[j] = z;
                 c = f / z;
                 s = h / z;
                 f = x * c + g * s;
                 g = g * c - x * s;
                 h = y * s;
                 y = y * c;

                 // Apply the rotation to columns j and i of v
                 for (jj = 0; jj < n; jj++)
                 {
                     x = v(jj, j);
                     z = v(jj, i);
                     v(jj, j) = x * c + z * s;
                     v(jj, i) = z * c - x * s;
                 }

                 z = Internal::Pythag(f, h);
                 w[j] = z;

                 // When z is zero the previous c and s are reused
                 if (z)
                 {
                     z = 1 / z;
                     c = f * z;
                     s = h * z;
                 }

                 f = (c * g) + (s * y);
                 x = (c * y) - (s * g);

                 // Apply the rotation to columns j and i of u
                 for (jj = 0; jj < m; jj++)
                 {
                     y = u(jj, j);
                     z = u(jj, i);
                     u(jj, j) = y * c + z * s;
                     u(jj, i) = z * c - y * s;
                 }
             }

             rv1[l] = 0;
             rv1[k] = f;
             w[k] = x;
         }
     }
 }
 }  // namespace CubbyFlow

 #endif
CubbyFlow::Internal::Sign
T Sign(T a, T b)
Definition: SVD-Impl.hpp:21

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, MATRIX_SIZE_DYNAMIC >::GetCols
size_t GetCols() const
Definition: Matrix-Impl.hpp:1069

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, MATRIX_SIZE_DYNAMIC >::Resize
void Resize(size_t rows, size_t cols, ConstReference val=ValueType{})
Definition: Matrix-Impl.hpp:1035

CubbyFlow::Matrix
Definition: Matrix.hpp:27

CubbyFlow
Definition: pybind11Utils.hpp:20

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, MATRIX_SIZE_DYNAMIC >
Definition: Matrix.hpp:531

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, 1 >
Definition: Matrix.hpp:611

CubbyFlow::Internal::Pythag
T Pythag(T a, T b)
Definition: SVD-Impl.hpp:27

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, 1 >::Resize
void Resize(size_t rows, ConstReference val=ValueType{})
Definition: Matrix-Impl.hpp:1245

CubbyFlow::SVD
void SVD(const MatrixMxN< T > &a, MatrixMxN< T > &u, VectorN< T > &w, MatrixMxN< T > &v)
Singular value decomposition (SVD).
Definition: SVD-Impl.hpp:54

CubbyFlow::Matrix< T, MATRIX_SIZE_DYNAMIC, MATRIX_SIZE_DYNAMIC >::GetRows
size_t GetRows() const
Definition: Matrix-Impl.hpp:1063