alp/v0.8-preview/gmres_8hpp_source.html

 /*
  *   Copyright 2023 Huawei Technologies Co., Ltd.
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *     http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #ifndef _H_GRB_ALGORITHMS_GMRES
 #define _H_GRB_ALGORITHMS_GMRES

 #include <cstdio>
 #include <complex>
 #include <functional> //function

 #include <graphblas.hpp>
 #include <graphblas/algorithms/norm.hpp>
 #include <graphblas/utils/iscomplex.hpp>

 namespace grb {

     namespace algorithms {

         /**
          * Solves the small least-squares problem that arises in GMRES by applying
          * Givens rotations to an upper-Hessenberg system, followed by
          * back-substitution.
          *
          * The flat array \a H is addressed with leading dimension \a n: its first
          * \a n entries hold the right-hand side, while entry (i,k) of the
          * Hessenberg matrix is read from and written to
          * <tt>H[ ( k + 1 ) * n + i ]</tt>.
          *
          * @tparam NonzeroType   Element type of \a H and \a vecx.
          * @tparam DimensionType Integral type of \a n and \a kspspacesize.
          * @tparam ResidualType  Real type used for moduli and for \a tol.
          *
          * @param[in,out] H      On input, the right-hand side and Hessenberg
          *                       matrix as described above; must hold at least
          *                       n^2 entries. The matrix part is overwritten by
          *                       the rotations. On exit, the first \a n entries
          *                       are a copy of \a vecx.
          * @param[in] n          Leading dimension of \a H; must be at least one.
          * @param[in] kspspacesize Number of columns to process; must satisfy
          *                       1 <= kspspacesize < n.
          * @param[in] tol        Must be strictly positive. Only used to print a
          *                       warning when the modulus of a diagonal entry
          *                       used as a divisor is below it.
          * @param[in,out] vecx   Workspace of at least \a n entries. On exit, its
          *                       first \a kspspacesize entries hold the result of
          *                       the back-substitution.
          * @param[in] ring       Semiring over \a NonzeroType.
          * @param[in] minus      Subtraction operator over \a NonzeroType.
          * @param[in] divide     Division operator over \a NonzeroType.
          * @param[in] sqrtX      Square-root function over \a ResidualType.
          *
          * @returns ILLEGAL  If \a n < 1, \a H has fewer than n^2 entries,
          *                   \a kspspacesize < 1, \a kspspacesize >= \a n, or
          *                   \a tol <= 0.
          * @returns MISMATCH If \a vecx has fewer than \a n entries.
          * @returns Otherwise, the first non-SUCCESS code returned by any of the
          *          scalar folds, or SUCCESS if all of them succeeded.
          */
         template<
             typename NonzeroType,
             typename DimensionType,
             typename ResidualType,
             class Ring = Semiring<
                 grb::operators::add< NonzeroType >, grb::operators::mul< NonzeroType >,
                 grb::identities::zero, grb::identities::one
             >,
             class Minus = operators::subtract< NonzeroType >,
             class Divide = operators::divide< NonzeroType >
         >
         grb::RC hessolve(
             std::vector< NonzeroType > &H,
             const DimensionType n,
             const DimensionType &kspspacesize,
             const ResidualType tol,
             std::vector< NonzeroType > &vecx,
             const Ring &ring = Ring(),
             const Minus &minus = Minus(),
             const Divide &divide = Divide(),
             const std::function< ResidualType( ResidualType ) > &sqrtX =
                 std_sqrt< ResidualType, ResidualType >
         ) {
             RC rc = grb::SUCCESS;

             if( n < 1 ) {
                 return ILLEGAL;
             }
             // n is known to be positive from here on, so the conversion below
             // preserves its value and avoids mixed-type index arithmetic
             const size_t dim = static_cast< size_t >( n );
             if( H.size() < ( dim * dim ) ) {
                 std::cerr << "Error: algorithms::hessolve requires input parameter H to "
                     << "have a number of entries greater-than or equal-to n^2. "
                     << "However, " << H.size() << " is smaller-than "
                     << ( dim * dim ) << ".\n";
                 return ILLEGAL;
             }
             if( kspspacesize < 1 ) {
                 return ILLEGAL;
             }
             if( kspspacesize >= n ) {
                 return ILLEGAL;
             }
             if( tol <= 0 ) {
                 return ILLEGAL;
             }
             // only vecx[ 0 ], ..., vecx[ n - 1 ] are accessed below, so a workspace
             // of exactly n entries is sufficient
             if( vecx.size() < dim ) {
                 std::cerr << "Error: algorithms::hessolve requires a given workspace vecx "
                     << "that has a number of entries greater-than or equal-to the given "
                     << "parameter n. However, " << vecx.size() << " is strictly smaller-than "
                     << n << ".\n";
                 return MISMATCH;
             }

             // vecx = H (the first n entries of H hold the right-hand side)
             for( size_t i = 0; i < dim; ++i ) {
                 vecx[ i ] = H[ i ];
             }

             // the checks above guarantee 1 <= kspspacesize <= n - 1
             const size_t n_ksp = static_cast< size_t >( kspspacesize );

             // for i in range(n):
             for( size_t i = 0; i < n_ksp; ++i ) {
                 // Givens rotation parameters
                 NonzeroType c, s;

                 // this scope uses a semiring over the real (residual) type
                 {
                     Semiring<
                         grb::operators::add< ResidualType >, grb::operators::mul< ResidualType >,
                         grb::identities::zero, grb::identities::one
                     > ring_rtype;

                     // a, b = H[ i:i+2, i ]
                     NonzeroType a = H[ ( i + 1 ) * dim + i ];
                     NonzeroType b = H[ ( i + 1 ) * dim + i + 1 ];

                     ResidualType a_mod = grb::utils::is_complex< NonzeroType >::modulus( a );
                     ResidualType b_mod = grb::utils::is_complex< NonzeroType >::modulus( b );
                     NonzeroType b_conj = grb::utils::is_complex< NonzeroType >::conjugate( b );
                     ResidualType a_mod2 = a_mod;
                     ResidualType b_mod2 = b_mod;
                     rc = rc ? rc : grb::foldl( a_mod2, a_mod,
                         ring_rtype.getMultiplicativeOperator() );
                     rc = rc ? rc : grb::foldl( b_mod2, b_mod,
                         ring_rtype.getMultiplicativeOperator() );

                     // tmp1 = sqrt(norm(a)**2+norm(b)**2)
                     // NOTE(review): if a and b are both zero then tmp1 is zero and the
                     //               divisions below divide by zero; this is not guarded
                     ResidualType tmp1 = a_mod2;
                     rc = rc ? rc : grb::foldl( tmp1, b_mod2,
                         ring_rtype.getAdditiveOperator() );
                     tmp1 = sqrtX( tmp1 );

                     //c = a_mod / tmp1 ;
                     c = a_mod;
                     rc = rc ? rc : grb::foldl( c, tmp1, divide );
                     if( a_mod != 0 ) {
                         // s = a / std::norm(a) * std::conj(b) / tmp1;
                         s = a;
                         rc = rc ? rc : grb::foldl( s, a_mod, divide );
                         rc = rc ? rc : grb::foldl( s, b_conj, ring.getMultiplicativeOperator() );
                         rc = rc ? rc : grb::foldl( s, tmp1, divide );
                     } else {
                         // s = std::conj(b) / tmp1;
                         s = b_conj;
                         rc = rc ? rc : grb::foldl( s, tmp1, divide );
                     }
                 }

                 // apply the rotation to rows i and i+1 of the remaining columns
                 // for k in range(i,n):
                 for( size_t k = i; k < n_ksp; ++k ) {
                     // tmp2 = s * H[ i+1, k ]
                     NonzeroType tmp2 = H[ ( k + 1 ) * dim + i + 1 ];
                     rc = rc ? rc : grb::foldl( tmp2, s, ring.getMultiplicativeOperator() );

                     // H[i+1,k] = -conjugate(s) * H[i,k] + c * H[i+1,k]
                     NonzeroType tmp4 = H[ ( k + 1 ) * dim + i ];
                     rc = rc ? rc : grb::foldl( H[ ( k + 1 ) * dim + i + 1 ], c,
                         ring.getMultiplicativeOperator() );
                     rc = rc ? rc : grb::foldl(
                         tmp4,
                         grb::utils::is_complex< NonzeroType >::conjugate( s ),
                         ring.getMultiplicativeOperator()
                     );
                     rc = rc ? rc : grb::foldl( H[ ( k + 1 ) * dim + i + 1 ], tmp4, minus );

                     // H[i,k]   = c * H[i,k] + tmp2
                     rc = rc ? rc : grb::foldl( H[ ( k + 1 ) * dim + i ], c,
                         ring.getMultiplicativeOperator() );
                     rc = rc ? rc : grb::foldl( H[ ( k + 1 ) * dim + i ], tmp2,
                         ring.getAdditiveOperator() );
                 }

                 // apply the same rotation to the right-hand side; both old values
                 // are saved first since each update needs the other's old value
                 NonzeroType tmp3 = vecx[ i ];
                 NonzeroType tmp5 = vecx[ i + 1 ];

                 // vecx[i] =  c * tmp3 + s * vecx[i+1]
                 rc = rc ? rc : grb::foldl( vecx[ i ], c, ring.getMultiplicativeOperator() );
                 rc = rc ? rc : grb::foldl( tmp5, s, ring.getMultiplicativeOperator() );
                 rc = rc ? rc : grb::foldl( vecx[ i ], tmp5, ring.getAdditiveOperator() );


                 // vecx[i+1]  =  -conjugate(s) * tmp3 + c * vecx[i+1]
                 rc = rc ? rc : grb::foldl( vecx[ i + 1 ], c, ring.getMultiplicativeOperator() );
                 rc = rc ? rc : grb::foldl(
                     tmp3,
                     grb::utils::is_complex< NonzeroType >::conjugate( s ),
                     ring.getMultiplicativeOperator()
                 );
                 rc = rc ? rc : grb::foldl( vecx[ i + 1 ], tmp3, minus );
             }

 #ifdef _DEBUG
             std::cout << "hessolve vecx vector before back-substitution, vector = ";
             for( size_t k = 0; k < n_ksp; ++k ) {
                 std::cout << vecx[ k ] << " ";
             }
             std::cout << "\n";
 #endif

             // back-substitution, from the last row up to the first
             // for i in range(n-1,-1,-1):
             for( size_t m = 0; m < n_ksp; ++m ) {
                 const size_t i = n_ksp - 1 - m;
                 // for j in range(i+1,n):
                 for( size_t j = i + 1; j < n_ksp; ++j ) {
                     // vecx[i] = vecx[i]-vecx[j]*H[i,j]
                     NonzeroType tmp6 = vecx[ j ];
                     rc = rc ? rc : grb::foldl( tmp6, H[ ( j + 1 ) * dim + i ],
                         ring.getMultiplicativeOperator() );
                     rc = rc ? rc : grb::foldl( vecx[ i ], tmp6, minus );
                 }
                 // vecx[i] = vecx[i]/H[i,i]
                 // a small divisor is only reported, the division still takes place
                 if( grb::utils::is_complex< NonzeroType >::modulus( H[ ( i + 1 ) * dim + i ] )
                     < tol
                 ) {
                     std::cerr << "Warning: small number in algorithms::hessolve\n";
                 }
                 rc = rc ? rc : grb::foldl( vecx[ i ], H[ ( i + 1 ) * dim + i ], divide );
             }

             // H = vecx
             for( size_t i = 0; i < dim; ++i ) {
                 H[ i ] = vecx[ i ];
             }

             // done
             return rc;
         }

         namespace internal {

             /**
              * Builds the data for one GMRES restart cycle: computes the (optionally
              * preconditioned) residual of \a x, then runs up to \a n_restart steps
              * that each multiply the latest basis vector by \a A, orthogonalise the
              * result against all earlier basis vectors, and record the coefficients
              * in \a Hmatrix.
              *
              * \a Hmatrix is addressed with leading dimension <tt>n_restart + 1</tt>.
              * Entry 0 receives the norm of the initial residual. For a step that
              * produces basis vector k, entries <tt>k * ( n_restart + 1 ) + j</tt> with
              * j < k receive the dot products against Q[ j ], and entry
              * <tt>k * ( n_restart + 1 ) + k</tt> receives the norm of Q[ k ] after
              * orthogonalisation.
              *
              * @param[in]  x          Current solution estimate.
              * @param[in]  A          System matrix.
              * @param[in]  b          Right-hand side.
              * @param[out] Hmatrix    Reset to zero and then filled as described
              *                        above.
              * @param[in,out] Q       Workspace for the basis vectors; entries 0 up
              *                        to and including \a n_restart may be written.
              * @param[in]  n_restart  Maximum number of steps in this cycle.
              * @param[in]  tol        Tolerance; a step is not started when the
              *                        modulus of the latest diagonal entry of
              *                        \a Hmatrix is below it.
              * @param[in,out] iterations Incremented by the number of steps taken.
              * @param[in,out] temp    Workspace vector.
              * @param[in]  M          Preconditioner. It is applied only if both of
              *                        its dimensions are nonzero.
              * @param[in]  ring       Semiring over \a NonzeroType.
              * @param[in]  minus      Subtraction operator over \a NonzeroType.
              * @param[in]  divide     Division operator over \a NonzeroType.
              * @param[in]  sqrtX      Square-root function over \a ResidualType.
              *
              * Dimensions and capacities are only checked via assertions here; the
              * caller is expected to have validated them.
              *
              * @returns The first non-SUCCESS code returned by any primitive called,
              *          or SUCCESS if all of them succeeded.
              */
             template<
                 Descriptor descr = descriptors::no_operation,
                 typename NonzeroType,
                 typename ResidualType,
                 class Ring = Semiring<
                     grb::operators::add< NonzeroType >, grb::operators::mul< NonzeroType >,
                     grb::identities::zero, grb::identities::one
                 >,
                 class Minus = operators::subtract< NonzeroType >,
                 class Divide = operators::divide< NonzeroType >
             >
             grb::RC gmres_step(
                 const grb::Vector< NonzeroType > &x,
                 const grb::Matrix< NonzeroType > &A,
                 const grb::Vector< NonzeroType > &b,
                 std::vector< NonzeroType > &Hmatrix,
                 std::vector< grb::Vector< NonzeroType > > &Q,
                 const size_t n_restart,
                 const ResidualType tol,
                 size_t &iterations,
                 grb::Vector< NonzeroType > &temp,
                 const grb::Matrix< NonzeroType > &M = grb::Matrix< NonzeroType >( 0, 0 ),
                 const Ring &ring = Ring(),
                 const Minus &minus = Minus(),
                 const Divide &divide = Divide(),
                 const std::function< ResidualType( ResidualType ) > &sqrtX =
                     std_sqrt< ResidualType, ResidualType >
             ) {
                 // static checks
                 static_assert( std::is_floating_point< ResidualType >::value,
                     "Can only use the Arnoldi algorithm with floating-point residual types." );

                 // an empty M signals that no preconditioner should be applied
                 const bool useprecond = (nrows( M ) != 0) && (ncols( M ) != 0);

                 constexpr const Descriptor descr_dense = descr | descriptors::dense;
                 const ResidualType zero = ring.template getZero< ResidualType >();

                 // dynamic checks, main error checking done in GMRES main function
 #ifndef NDEBUG
                 const size_t n = grb::ncols( A );
                 {
                     const size_t m = grb::nrows( A );
                     assert( m == n );
                     assert( size( x ) == n );
                     assert( size( b ) == m );
                     assert( size( Q[ 0 ] ) == n );
                     assert( size( temp ) == n );
                     assert( capacity( x ) == n );
                     assert( capacity( Q[ 0 ] ) == n );
                     assert( capacity( temp ) == n );
                     assert( tol > zero );
                 }
 #endif

                 ResidualType rho, tau;

                 // leading dimension of Hmatrix
                 const size_t ld = n_restart + 1;

                 // (re)set Hmatrix to zero
                 std::fill( Hmatrix.begin(), Hmatrix.end(), zero );

                 //Q[:,0]=b-A.dot(x) ;
                 // temp = 0
                 grb::RC ret = grb::set< descr_dense >( temp, zero );
                 assert( ret == SUCCESS );

                 // temp = A * x
                 ret = ret ? ret : grb::mxv< descr_dense >( temp, A, x, ring );
                 assert( ret == SUCCESS );

                 // Q[ 0 ] = b - temp;
                 ret = ret ? ret : grb::set< descr_dense >( Q[ 0 ], zero );
                 ret = ret ? ret : grb::foldl< descr_dense >( Q[ 0 ], b,
                     ring.getAdditiveMonoid() );
                 assert( nnz( Q[ 0 ] ) == n );
                 assert( nnz( temp ) == n );
                 ret = ret ? ret : grb::foldl< descr_dense >( Q[ 0 ], temp, minus );
                 assert( ret == SUCCESS );

                 // precond
                 if( useprecond ) {
                     // Q[ 0 ] = M * Q[ 0 ]
                     // (every call is chained on ret so that an earlier failure is
                     //  not overwritten by a later success)
                     ret = ret ? ret : grb::set< descr_dense >( temp, Q[ 0 ] );
                     assert( ret == SUCCESS );

                     ret = ret ? ret : grb::set< descr_dense >( Q[ 0 ], zero );
                     assert( ret == SUCCESS );

                     ret = ret ? ret : grb::mxv< descr_dense >( Q[ 0 ], M, temp, ring );
                     assert( ret == SUCCESS );
                 }

                 //rho = norm(Q[:,0])
                 rho = zero;
                 ret = ret ? ret : grb::algorithms::norm2< descr_dense >( rho, Q[ 0 ], ring,
                     sqrtX );
                 assert( ret == SUCCESS );

                 Hmatrix[ 0 ] = rho;

                 tau = tol * rho;

                 // NOTE(review): neither rho nor tau is updated inside the loop below,
                 //               so the first condition is loop-invariant
                 size_t k = 0;
                 while( ( rho > tau ) && ( k < n_restart ) ) {
                     // alpha = r' * r;

                     // stop when the normalisation factor of Q[ k ] is below tolerance
                     if( grb::utils::is_complex< NonzeroType >::modulus(
                             Hmatrix[ k * ld + k ]
                         ) < tol
                     ) {
                         break;
                     }

                     // Q[k] = Q[k] / alpha
                     ret = ret ? ret : grb::foldl< descr_dense >( Q[ k ],
                         Hmatrix[ k * ld + k ], divide );
                     assert( ret == SUCCESS );

                     // Q[k+1] = 0
                     ret = ret ? ret : grb::set< descr_dense >( Q[ k + 1 ], zero );
                     assert( ret == SUCCESS );

                     // Q[k+1] = A * Q[k]
                     ret = ret ? ret : grb::mxv< descr_dense >( Q[ k + 1 ], A, Q[ k ], ring );
                     assert( ret == SUCCESS );

                     // precond
                     if( useprecond ) {
                         // Q[k+1]= M * Q[k+1]
                         ret = ret ? ret : grb::set< descr_dense >( temp, Q[ k+1 ] );
                         assert( ret == SUCCESS );

                         ret = ret ? ret : grb::set< descr_dense >( Q[ k+1 ], zero );
                         assert( ret == SUCCESS );

                         ret = ret ? ret : grb::mxv< descr_dense >( Q[ k+1 ], M, temp, ring );
                         assert( ret == SUCCESS );
                     }

                     (void) ++k;

                     // orthogonalise Q[ k ] against all previously computed vectors
                     for( size_t j = 0; j < std::min( k, n_restart ); j++ ) {
                         //H[j,k] = Q[:,j].dot(Q[:,k])
                         Hmatrix[ k * ld + j ] = zero;
                         ret = ret ? ret : grb::dot< descr_dense >(
                             Hmatrix[ k * ld + j ],
                             Q[ k ], Q[ j ],
                             ring.getAdditiveMonoid(),
                             grb::operators::conjugate_right_mul< NonzeroType >()
                         );
                         assert( ret == SUCCESS );

                         //Q[:,k] = Q[:,k]-H[j,k]*Q[:,j]
                         // (uses the function-level ret: a local redeclaration here
                         //  would hide failures of the calls below from the caller)
                         ret = ret ? ret : grb::set< descr_dense >( temp, zero );
                         assert( ret == SUCCESS );

                         NonzeroType alpha1 = Hmatrix[ k * ld + j ];
                         ret = ret ? ret : grb::eWiseMul< descr_dense >( temp, alpha1, Q[ j ],
                             ring );
                         assert( ret == SUCCESS );

                         ret = ret ? ret : grb::foldl< descr_dense >( Q[ k ], temp, minus );
                         assert( ret == SUCCESS );
                     } // for

                     //alpha = norm(Q[:,k])
                     ResidualType alpha = zero;
                     ret = ret ? ret : grb::algorithms::norm2< descr_dense >( alpha, Q[ k ],
                         ring, sqrtX );
                     assert( ret == SUCCESS );

                     //H[k,k] = alpha
                     Hmatrix[ k * ld + k ] = alpha;
                 } // while

                 iterations += k;

                 return ret;
             }

             /**
              * Shared driver behind the public GMRES entry points: validates all
              * arguments and workspace, then repeats restart cycles until the
              * residual norm drops to at most <tt>tol</tt> times the norm of \a b or
              * until \a max_iterations cycles have been performed.
              *
              * Each cycle calls #gmres_step, solves the resulting small system via
              * #hessolve, adds the corresponding combination of basis vectors to
              * \a x, and recomputes the residual norm of \a x.
              *
              * @tparam descr              Descriptor passed on to the primitives,
              *                            with the dense descriptor added.
              * @tparam no_preconditioning If true, \a M is neither checked nor used.
              *
              * @param[in,out] x          Initial guess on input; updated in place.
              * @param[in]  A             Square system matrix.
              * @param[in]  b             Right-hand side.
              * @param[in]  n_restart     Maximum number of steps per cycle.
              * @param[in]  max_iterations Maximum number of cycles.
              * @param[in]  tol           Strictly positive relative tolerance.
              * @param[out] iterations    Number of cycles performed.
              * @param[out] iterations_gmres Number of cycles performed.
              * @param[out] iterations_arnoldi Sum of the step counts reported by
              *                           #gmres_step over all cycles.
              * @param[out] residual      Residual norm computed last.
              * @param[in,out] Q          Workspace of at least n_restart + 1 vectors,
              *                           each of size and capacity n.
              * @param[in,out] Hmatrix    Workspace of at least (n_restart + 1)^2
              *                           entries.
              * @param[in,out] temp       Workspace vector of size and capacity at
              *                           least n.
              * @param[in,out] temp3      Workspace of at least n entries.
              * @param[in]  M             Preconditioner, see \a no_preconditioning.
              * @param[in]  ring, minus, divide, sqrtX Algebraic structures and
              *                           square-root function used throughout.
              *
              * Output arguments are only written to after all checks have passed.
              *
              * @returns MISMATCH If the sizes of \a x, \a b, or (when used) \a M do
              *                   not match \a A.
              * @returns ILLEGAL  If \a x lacks capacity, \a A is not square,
              *                   \a n_restart is zero while \a max_iterations is not,
              *                   \a tol is not strictly positive, or any workspace
              *                   is too small.
              * @returns FAILED   If all calls succeeded but the tolerance was not
              *                   reached.
              * @returns SUCCESS  If the tolerance was reached.
              * @returns Otherwise, the first error code returned by a callee.
              */
             template<
                 Descriptor descr = descriptors::no_operation,
                 bool no_preconditioning = true,
                 typename NonzeroType,
                 typename ResidualType,
                 class Ring = Semiring<
                     grb::operators::add< NonzeroType >, grb::operators::mul< NonzeroType >,
                     grb::identities::zero, grb::identities::one
                 >,
                 class Minus = operators::subtract< NonzeroType >,
                 class Divide = operators::divide< NonzeroType >
             >
             grb::RC gmres_dispatch(
                 grb::Vector< NonzeroType > &x,
                 const grb::Matrix< NonzeroType > &A,
                 const grb::Vector< NonzeroType > &b,
                 const size_t n_restart,
                 const size_t max_iterations,
                 const ResidualType tol,
                 size_t &iterations,
                 size_t &iterations_gmres,
                 size_t &iterations_arnoldi,
                 ResidualType &residual,
                 std::vector< grb::Vector< NonzeroType > > &Q,
                 std::vector< NonzeroType > &Hmatrix,
                 grb::Vector< NonzeroType > &temp,
                 std::vector< NonzeroType > &temp3,
                 const grb::Matrix< NonzeroType > &M,
                 const Ring &ring = Ring(),
                 const Minus &minus = Minus(),
                 const Divide &divide = Divide(),
                 const std::function< ResidualType( ResidualType ) > &sqrtX =
                     std_sqrt< ResidualType, ResidualType >
             ) {
                 grb::RC rc = grb::SUCCESS;
                 constexpr const Descriptor descr_dense = descr | descriptors::dense;
                 const ResidualType zero = ring.template getZero< ResidualType >();

                 // dynamic checks
                 {
                     // mismatches
                     const size_t n = grb::ncols( A );
                     const size_t m = grb::nrows( A );
                     if( grb::size( x ) != n ) {
                         return MISMATCH;
                     }
                     if( grb::size( b ) != m ) {
                         return MISMATCH;
                     }
                     if( !no_preconditioning ) {
                         if( grb::ncols( M ) != n || grb::nrows( M ) != m ) {
                             return MISMATCH;
                         }
                     }

                     // illegal inputs
                     if( capacity( x ) != n ) {
                         return ILLEGAL;
                     }
                     if( m != n ) {
                         std::cerr << "Warning: grb::algorithms::gmres requires "
                             << "square input matrices, but a non-square input matrix was "
                             << "given instead.\n";
                         return ILLEGAL;
                     }
                     if( n_restart == 0 && max_iterations > 0 ) {
                         return ILLEGAL;
                     }
                     if( tol <= zero ) {
                         std::cerr << "Error: tolerance input to GMRES must be strictly "
                                << "positive\n";
                         return ILLEGAL;
                     }

                     // workspace
                     if( Q.size() <= n_restart ) {
                         std::cerr << "Error: expected n_restart + 1 (" << (n_restart+1) << ") "
                             << "columns in the given Q, but only " << Q.size() << " were given.\n";
                         // FIXME this should become a MISMATCH once ALP/Dense is up
                         return ILLEGAL;
                     }
                     for( size_t i = 0; i <= n_restart; ++i ) {
                         if( grb::size( Q[ i ] ) != n || grb::capacity( Q[ i ] ) != n ) {
                             std::cerr << "Error: provided workspace vectors in Q are not of the "
                                 << "correct length and/or capacity.\n";
                             return ILLEGAL;
                         }
                     }
                     if( Hmatrix.size() < ( ( n_restart + 1 ) * ( n_restart + 1 ) ) ) {
                         std::cerr << "Error: expected (n_restart + 1)^2 entries in H ("
                             << ( ( n_restart + 1 ) * ( n_restart + 1 ) ) << "), but only "
                             << Hmatrix.size() << " were given.\n";
                         // FIXME H should become a structured matrix and this code should return
                         //       MISMATCH if dimension check fails, once ALP/Dense is up
                         return ILLEGAL;
                     }
                     if( grb::size( temp ) < n || grb::capacity( temp ) < n ) {
                         std::cerr << "Error: provided temp workspace vector is not of the correct "
                             << "length and/or capacity.\n";
                         return ILLEGAL;
                     }
                     if( temp3.size() < n ) {
                         std::cerr << "Error: provided temp3 workspace vector (STL) is not of the "
                             << "correct length.\n";
                         return ILLEGAL;
                     }
                 }

                 // no side effects: set initial values to outputs only after error checking
                 iterations = iterations_gmres = iterations_arnoldi = 0;
                 residual = 0;

                 // get RHS vector norm
                 ResidualType bnorm = zero;
                 rc = rc ? rc : grb::algorithms::norm2< descr_dense >( bnorm, b, ring,
                     sqrtX );

 #ifdef DEBUG
                 {
                     // print (up to) the first and last ten entries of b
                     const size_t n = grb::size( b );
                     const size_t head = n < 10 ? n : 10;
                     const size_t tail = n < 10 ? 0 : n - 10;
                     std::cout << "RHS norm = " << bnorm << " \n";
                     PinnedVector< NonzeroType > pinnedVector( b, SEQUENTIAL );
                     std::cout << "RHS vector = ";
                     for( size_t k = 0; k < head; ++k ) {
                         const NonzeroType &nonzeroValue = pinnedVector.getNonzeroValue( k );
                         std::cout << nonzeroValue << " ";
                     }
                     std::cout << " ...  ";
                     for( size_t k = tail; k < n; ++k ) {
                         const NonzeroType &nonzeroValue = pinnedVector.getNonzeroValue( k );
                         std::cout << nonzeroValue << " ";
                     }
                     std::cout << "\n";
                 }
 #endif
                 // guard against a trivial call
                 // NOTE(review): the residual reported here is the norm of b, not the
                 //               norm of b - A * x; confirm whether that is intended
                 if( max_iterations == 0 ) {
                     rc = rc ? rc : grb::algorithms::norm2< descr_dense >( residual, b, ring,
                         sqrtX );
                     assert( rc == grb::SUCCESS );

                     if( residual <= tol * bnorm ) {
                         return rc;
                     } else {
                         return FAILED;
                     }
                 }

                 // perform gmres iterations
                 for( size_t gmres_iter = 0; gmres_iter < max_iterations; ++gmres_iter ) {
                     (void) ++iterations;
                     (void) ++iterations_gmres;
                     size_t kspspacesize = 0;
                     if( no_preconditioning ) {
 #ifdef DEBUG
                         std::cout << "Call gmres without preconditioner.\n";
 #endif
                         rc = rc ? rc : gmres_step< descr_dense >(
                             x, A, b,
                             Hmatrix, Q,
                             n_restart, tol,
                             kspspacesize,
                             temp, grb::Matrix< NonzeroType >( 0, 0 ),
                             ring, minus, divide, sqrtX
                         );
                     } else {
 #ifdef DEBUG
                         std::cout << "Call gmres with preconditioner.\n";
 #endif
                         rc = rc ? rc : gmres_step< descr_dense >(
                             x, A, b,
                             Hmatrix, Q,
                             n_restart, tol,
                             kspspacesize,
                             temp, M,
                             ring, minus, divide, sqrtX
                         );
                     }
 #ifdef DEBUG
                     if( rc == grb::SUCCESS ) {
                         std::cout << "gmres iteration finished successfully, kspspacesize = "
                             << kspspacesize << "\n";
                     }
 #endif
                     assert( rc == grb::SUCCESS );

                     iterations_arnoldi += kspspacesize;

                     // gmres_step may legitimately take zero steps, in which case there
                     // is no small system to solve and x is left untouched; hessolve
                     // itself rejects an empty Krylov space as ILLEGAL
                     if( kspspacesize > 0 ) {
                         rc = rc ? rc : hessolve(
                             Hmatrix, n_restart + 1, kspspacesize, tol, temp3,
                             ring, minus, divide, sqrtX
                         );
                         assert( rc == grb::SUCCESS );

                         // update x
                         for( size_t i = 0; rc == grb::SUCCESS && i < kspspacesize; ++i ) {
                             rc = rc ? rc : grb::eWiseMul< descr_dense >( x, Hmatrix[ i ], Q[ i ],
                                 ring );
                             assert( rc == grb::SUCCESS );
                         }
                     }

 #ifdef DEBUG
                     if( rc == grb::SUCCESS ) {
                         // print (up to) the first and last ten entries of x
                         const size_t n = grb::size( x );
                         const size_t head = n < 10 ? n : 10;
                         const size_t tail = n < 10 ? 0 : n - 10;
                         std::cout << "vector x updated successfully\n";
                         PinnedVector< NonzeroType > pinnedVector( x, SEQUENTIAL );
                         std::cout << "x vector = ";
                         for( size_t k = 0; k < head; ++k ) {
                             const NonzeroType &nonzeroValue = pinnedVector.getNonzeroValue( k );
                             std::cout << nonzeroValue << " ";
                         }
                         std::cout << " ...  ";
                         for( size_t k = tail; k < n; ++k ) {
                             const NonzeroType &nonzeroValue = pinnedVector.getNonzeroValue( k );
                             std::cout << nonzeroValue << " ";
                         }
                         std::cout << "\n";
                     }
 #endif

                     // calculate residual
                     // (chained on rc so that a failure above is not overwritten)
                     rc = rc ? rc : grb::set< descr_dense >( temp, zero );
                     rc = rc ? rc : grb::mxv< descr_dense >( temp, A, x, ring );
                     rc = rc ? rc : grb::foldl< descr_dense >( temp, b, minus );
                     rc = rc ? rc : grb::algorithms::norm2< descr_dense >( residual, temp, ring,
                         sqrtX );
                     assert( rc == grb::SUCCESS );

                     // once any call has failed, all further work would be skipped
                     if( rc != grb::SUCCESS ) {
                         break;
                     }

 #ifdef DEBUG
                     std::cout << "Residual norm = " << residual << " \n";
 #endif

                     if( residual <= tol * bnorm ) {
 #ifdef DEBUG
                         std::cout << "Convergence reached\n";
 #endif
                         break;
                     }
                 } // gmres iterations

                 if( rc == SUCCESS && residual > tol  * bnorm ) {
                     return FAILED;
                 } else {
                     return rc;
                 }
             }

         } // end namespace grb::algorithms::internal

         /**
          * GMRES without preconditioning.
          *
          * Forwards every argument unchanged to internal::gmres_dispatch with its
          * \a no_preconditioning template argument set to <tt>true</tt>, supplying
          * an empty (0-by-0) matrix in the position of the preconditioner.
          *
          * @param[in,out] x   Solution vector, passed on as-is.
          * @param[in] A       System matrix.
          * @param[in] b       Right-hand side.
          * @param[in] n_restart, max_iterations, tol Iteration controls.
          * @param[out] iterations, iterations_gmres, iterations_arnoldi, residual
          *                    Statistics written by the dispatcher.
          * @param[in,out] Q, Hmatrix, temp, temp3 Workspace.
          * @param[in] ring, minus, divide, sqrtX Algebraic structures and the
          *                    square-root function.
          *
          * @returns Whatever internal::gmres_dispatch returns.
          */
         template<
             Descriptor descr = descriptors::no_operation,
             typename NonzeroType,
             typename ResidualType,
             class Ring = Semiring<
                 grb::operators::add< NonzeroType >, grb::operators::mul< NonzeroType >,
                 grb::identities::zero, grb::identities::one
             >,
             class Minus = operators::subtract< NonzeroType >,
             class Divide = operators::divide< NonzeroType >
         >
         grb::RC gmres(
             grb::Vector< NonzeroType > &x,
             const grb::Matrix< NonzeroType > &A,
             const grb::Vector< NonzeroType > &b,
             const size_t n_restart,
             const size_t max_iterations,
             const ResidualType tol,
             size_t &iterations,
             size_t &iterations_gmres,
             size_t &iterations_arnoldi,
             ResidualType &residual,
             std::vector< grb::Vector< NonzeroType > > &Q,
             std::vector< NonzeroType > &Hmatrix,
             grb::Vector< NonzeroType > &temp,
             std::vector< NonzeroType > &temp3,
             const Ring &ring = Ring(),
             const Minus &minus = Minus(),
             const Divide &divide = Divide(),
             const std::function< ResidualType( ResidualType ) > &sqrtX =
                 std_sqrt< ResidualType, ResidualType >
         ) {
             // placeholder only: the dispatcher's signature requires a matrix in
             // the preconditioner position
             grb::Matrix< NonzeroType > empty_preconditioner( 0, 0 );
             const grb::RC status = internal::gmres_dispatch< descr, true >(
                 x, A, b,
                 n_restart, max_iterations, tol,
                 iterations, iterations_gmres, iterations_arnoldi, residual,
                 Q, Hmatrix, temp, temp3,
                 empty_preconditioner,
                 ring, minus, divide, sqrtX
             );
             return status;
         }

         /**
          * GMRES with a user-supplied preconditioner.
          *
          * Forwards every argument to internal::gmres_dispatch with its
          * \a no_preconditioning template argument set to <tt>false</tt>. Note
          * that, unlike in the dispatcher, the preconditioner \a M precedes \a A
          * in this function's argument list.
          *
          * @param[in,out] x   Solution vector, passed on as-is.
          * @param[in] M       Preconditioner.
          * @param[in] A       System matrix.
          * @param[in] b       Right-hand side.
          * @param[in] n_restart, max_iterations, tol Iteration controls.
          * @param[out] iterations, iterations_gmres, iterations_arnoldi, residual
          *                    Statistics written by the dispatcher.
          * @param[in,out] Q, Hmatrix, temp, temp3 Workspace.
          * @param[in] ring, minus, divide, sqrtX Algebraic structures and the
          *                    square-root function.
          *
          * @returns Whatever internal::gmres_dispatch returns.
          */
         template<
             Descriptor descr = descriptors::no_operation,
             typename NonzeroType,
             typename ResidualType,
             class Ring = Semiring<
                 grb::operators::add< NonzeroType >, grb::operators::mul< NonzeroType >,
                 grb::identities::zero, grb::identities::one
             >,
             class Minus = operators::subtract< NonzeroType >,
             class Divide = operators::divide< NonzeroType >
         >
         grb::RC preconditioned_gmres(
             grb::Vector< NonzeroType > &x,
             const grb::Matrix< NonzeroType > &M,
             const grb::Matrix< NonzeroType > &A,
             const grb::Vector< NonzeroType > &b,
             const size_t n_restart,
             const size_t max_iterations,
             const ResidualType tol,
             size_t &iterations,
             size_t &iterations_gmres,
             size_t &iterations_arnoldi,
             ResidualType &residual,
             std::vector< grb::Vector< NonzeroType > > &Q,
             std::vector< NonzeroType > &Hmatrix,
             grb::Vector< NonzeroType > &temp,
             std::vector< NonzeroType > &temp3,
             const Ring &ring = Ring(),
             const Minus &minus = Minus(),
             const Divide &divide = Divide(),
             const std::function< ResidualType( ResidualType ) > &sqrtX =
                 std_sqrt< ResidualType, ResidualType >
         ) {
             // the dispatcher expects the preconditioner after the workspace
             const grb::RC status = internal::gmres_dispatch< descr, false >(
                 x, A, b,
                 n_restart, max_iterations, tol,
                 iterations, iterations_gmres, iterations_arnoldi, residual,
                 Q, Hmatrix, temp, temp3,
                 M,
                 ring, minus, divide, sqrtX
             );
             return status;
         }


     } // namespace algorithms

 } // end namespace grb

 #endif // end _H_GRB_ALGORITHMS_GMRES

grb::algorithms::gmres
grb::RC gmres(grb::Vector< NonzeroType > &x, const grb::Matrix< NonzeroType > &A, const grb::Vector< NonzeroType > &b, const size_t n_restart, const size_t max_iterations, const ResidualType tol, size_t &iterations, size_t &iterations_gmres, size_t &iterations_arnoldi, ResidualType &residual, std::vector< grb::Vector< NonzeroType > > &Q, std::vector< NonzeroType > &Hmatrix, grb::Vector< NonzeroType > &temp, std::vector< NonzeroType > &temp3, const Ring &ring=Ring(), const Minus &minus=Minus(), const Divide &divide=Divide(), const std::function< ResidualType(ResidualType) > &sqrtX=std_sqrt< ResidualType, ResidualType >)
Solves a linear system \(b = Ax\) with \(x\) unknown using the Generalised Minimal Residual (GMRES) method on genera...
Definition: gmres.hpp:967

grb::identities::zero
Standard identity for numerical addition.
Definition: identities.hpp:57

grb::ILLEGAL
A call to a primitive has determined that one of its arguments was illegal as per the specification o...
Definition: rc.hpp:143

grb::Matrix
An ALP/GraphBLAS matrix.
Definition: matrix.hpp:72

grb::RC
RC
Return codes of ALP primitives.
Definition: rc.hpp:47

grb::Vector
A GraphBLAS vector.
Definition: vector.hpp:64

grb::identities::one
Standard identity for numerical multiplication.
Definition: identities.hpp:79

grb::operators::subtract
Numerical subtraction of two numbers.
Definition: ops.hpp:301

grb::algorithms::preconditioned_gmres
grb::RC preconditioned_gmres(grb::Vector< NonzeroType > &x, const grb::Matrix< NonzeroType > &M, const grb::Matrix< NonzeroType > &A, const grb::Vector< NonzeroType > &b, const size_t n_restart, const size_t max_iterations, const ResidualType tol, size_t &iterations, size_t &iterations_gmres, size_t &iterations_arnoldi, ResidualType &residual, std::vector< grb::Vector< NonzeroType > > &Q, std::vector< NonzeroType > &Hmatrix, grb::Vector< NonzeroType > &temp, std::vector< NonzeroType > &temp3, const Ring &ring=Ring(), const Minus &minus=Minus(), const Divide &divide=Divide(), const std::function< ResidualType(ResidualType) > &sqrtX=std_sqrt< ResidualType, ResidualType >)
Solves a linear system \(b = Ax\) with \(x\) unknown using the Generalised Minimal Residual (GMRES) method on genera...
Definition: gmres.hpp:1120

grb::algorithms::hessolve
grb::RC hessolve(std::vector< NonzeroType > &H, const DimensionType n, const DimensionType &kspspacesize, const ResidualType tol, std::vector< NonzeroType > &vecx, const Ring &ring=Ring(), const Minus &minus=Minus(), const Divide &divide=Divide(), const std::function< ResidualType(ResidualType) > &sqrtX=std_sqrt< ResidualType, ResidualType >)
Solves the linear least-squares problem of size n - 1, defined by the equation \(H[1:n]\,x = H[0]\) where the \(H[1:n]\) is an upper...
Definition: gmres.hpp:146

grb::SEQUENTIAL
Sequential mode IO.
Definition: iomode.hpp:75

grb::nnz
size_t nnz(const Vector< DataType, backend, Coords > &x) noexcept
Request the number of nonzeroes in a given vector.
Definition: io.hpp:479

grb::descriptors::no_operation
static constexpr Descriptor no_operation
Indicates no additional pre- or post-processing on any of the GraphBLAS function arguments.
Definition: descriptors.hpp:63

grb::operators::mul
This operator multiplies the two input parameters and writes the result to the output variable.
Definition: ops.hpp:208

grb::Descriptor
unsigned int Descriptor
Descriptors indicate pre- or post-processing for some or all of the arguments to an ALP/GraphBLAS cal...
Definition: descriptors.hpp:54

grb::nrows
size_t nrows(const Matrix< InputType, backend, RIT, CIT, NIT > &A) noexcept
Requests the row size of a given matrix.
Definition: io.hpp:286

grb::descriptors::dense
static constexpr Descriptor dense
Indicates that all input and output vectors to an ALP/GraphBLAS primitive are structurally dense.
Definition: descriptors.hpp:151

norm.hpp
Implements the 2-norm.

grb::ncols
size_t ncols(const Matrix< InputType, backend, RIT, CIT, NIT > &A) noexcept
Requests the column size of a given matrix.
Definition: io.hpp:339

grb::operators::conjugate_right_mul
Conjugate-multiply operator that conjugates the right-hand operand before multiplication.
Definition: ops.hpp:918

grb::foldl
RC foldl(IOType &x, const Vector< InputType, backend, Coords > &y, const Vector< MaskType, backend, Coords > &mask, const Monoid &monoid=Monoid(), const typename std::enable_if< !grb::is_object< IOType >::value &&!grb::is_object< InputType >::value &&!grb::is_object< MaskType >::value &&grb::is_monoid< Monoid >::value, void >::type *const =nullptr)
Reduces, or folds, a vector into a scalar.
Definition: blas1.hpp:3840

grb::FAILED
Indicates when one of the grb::algorithms has failed to achieve its intended result,...
Definition: rc.hpp:154

grb::operators::add
This operator takes the sum of the two input parameters and writes it to the output variable.
Definition: ops.hpp:175

grb
The ALP/GraphBLAS namespace.
Definition: graphblas.hpp:477

graphblas.hpp
The main header to include in order to use the ALP/GraphBLAS API.

grb::size
size_t size(const Vector< DataType, backend, Coords > &x) noexcept
Request the size of a given vector.
Definition: io.hpp:235

grb::operators::divide
Numerical division of two numbers.
Definition: ops.hpp:328

grb::SUCCESS
Indicates the primitive has executed successfully.
Definition: rc.hpp:54

grb::capacity
size_t capacity(const Vector< InputType, backend, Coords > &x) noexcept
Queries the capacity of the given ALP/GraphBLAS container.
Definition: io.hpp:388

grb::Semiring
A generalised semiring.
Definition: semiring.hpp:190

grb::MISMATCH
One or more of the ALP/GraphBLAS objects passed to the primitive that returned this error have mismat...
Definition: rc.hpp:90