alp/user/bicgstab_8hpp_source.html

/*

 *   Copyright 2021 Huawei Technologies Co., Ltd.

 *

 * Licensed under the Apache License, Version 2.0 (the "License");

 * you may not use this file except in compliance with the License.

 * You may obtain a copy of the License at

 *

 *     http://www.apache.org/licenses/LICENSE-2.0

 *

 * Unless required by applicable law or agreed to in writing, software

 * distributed under the License is distributed on an "AS IS" BASIS,

 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

 * See the License for the specific language governing permissions and

 * limitations under the License.

 */


#ifndef _H_GRB_ALGORITHMS_BICGSTAB

#define _H_GRB_ALGORITHMS_BICGSTAB


#include <graphblas.hpp>


#include <iostream>

#include <type_traits>


#ifdef _DEBUG

 #include <cmath> // for sqrt, making the silent assumption that ResidualType

                  // is a supported type for it

#endif


namespace grb {

    namespace algorithms {

        /**
         * Solves the linear system \f$ Ax = b \f$ for \f$ x \f$ using the
         * bi-conjugate gradient stabilised (BiCGstab) method.
         *
         * Convergence is tested on squared quantities so that no square root is
         * needed: the user tolerance \a tol is turned into the effective
         * tolerance \f$ tol^2 \cdot (b,b) \f$ and compared against the squared
         * two-norm of the running residual.
         *
         * @tparam descr        Descriptor forwarded to the ALP primitives. The
         *                      #grb::descriptors::dense descriptor is added
         *                      internally for primitives operating on vectors
         *                      that are known to be dense at that point.
         * @tparam IOType       Element type of the solution vector \a x.
         * @tparam NonzeroType  Element type of the matrix \a A.
         * @tparam InputType    Element type of \a b and of all workspace vectors.
         * @tparam ResidualType Type of the tolerance, the residual, and all
         *                      scalars of the iteration. Must be floating-point.
         * @tparam Semiring     Semiring providing addition and multiplication.
         * @tparam Minus        Operator used for subtraction.
         * @tparam Divide       Operator used for division.
         *
         * @param[in,out] x     On input, the initial guess. On output, the last
         *                      computed iterate. If \a x is not structurally
         *                      dense, its missing entries are set to zero first.
         * @param[in]  A        The system matrix; must be square (n by n).
         * @param[in]  b        The right-hand side of size n; may be sparse.
         * @param[in]  max_iterations Maximum number of iterations to perform.
         * @param[in]  tol      Relative tolerance; must be strictly positive.
         * @param[out] iterations Set to zero once argument checks pass and
         *                      incremented at the end of every iteration that
         *                      neither converged nor failed. Hence it equals the
         *                      zero-based index of the iteration in which this
         *                      function returned from within the loop, or
         *                      \a max_iterations if the loop ran to completion.
         * @param[out] residual The \em squared two-norm of the last computed
         *                      residual.
         * @param[in,out] r     Workspace of size and capacity n (residual).
         * @param[in,out] rhat  Workspace of size and capacity n (shadow residual).
         * @param[in,out] p     Workspace of size and capacity n (search direction).
         * @param[in,out] v     Workspace of size and capacity n (holds Ap).
         * @param[in,out] s     Workspace of size and capacity n.
         * @param[in,out] t     Workspace of size and capacity n (holds Ax or As).
         * @param[in]  semiring The semiring instance to use.
         * @param[in]  minus    The subtraction operator instance to use.
         * @param[in]  divide   The division operator instance to use.
         *
         * The previous contents of all workspace vectors are overwritten.
         *
         * @returns #grb::SUCCESS  If the squared residual dropped below the
         *                         effective tolerance.
         * @returns #grb::MISMATCH If \a A is not square, or if the size of any
         *                         vector argument differs from n.
         * @returns #grb::ILLEGAL  If the capacity of \a x or of any workspace
         *                         vector differs from n, or if \a tol is not
         *                         strictly positive.
         * @returns #grb::FAILED   If the method broke down (one of the inner
         *                         products (rhat,r), (rhat,Ap), or (As,s) was
         *                         zero), or if no convergence was detected within
         *                         \a max_iterations iterations.
         * @returns Any other error code returned by an underlying ALP primitive.
         *
         * \note If \a b has zero norm, the effective tolerance is zero and the
         *       strict comparisons against it cannot succeed.
         */
        template<
            Descriptor descr = descriptors::no_operation,
            typename IOType, typename NonzeroType, typename InputType,
            typename ResidualType,
            class Semiring = Semiring<
                operators::add< InputType, InputType, InputType >,
                operators::mul< IOType, NonzeroType, InputType >,
                identities::zero, identities::one
            >,
            class Minus = operators::subtract< ResidualType >,
            class Divide = operators::divide< ResidualType >
        >
        RC bicgstab(
            grb::Vector< IOType > &x,
            const grb::Matrix< NonzeroType > &A,
            const grb::Vector< InputType > &b,
            const size_t max_iterations,
            ResidualType tol,
            size_t &iterations,
            ResidualType &residual,
            Vector< InputType > &r,
            Vector< InputType > &rhat,
            Vector< InputType > &p,
            Vector< InputType > &v,
            Vector< InputType > &s,
            Vector< InputType > &t,
            const Semiring &semiring = Semiring(),
            const Minus &minus = Minus(),
            const Divide &divide = Divide()
        ) {
            // static checks
            static_assert( !( descr & descriptors::no_casting ) || (
                    std::is_same< IOType, NonzeroType >::value &&
                    std::is_same< IOType, InputType >::value &&
                    std::is_same< IOType, ResidualType >::value
                ), "no_casting descriptor was set but containers with differing domains "
                "were given."
            );
            static_assert( !( descr & descriptors::no_casting ) || (
                    std::is_same< NonzeroType, typename Semiring::D1 >::value &&
                    std::is_same< IOType, typename Semiring::D2 >::value &&
                    std::is_same< InputType, typename Semiring::D3 >::value &&
                    std::is_same< InputType, typename Semiring::D4 >::value
                ), "no_casting descriptor was set, but semiring has incompatible domains "
                "with the given containers."
            );
            static_assert( !( descr & descriptors::no_casting ) || (
                    std::is_same< InputType, typename Minus::D1 >::value &&
                    std::is_same< InputType, typename Minus::D2 >::value &&
                    std::is_same< InputType, typename Minus::D3 >::value
                ), "no_casting descriptor was set, but given minus operator has "
                "incompatible domains with the given containers."
            );
            static_assert( !( descr & descriptors::no_casting ) || (
                    std::is_same< ResidualType, typename Divide::D1 >::value &&
                    std::is_same< ResidualType, typename Divide::D2 >::value &&
                    std::is_same< ResidualType, typename Divide::D3 >::value
                ), "no_casting descriptor was set, but given divide operator has "
                "incompatible domains with the given tolerance type."
            );
            static_assert( std::is_floating_point< ResidualType >::value,
                "Require floating-point residual type."
            );

#ifdef _DEBUG
            std::cout << "Entering bicgstab; "
                << "tol = " << tol << ", "
                << "max_iterations = " << max_iterations << "\n";
#endif

            // descriptor for indicating dense computations
            constexpr Descriptor dense_descr = descr | descriptors::dense;

            // get an alias to zero and one in case 1 and 0 can't cast properly
            const ResidualType zero = semiring.template getZero< ResidualType >();
            const ResidualType one  = semiring.template getOne< ResidualType >();

            // dynamic checks, sizes:
            const size_t n = nrows( A );
            if( n != ncols( A ) ) {
                return MISMATCH;
            }
            if( n != size( x ) ) {
                return MISMATCH;
            }
            if( n != size( b ) ) {
                return MISMATCH;
            }
            // every one of the six workspace vectors must match, including v
            if( n != size( r ) || n != size( rhat ) || n != size( p ) ||
                n != size( v ) || n != size( s ) || n != size( t )
            ) {
                return MISMATCH;
            }

            // dynamic checks, capacity:
            if( n != capacity( x ) ) {
                return ILLEGAL;
            }
            if( n != capacity( r ) || n != capacity( rhat ) || n != capacity( p ) ||
                n != capacity( v ) || n != capacity( s ) || n != capacity( t )
            ) {
                return ILLEGAL;
            }

            // dynamic checks, others:
            if( tol <= zero ) {
                return ILLEGAL;
            }

#ifdef _DEBUG
            std::cout << "\t dynamic run-time error checking passed\n";
#endif

            // no iteration has been performed yet; set this early so that the
            // output is well-defined also when the initial guess already suffices
            iterations = 0;

            // prelude
            ResidualType b_norm_squared = zero;
            RC ret = dot< dense_descr >( b_norm_squared, b, b, semiring );
            if( ret ) {
                std::cerr << "Error: BiCGstab encountered \"" << toString(ret)
                    << "\" during computation of the norm of b\n";
                return ret;
            }

            // make it so that we do not need to take square roots when detecting
            // convergence
            tol *= tol;
            tol *= b_norm_squared;
#ifdef _DEBUG
            std::cout << "Effective squared relative tolerance is " << tol << "\n";
#endif

            // ensure that x is structurally dense: using x as its own inverted
            // structural mask writes zero only at positions without an entry
            if( nnz( x ) != n ) {
                ret = grb::set< descriptors::invert_mask | descriptors::structural >(
                    x, x, zero
                );
                assert( ret != SUCCESS || nnz( x ) == n );
            }

            // compute residual (squared), taking into account that b may be sparse
            residual = zero;
            ret = ret ? ret : set( t, zero );                                   // t = Ax
            ret = ret ? ret : mxv< dense_descr >( t, A, x, semiring );
            assert( ret != SUCCESS || nnz( t ) == n );
            ret = ret ? ret : set( r, zero );                               // r = b - Ax
            ret = ret ? ret : foldl( r, b, semiring.getAdditiveMonoid() );
            assert( ret != SUCCESS || nnz( r ) == n );
            ret = ret ? ret : foldl< dense_descr >( r, t, minus );
            ret = ret ? ret : dot< dense_descr >( residual, r, r, semiring ); // residual

            // check for prelude error
            if( ret ) {
                std::cerr << "Error: BiCGstab encountered \"" << toString(ret)
                    << "\" during prelude\n";
                return ret;
            }

            // check if the guess was good enough
            if( residual < tol ) {
                return SUCCESS;
            }

#ifdef _DEBUG
            std::cout << "\t prelude completed\n";
#endif

            // start iterations
            ret = ret ? ret : set( rhat, r );
            ret = ret ? ret : set( p, zero );
            ret = ret ? ret : set( v, zero );
            ResidualType rho, rho_old, alpha, beta, omega, temp;
            rho_old = alpha = omega = one;

            for( ; ret == SUCCESS && iterations < max_iterations; ++iterations ) {

#ifdef _DEBUG
                std::cout << "\t iteration " << iterations << " starts\n";
#endif

                // rho = ( rhat, r )
                rho = zero;
                ret = ret ? ret : dot< dense_descr >( rho, rhat, r, semiring );
#ifdef _DEBUG
                std::cout << "\t\t rho = " << rho << "\n";
#endif
                if( ret == SUCCESS && rho == zero ) {
                    std::cerr << "Error: BiCGstab detects r at iteration " << iterations <<
                        " is orthogonal to r-hat\n";
                    return FAILED;
                }

                // beta = (rho / rho_old) * (alpha / omega)
                ret = ret ? ret : apply( beta, rho, rho_old, divide );
                ret = ret ? ret : apply( temp, alpha, omega, divide );
                ret = ret ? ret : foldl( beta, temp, semiring.getMultiplicativeOperator() );
#ifdef _DEBUG
                std::cout << "\t\t beta = " << beta << "\n";
#endif

                // p = r + beta ( p - omega * v )
                ret = ret ? ret : eWiseLambda(
                    [&r,beta,&p,&v,omega,&semiring,&minus] (const size_t i) {
                        InputType tmp;
                        // tmp = omega * v[i]
                        apply( tmp, omega, v[i], semiring.getMultiplicativeOperator() );
                        // p[i] = p[i] - tmp
                        foldl( p[ i ], tmp, minus );
                        // p[i] = beta * p[i]
                        foldr( beta, p[ i ], semiring.getMultiplicativeOperator() );
                        // p[i] = r[i] + p[i]
                        foldr( r[ i ], p[ i ], semiring.getAdditiveOperator() );
                    }, v, p, r
                );

                // v = Ap
                ret = ret ? ret : set( v, zero );
                ret = ret ? ret : mxv< dense_descr >( v, A, p, semiring );

                // alpha = rho / (rhat, v)
                alpha = zero;
                ret = ret ? ret : dot< dense_descr >( alpha, rhat, v, semiring );
                // only diagnose a breakdown if (rhat, v) was actually computed;
                // otherwise alpha is still the zero it was reset to above and the
                // pending error code must be reported instead
                if( ret == SUCCESS && alpha == zero ) {
                    std::cerr << "Error: BiCGstab detects rhat is orthogonal to v=Ap "
                        << "at iteration " << iterations << ".\n";
                    return FAILED;
                }
                // foldr computes alpha = rho / alpha
                ret = ret ? ret : foldr( rho, alpha, divide );
#ifdef _DEBUG
                std::cout << "\t\t alpha = " << alpha << "\n";
#endif

                // x += alpha * p is post-poned to either the pre-stabilisation exit, or
                // after the stabilisation step

                // s = r - alpha * v
                {
                    ResidualType minus_alpha = zero;
                    ret = ret ? ret : foldl( minus_alpha, alpha, minus );
                    ret = ret ? ret : set( s, r );
                    ret = ret ? ret : eWiseMul< dense_descr >( s, minus_alpha, v, semiring );
                }

                // check residual
                residual = zero;
                ret = ret ? ret : dot< dense_descr >( residual, s, s, semiring );
                // a zero residual is legal (exact convergence), and nothing can be
                // said about the residual if a primitive failed
                assert( ret != SUCCESS || residual >= zero );
#ifdef _DEBUG
                std::cout << "\t\t running residual, pre-stabilisation: " << std::sqrt(residual)
                    << "\n";
#endif
                if( ret == SUCCESS && residual < tol ) {
                    // update result (x += alpha * p) and exit
                    ret = eWiseMul< dense_descr >( x, alpha, p, semiring );
                    return ret;
                }

                // t = As
                ret = ret ? ret : set( t, zero );
                ret = ret ? ret : mxv< dense_descr >( t, A, s, semiring );

                // omega = (t, s) / (t, t);
                omega = temp = zero;
                ret = ret ? ret : dot< dense_descr >( temp, t, s, semiring );
#ifdef _DEBUG
                std::cout << "\t\t (t, s) = " << temp << "\n";
#endif
                if( ret == SUCCESS && temp == zero ) {
                    std::cerr << "Error: BiCGstab detects As at iteration " << iterations <<
                        " is orthogonal to s\n";
                    return FAILED;
                }
                ret = ret ? ret : dot< dense_descr >( omega, t, t, semiring );
#ifdef _DEBUG
                std::cout << "\t\t (t, t) = " << omega << "\n";
#endif
                assert( ret != SUCCESS || omega > zero );
                // foldr computes omega = temp / omega
                ret = ret ? ret : foldr( temp, omega, divide );
#ifdef _DEBUG
                std::cout << "\t\t omega = " << omega << "\n";
#endif

                // x += alpha * p + omega * s
                ret = ret ? ret : eWiseMul< dense_descr >( x, alpha, p, semiring );
                ret = ret ? ret : eWiseMul< dense_descr >( x, omega, s, semiring );

                // r = s - omega * t
                {
                    ResidualType minus_omega = zero;
                    ret = ret ? ret : foldl( minus_omega, omega, minus );
                    ret = ret ? ret : set( r, s );
                    ret = ret ? ret : eWiseMul< dense_descr >( r, minus_omega, t, semiring );
                }

                // check residual
                residual = zero;
                ret = ret ? ret : dot< dense_descr >( residual, r, r, semiring );
                assert( ret != SUCCESS || residual >= zero );
#ifdef _DEBUG
                std::cout << "\t\t running residual, post-stabilisation: "
                    << std::sqrt(residual) << ". "
                    << "Residual squared: " << residual << ".\n";
#endif
                if( ret == SUCCESS ) {
                    if( residual < tol ) {
                        return SUCCESS;
                    }

                    // go to next iteration
                    rho_old = rho;
                }
            }

            if( ret == SUCCESS ) {
                // if we are here, then we did not detect convergence
                std::cerr << "Warning: call to BiCGstab did not converge within "
                    << max_iterations << " iterations. Squared two-norm of the running "
                    << "residual is " << residual << ". "
                    << "Target residual squared: " << tol << ".\n";
                return FAILED;
            } else {
                // if we are here, we exited due to an ALP error code
                std::cerr << "Error: BiCGstab encountered error \"" << toString(ret)
                    << "\" while iterating to " << iterations << ", ";
                if( iterations == max_iterations ) {
                    std::cerr << "which also is the maximum number of iterations.\n";
                } else {
                    std::cerr << "which is below the maximum number of iterations of "
                        << max_iterations << "\n";
                }
                return ret;
            }
        }

    }

}


#endif // end _H_GRB_ALGORITHMS_BICGSTAB


grb::Matrix
An ALP/GraphBLAS matrix.
Definition: matrix.hpp:71

grb::Semiring
A generalised semiring.
Definition: semiring.hpp:186

grb::Vector
A GraphBLAS vector.
Definition: vector.hpp:64

graphblas.hpp
The main header to include in order to use the ALP/GraphBLAS API.

grb::apply
static enum RC apply(OutputType &out, const InputType1 &x, const InputType2 &y, const OP &op=OP(), const typename std::enable_if< grb::is_operator< OP >::value &&!grb::is_object< InputType1 >::value &&!grb::is_object< InputType2 >::value &&!grb::is_object< OutputType >::value, void >::type *=nullptr)
Out-of-place application of the operator OP on two data elements.
Definition: blas0.hpp:179

grb::foldr
RC foldr(const Vector< InputType, backend, Coords > &x, const Vector< MaskType, backend, Coords > &mask, IOType &y, const Monoid &monoid=Monoid(), const typename std::enable_if< !grb::is_object< IOType >::value &&!grb::is_object< InputType >::value &&!grb::is_object< MaskType >::value &&grb::is_monoid< Monoid >::value, void >::type *const =nullptr)
Folds a vector into a scalar, right-to-left.
Definition: blas1.hpp:3943

grb::eWiseLambda
RC eWiseLambda(const Func f, const Vector< DataType, backend, Coords > &x, Args...)
Executes an arbitrary element-wise user-defined function f on any number of vectors of equal length.
Definition: blas1.hpp:3746

grb::foldl
RC foldl(IOType &x, const Vector< InputType, backend, Coords > &y, const Vector< MaskType, backend, Coords > &mask, const Monoid &monoid=Monoid(), const typename std::enable_if< !grb::is_object< IOType >::value &&!grb::is_object< InputType >::value &&!grb::is_object< MaskType >::value &&grb::is_monoid< Monoid >::value, void >::type *const =nullptr)
Reduces, or folds, a vector into a scalar.
Definition: blas1.hpp:3840

grb::set
RC set(Vector< DataType, backend, Coords > &x, const T val, const Phase &phase=EXECUTE, const typename std::enable_if< !grb::is_object< DataType >::value &&!grb::is_object< T >::value, void >::type *const =nullptr) noexcept
Sets all elements of a vector to the given value.
Definition: io.hpp:857

grb::nnz
size_t nnz(const Vector< DataType, backend, Coords > &x) noexcept
Request the number of nonzeroes in a given vector.
Definition: io.hpp:479

grb::size
size_t size(const Vector< DataType, backend, Coords > &x) noexcept
Request the size of a given vector.
Definition: io.hpp:235

grb::ncols
size_t ncols(const Matrix< InputType, backend, RIT, CIT, NIT > &A) noexcept
Requests the column size of a given matrix.
Definition: io.hpp:339

grb::capacity
size_t capacity(const Vector< InputType, backend, Coords > &x) noexcept
Queries the capacity of the given ALP/GraphBLAS container.
Definition: io.hpp:388

grb::nrows
size_t nrows(const Matrix< InputType, backend, RIT, CIT, NIT > &A) noexcept
Requests the row size of a given matrix.
Definition: io.hpp:286

grb::algorithms::bicgstab
RC bicgstab(grb::Vector< IOType > &x, const grb::Matrix< NonzeroType > &A, const grb::Vector< InputType > &b, const size_t max_iterations, ResidualType tol, size_t &iterations, ResidualType &residual, Vector< InputType > &r, Vector< InputType > &rhat, Vector< InputType > &p, Vector< InputType > &v, Vector< InputType > &s, Vector< InputType > &t, const Semiring &semiring=Semiring(), const Minus &minus=Minus(), const Divide &divide=Divide())
Solves a linear system $b = Ax$ with $x$ unknown by using the bi-conjugate gradient (bi-CG) stabilised method; i...
Definition: bicgstab.hpp:166

grb::descriptors::no_casting
static constexpr Descriptor no_casting
Disallows the standard casting of input parameters to a compatible domain in case they did not match ...
Definition: descriptors.hpp:196

grb::descriptors::no_operation
static constexpr Descriptor no_operation
Indicates no additional pre- or post-processing on any of the GraphBLAS function arguments.
Definition: descriptors.hpp:63

grb::descriptors::dense
static constexpr Descriptor dense
Indicates that all input and output vectors to an ALP/GraphBLAS primitive are structurally dense.
Definition: descriptors.hpp:151

grb
The ALP/GraphBLAS namespace.
Definition: graphblas.hpp:452

grb::RC
RC
Return codes of ALP primitives.
Definition: rc.hpp:47

grb::ILLEGAL
@ ILLEGAL
A call to a primitive has determined that one of its arguments was illegal as per the specification o...
Definition: rc.hpp:143

grb::MISMATCH
@ MISMATCH
One or more of the ALP/GraphBLAS objects passed to the primitive that returned this error have mismat...
Definition: rc.hpp:90

grb::SUCCESS
@ SUCCESS
Indicates the primitive has executed successfully.
Definition: rc.hpp:54

grb::FAILED
@ FAILED
Indicates when one of the grb::algorithms has failed to achieve its intended result,...
Definition: rc.hpp:154

grb::Descriptor
unsigned int Descriptor
Descriptors indicate pre- or post-processing for some or all of the arguments to an ALP/GraphBLAS cal...
Definition: descriptors.hpp:54

grb::toString
std::string toString(const RC code)