df/d38/BICRS_8hpp_source.html

 /*

  * Copyright (c) 2007-2014, A. N. Yzelman,   Utrecht University 2007-2011;

  *                                                    KU Leuven 2011-2014.

  *                          R. H. Bisseling, Utrecht University 2007-2014.

  *

  * This file is part of the Sparse Library.

  *

  * This library was developed under supervision of Prof. dr. Rob H. Bisseling at

  * Utrecht University, from 2007 until 2011. From 2011-2014, development continued

  * at KU Leuven, where Prof. dr. Dirk Roose contributed significantly to the ideas

  * behind the newer parts of the library code.

  *

  *     The Sparse Library is free software: you can redistribute it and/or modify

  *     it under the terms of the GNU General Public License as published by the

  *     Free Software Foundation, either version 3 of the License, or (at your

  *     option) any later version.

  *

  *     The Sparse Library is distributed in the hope that it will be useful, but

  *     WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY

  *     or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License

  *     for more details.

  *

  *     You should have received a copy of the GNU General Public License along

  *     with the Sparse Library. If not, see <http://www.gnu.org/licenses/>.

  */


 /*

  * File created by:

  *     A. N. Yzelman, Dept. of Mathematics, Utrecht University, 2008.

  */


 #include "SparseMatrix.hpp"

 #include <assert.h>

 #include <iostream>


 //Set when in debug mode

 //#define _DEBUG


 #ifndef _H_BICRS

 #define _H_BICRS


 /**
  *  Bi-directional Incremental Compressed Row Storage scheme.
  *
  *  Nonzeroes are kept in the order in which they were supplied to load().
  *  Instead of absolute indices, the scheme stores increments:
  *   - c_inc[ k ] is the column difference between nonzero k+1 and nonzero k.
  *     Whenever nonzero k+1 lives on another row than nonzero k, ntt is added
  *     on top so that the column cursor overflows past the end of the vector;
  *     the multiplication kernels use that overflow as the "row changed"
  *     signal. The last entry, c_inc[ nnz-1 ], is ntt (end-of-matrix signal).
  *   - r_inc[ j ] is the row difference of the j-th row change; one trailing
  *     zero entry is appended so that the final overflow applies a defined
  *     (null) row jump.
  *
  *  The object owns r_inc, c_inc and vals; copies are deep.
  *
  *  @tparam _t_value Type of the nonzero values.
  *  @tparam _i_value Type of the stored increments. It has to be signed, since
  *                   column and row differences may be negative.
  */
 template< typename _t_value, typename _i_value=LI >
 class BICRS: public SparseMatrix< _t_value, ULI > {

     protected:

         /** Stores the row start position. */
         ULI r_start;

         /** Stores the column start position. */
         ULI c_start;

         /** Stores the row end position. */
         ULI r_end;

         /** Stores the column end position. */
         ULI c_end;

         /** Stores the number of row jumps. */
         ULI jumps;

         /** Stores the row jumps; load() allocates jumps+1 entries. */
         _i_value* r_inc;

         /** Stores the column jumps; size is exactly the number of nonzeros. */
         _i_value* c_inc;

         /** Stores the values of the individual nonzeros. */
         _t_value* vals;

         /** Overflow increment added to c_inc on a row change; load() sets it to n. */
         _i_value ntt;

         /**
          *  Puts every field of this class in a defined, empty state WITHOUT
          *  freeing anything. Only meant for constructors, where the pointers
          *  still hold indeterminate values.
          */
         void clearState() {
             r_start = c_start = r_end = c_end = 0;
             jumps   = 0;
             r_inc   = c_inc = NULL;
             vals    = NULL;
             ntt     = 0;
         }

         /** Frees the three owned arrays and resets the pointers to NULL. */
         void releaseArrays() {
             delete [] r_inc;
             delete [] c_inc;
             delete [] vals;
             r_inc = c_inc = NULL;
             vals  = NULL;
         }

         /**
          *  Replaces the BICRS-specific state of this object by a deep copy of
          *  that of other. The base class part is NOT touched here.
          *
          *  Array sizes are taken to be those established by load():
          *  jumps+1 entries for r_inc, nnz entries for c_inc and vals.
          *
          *  @param other The matrix to copy from.
          */
         void copyFrom( const BICRS< _t_value, _i_value >& other ) {
             _i_value* new_r_inc = NULL;
             _i_value* new_c_inc = NULL;
             _t_value* new_vals  = NULL;
             if( other.vals != NULL ) {
                 const ULI nz = other.nnz;
                 new_r_inc = new _i_value[ other.jumps + 1 ];
                 new_c_inc = new _i_value[ nz ];
                 new_vals  = new _t_value[ nz ];
                 for( ULI i = 0; i <= other.jumps; ++i )
                     new_r_inc[ i ] = other.r_inc[ i ];
                 for( ULI i = 0; i < nz; ++i ) {
                     new_c_inc[ i ] = other.c_inc[ i ];
                     new_vals [ i ] = other.vals [ i ];
                 }
             }
             //only let go of the old arrays once the new ones are complete
             releaseArrays();
             r_inc   = new_r_inc;
             c_inc   = new_c_inc;
             vals    = new_vals;
             r_start = other.r_start;
             c_start = other.c_start;
             r_end   = other.r_end;
             c_end   = other.c_end;
             jumps   = other.jumps;
             ntt     = other.ntt;
         }

     public:

         /** Base destructor; frees the increment and value arrays. */
         virtual ~BICRS() {
             delete [] r_inc;
             delete [] c_inc;
             delete [] vals;
         }

         /** Base constructor; yields an empty matrix that owns no arrays. */
         BICRS() {
             clearState();
         }

         /**
          *  Constructs the matrix by handing the given file to
          *  SparseMatrix::loadFromFile.
          *
          *  @param file Name of the file to load from.
          *  @param zero The element considered to be zero.
          */
         BICRS( std::string file, _t_value zero = 0 ) {
             clearState();
             this->loadFromFile( file, zero );
         }

         /**
          *  Constructs the matrix from coordinate arrays; see the load()
          *  overload with the same parameters.
          */
         BICRS( _i_value* row, _i_value* col, _t_value* val, ULI m, ULI n, ULI nz, _t_value zero ) {
             clearState();
             this->load( row, col, val, m, n, nz, zero );
         }

         /**
          *  Constructs the matrix from a vector of triplets; see the load()
          *  overload with the same parameters.
          */
         BICRS( std::vector< Triplet< _t_value > >& input, ULI m, ULI n, _t_value zero = 0 ) {
             clearState();
             this->load( input, m, n, zero );
         }

         /**
          *  Copy constructor; performs a deep copy so that both objects own
          *  their arrays (the destructor frees them unconditionally).
          */
         BICRS( const BICRS< _t_value, _i_value >& other ) : SparseMatrix< _t_value, ULI >( other ) {
             clearState();
             copyFrom( other );
         }

         /** Copy assignment; deep, and safe under self-assignment. */
         BICRS< _t_value, _i_value >& operator=( const BICRS< _t_value, _i_value >& other ) {
             if( this != &other ) {
                 //clone the arrays first: if an allocation fails, *this is unchanged
                 copyFrom( other );
                 SparseMatrix< _t_value, ULI >::operator=( other );
             }
             return *this;
         }

         /**
          *  Rewrites the triplet vector into three temporary coordinate arrays
          *  and passes those on to the array-based load(). The temporaries are
          *  freed again before returning.
          *
          *  @param input The nonzeroes, in the order in which they are to be stored.
          *  @param m     Number of rows.
          *  @param n     Number of columns.
          *  @param zero  The element considered to be zero.
          */
         virtual void load( std::vector< Triplet< _t_value > >& input, ULI m, ULI n, _t_value zero ) {
             ULI nz = input.size();
             _i_value* row = new _i_value[ nz ];
             _i_value* col = new _i_value[ nz ];
             _t_value* val = new _t_value[ nz ];
             unsigned long int c = 0;
             typename std::vector< Triplet< _t_value > >::iterator it = input.begin();
             for( ; it!=input.end(); ++it, ++c ) {
                 row[ c ] = (*it).i();
                 col[ c ] = (*it).j();
                 val[ c ] = (*it).value;
             }
             load( row, col, val, m, n, nz, zero );
             //the array-based load must have copied the values, as val is freed below
             assert( vals != val );
             delete [] row;
             delete [] col;
             delete [] val;
         }

         /**
          *  Builds the incremental structure from coordinate arrays. The input
          *  arrays are only read; their contents are copied. Anything loaded
          *  previously is released.
          *
          *  @param row  Row index of each nonzero (nz entries).
          *  @param col  Column index of each nonzero (nz entries).
          *  @param val  Value of each nonzero (nz entries).
          *  @param m    Number of rows.
          *  @param n    Number of columns.
          *  @param nz   Number of nonzeroes.
          *  @param zero The element considered to be zero.
          */
         void load( _i_value* row, _i_value* col, _t_value* val, ULI m, ULI n, ULI nz, _t_value zero ) {
 #ifdef _DEBUG
             std::cerr << "Warning: _DEBUG flag set." << std::endl;
 #endif
             this->zero_element = zero;
             this->nnz = nz;
             this->nor = m;
             this->noc = n;
             this->ntt = n;
             jumps = 0;
             if( nz == 0 ) {
                 //empty matrix: own nothing, and keep the start/end positions defined
                 releaseArrays();
                 r_start = c_start = r_end = c_end = 0;
                 return; //done
             }

             //first pass: count the row changes to size r_inc
             _i_value prevrow = row[ 0 ];
             for( unsigned long int i=1; i<nz; i++ ) {
                 if( row[ i ] != prevrow )
                     jumps++;
                 prevrow = row[ i ];
             }
 #ifdef _DEBUG
             std::cout << jumps << " row jumps found." << std::endl;
 #endif
             //build into fresh arrays; the old ones are released only when done
             _i_value* const new_r_inc = new _i_value[ jumps + 1 ];
             _i_value* const new_c_inc = new _i_value[ nz ];
             _t_value* const new_vals  = new _t_value[ nz ];
             for( unsigned long int i=0; i<nz; ++i ) new_vals[i] = val[i];

             prevrow = row[ 0 ];
             //same type as the indices, so that large column indices are not truncated
             _i_value prevcol = col[ 0 ];

 #ifdef _DEBUG
             std::cout << "c_inc: " << prevcol << std::endl;
             std::cout << "r_inc: " << prevrow << std::endl;
 #endif
             //second pass: write the increments
             ULI c = 0;
             for( unsigned long int i=1; i<nz; i++ ) {
                 new_c_inc[ i-1 ] = col[ i ] - prevcol;
                 if( row[ i ] != prevrow ) {
                     //row change: force a column overflow and record the row jump
                     new_c_inc[ i-1 ] += ntt;
                     new_r_inc[ c++ ] = row[ i ] - prevrow;
 #ifdef _DEBUG
                     std::cout << "c_inc: " << ntt << std::endl;
                     std::cout << "r_inc: " << row[ i ] - prevrow << std::endl;
 #endif
                     prevrow = row[ i ];
                 }
 #ifdef _DEBUG
                 else
                     std::cout << "c_inc: " << col[ i ] - prevcol << std::endl;
 #endif
                 prevcol = col[ i ];
             }
             //overflow so to signal end of matrix
             new_c_inc[ nz - 1 ] = ntt;
             //initialise last row jump to zero (prevent undefined jump)
             new_r_inc[ c ] = 0;

             //commit
             releaseArrays();
             r_inc   = new_r_inc;
             c_inc   = new_c_inc;
             vals    = new_vals;
             r_start = row[ 0 ];
             c_start = col[ 0 ];
             r_end   = row[ nz - 1 ];
             c_end   = col[ nz - 1 ];

 #ifdef _DEBUG
             std::cout << "Construction done." << std::endl;
 #endif
         }

         /**
          *  Returns the first nonzero index, per reference.
          *
          *  @param row Set to the row start position.
          *  @param col Set to the column start position.
          */
         virtual void getFirstIndexPair( ULI &row, ULI &col ) {
             row = this->r_start;
             col = this->c_start;
         }

         /**
          *  Calculates y=xA, but does not allocate y itself. The products are
          *  added to whatever y_p already contains.
          *
          *  @param x_p Input vector; indexed by row.
          *  @param y_p Output vector; indexed by column.
          */
         virtual void zxa( const _t_value*__restrict__ x_p, _t_value*__restrict__ y_p ) {
             const _t_value * y              = y_p;
             _i_value *__restrict__ c_inc_p  = c_inc;
             _i_value *__restrict__ r_inc_p  = r_inc;
             _t_value *__restrict__ v_p      = vals;

 #if !defined( NDEBUG ) || defined( _DEBUG )
             const _t_value * x                              = x_p;
 #endif
 #ifndef NDEBUG
             const _t_value * const x_end                    = x+this->nor;
             const _i_value *__restrict__ const c_inc_end    = c_inc+this->nnz;
 #endif
             const _t_value * const y_end                    = y+this->noc;
             const _t_value *__restrict__ const v_end        = vals+this->nnz;

             y_p += this->c_start;
             x_p += this->r_start;
             while( v_p < v_end ) {
                 assert( y_p >= y );
                 assert( y_p <  y_end );
                 assert( v_p >= vals );
                 assert( v_p < v_end );
                 assert( x_p >= x );
                 assert( x_p < x_end );
                 assert( c_inc_p >= c_inc );
                 assert( c_inc_p <  c_inc_end );
                 assert( r_inc_p >= r_inc );
                 //handle one row; a column overflow ends it
                 while( y_p < y_end ) {
 #ifdef _DEBUG
                     std::cout << (x_p-x) << "," << (y_p-y) << " next increment: " << (*c_inc_p)<< std::endl;
 #endif
                     *y_p += *v_p++ * *x_p;
                     y_p += *c_inc_p++;
                 }
                 //undo the overflow and move to the next row
                 y_p -= ntt;
                 x_p += *r_inc_p++;
             }
         }

         /**
          *  Calculates y=Ax, but does not allocate y itself. The products are
          *  added to whatever y_p already contains.
          *
          *  @param x_p Input vector; indexed by column.
          *  @param y_p Output vector; indexed by row.
          */
         virtual void zax( const _t_value*__restrict__ x_p, _t_value*__restrict__ y_p ) {
             const _t_value * x              = x_p;
             _i_value *__restrict__ c_inc_p  = c_inc;
             _i_value *__restrict__ r_inc_p  = r_inc;
             _t_value *__restrict__ v_p      = vals;

 #if !defined( NDEBUG ) || defined( _DEBUG )
             const _t_value * y                              = y_p;
 #endif
 #ifndef NDEBUG
             const _t_value * const y_end                    = y+this->nor;
             const _i_value *__restrict__ const c_inc_end    = c_inc+this->nnz;
 #endif
             const _t_value * const x_end                    = x+this->noc;
             const _t_value *__restrict__ const v_end        = vals+this->nnz;

             x_p += c_start;
             y_p += r_start;
             while( v_p < v_end ) {
                 assert( y_p >= y );
                 assert( y_p <  y_end );
                 assert( v_p >= vals );
                 assert( v_p < v_end );
                 assert( x_p >= x );
                 assert( x_p < x_end );
                 assert( c_inc_p >= c_inc );
                 assert( c_inc_p <  c_inc_end );
                 assert( r_inc_p >= r_inc );
                 //handle one row; a column overflow ends it
                 while( x_p < x_end ) {
 #ifdef _DEBUG
                     std::cout << (y_p-y) << "," << (x_p-x) << " next increment: " << (*c_inc_p)<< std::endl;
 #endif
                     *y_p += *v_p++ * *x_p;
                      x_p += *c_inc_p++;
                 }
                 //undo the overflow and move to the next row
                 x_p -= ntt;
                 y_p += *r_inc_p++;
             }
         }

         /**
          *  Calculates y=Ax, but does not allocate y itself. The nonzeroes are
          *  visited alternately from the front and from the back of the
          *  storage until the two cursors meet, so that every nonzero is
          *  applied exactly once. The products are added to whatever y_f
          *  already contains.
          *
          *  @param x_f Input vector; indexed by column.
          *  @param y_f Output vector; indexed by row.
          */
         virtual void zax_fb( _t_value*__restrict__ x_f, _t_value*__restrict__ y_f ) {
             //nothing to add for an empty matrix (and no arrays to walk over)
             if( this->nnz == 0 ) return;

             const _t_value * const x        = x_f;
             const _t_value * const x_end    = x+this->noc;
             _t_value * const y              = y_f;
 #ifndef NDEBUG
             const _t_value * const y_end    = y+this->nor;
             const _i_value * const c_inc_end= c_inc+this->nnz;
             const _t_value * const v_end    = vals+this->nnz;
 #endif

             //forward cursor: starts at the first nonzero
             const _i_value * c_inc_f        = c_inc;
             const _i_value * r_inc_f        = r_inc;
             const _t_value * v_f            = vals;
             x_f += c_start;
             y_f += r_start;

             //backward cursor: starts at the last nonzero. The increment
             //pointers sit one past the entry that is to be undone next, i.e.
             //on the end-of-matrix column entry and on the trailing zero row
             //jump, neither of which is ever read by this cursor. The pointers
             //are not restrict-qualified: both cursors may write the same row.
             const _i_value * c_inc_b        = c_inc+this->nnz - 1;
             const _i_value * r_inc_b        = r_inc+this->jumps;
             const _t_value * v_b            = vals+this->nnz - 1;
             const _t_value * x_b            = x + c_end;
             _t_value       * y_b            = y + r_end;

             //number of nonzeroes not yet applied; equals v_b - v_f + 1
             ULI remaining = this->nnz;
             while( remaining > 0 ) {
                 assert( y_f >= y );
                 assert( y_f <  y_end );
                 assert( y_b >= y );
                 assert( y_b <  y_end );
                 assert( v_f >= vals );
                 assert( v_f <= v_b );
                 assert( v_b < v_end );
                 assert( x_f >= x );
                 assert( x_f < x_end );
                 assert( x_b >= x );
                 assert( x_b < x_end );
                 assert( c_inc_f >= c_inc );
                 assert( c_inc_f <  c_inc_end );
                 assert( c_inc_b >= c_inc );
                 assert( c_inc_b <  c_inc_end );
                 assert( r_inc_f >= r_inc );
                 assert( r_inc_b >= r_inc );
 #ifdef _DEBUG
                 std::cout << (y_f-y) << "," << (x_f-x) << " next increment: " << (*c_inc_f)<< std::endl;
 #endif
                 //forward step
                 *y_f += *v_f++ * *x_f;
                  x_f += *c_inc_f++;
                 if( x_f >= x_end ) {
                     x_f -= ntt;
                     y_f += *r_inc_f++;
                 }
                 if( --remaining == 0 ) break;

                 //backward step
                 *y_b += *v_b * *x_b;
                 if( --remaining == 0 ) break;

                 //move the backward cursor to the preceding nonzero by undoing
                 //the increment that led here. An increment larger than the
                 //current column can only stem from a row change (it then
                 //includes ntt), in which case the row jump is undone as well.
                 --v_b;
                 const _i_value step = *--c_inc_b;
                 if( step > ( x_b - x ) ) {
                     x_b += ntt - step;
                     y_b -= *--r_inc_b;
                 } else {
                     x_b -= step;
                 }
             }
         }

         /**
          *  Function to query the amount of storage required by this sparse matrix.
          *
          *  @return The size of four ULI fields, of nnz+jumps+1 increments and
          *          of nnz values, in bytes.
          */
         virtual size_t bytesUsed() {
             return sizeof( ULI ) * 4 + sizeof( _i_value ) * ( this->nnz + jumps + 1 ) + sizeof( _t_value ) * this->nnz;
         }

 };


 #endif


SparseMatrix< _t_value, ULI >::nnz
ULI nnz
Number of non-zeros.
Definition: SparseMatrix.hpp:58

BICRS::c_end
ULI c_end
Stores the column end position.
Definition: BICRS.hpp:72

BICRS::zxa
virtual void zxa(const _t_value *__restrict__ x_p, _t_value *__restrict__ y_p)
Calculates y=xA, but does not allocate y itself.
Definition: BICRS.hpp:236

BICRS::c_start
ULI c_start
Stores the column start position.
Definition: BICRS.hpp:66

BICRS::bytesUsed
virtual size_t bytesUsed()
Function to query the amount of storage required by this sparse matrix.
Definition: BICRS.hpp:382

BICRS
Bi-directional Incremental Compressed Row Storage scheme.
Definition: BICRS.hpp:58

BICRS::zax_fb
virtual void zax_fb(_t_value *__restrict__ x_f, _t_value *__restrict__ y_f)
Calculates y=Ax, but does not allocate y itself.
Definition: BICRS.hpp:322

SparseMatrix< _t_value, ULI >::m
virtual unsigned long int m()
Queries the number of rows this matrix contains.
Definition: SparseMatrix.hpp:107

BICRS::BICRS
BICRS()
Base constructor.
Definition: BICRS.hpp:99

BICRS::~BICRS
virtual ~BICRS()
Base destructor.
Definition: BICRS.hpp:92

SparseMatrix< _t_value, ULI >::loadFromFile
void loadFromFile(const std::string file, const _t_value zero=0)
Function which loads a matrix from a matrix market file.
Definition: SparseMatrix.hpp:89

SparseMatrix
Interface common to all sparse matrix storage schemes.
Definition: SparseMatrix.hpp:46

BICRS::BICRS
BICRS(std::vector< Triplet< _t_value > > &input, ULI m, ULI n, _t_value zero=0)
Base constructor.
Definition: BICRS.hpp:127

SparseMatrix< _t_value, ULI >::noc
ULI noc
Number of columns.
Definition: SparseMatrix.hpp:55

BICRS::r_start
ULI r_start
Stores the row start position.
Definition: BICRS.hpp:63

BICRS::load
void load(_i_value *row, _i_value *col, _t_value *val, ULI m, ULI n, ULI nz, _t_value zero)
Definition: BICRS.hpp:157

BICRS::load
virtual void load(std::vector< Triplet< _t_value > > &input, ULI m, ULI n, _t_value zero)
This function will rewrite the std::vector< Triplet > structure to one suitable for the other load fu...
Definition: BICRS.hpp:137

BICRS::BICRS
BICRS(_i_value *row, _i_value *col, _t_value *val, ULI m, ULI n, ULI nz, _t_value zero)
Base constructor.
Definition: BICRS.hpp:120

BICRS::r_inc
_i_value * r_inc
Stores the row jumps; size is at maximum the number of nonzeros.
Definition: BICRS.hpp:78

SparseMatrix< _t_value, ULI >::nor
ULI nor
Number of rows.
Definition: SparseMatrix.hpp:52

BICRS::zax
virtual void zax(const _t_value *__restrict__ x_p, _t_value *__restrict__ y_p)
Calculates y=Ax, but does not allocate y itself.
Definition: BICRS.hpp:279

BICRS::getFirstIndexPair
virtual void getFirstIndexPair(ULI &row, ULI &col)
Returns the first nonzero index, per reference.
Definition: BICRS.hpp:226

BICRS::c_inc
_i_value * c_inc
Stores the column jumps; size is exactly the number of nonzeros.
Definition: BICRS.hpp:81

SparseMatrix< _t_value, ULI >::zero_element
_t_value zero_element
The element considered to be zero.
Definition: SparseMatrix.hpp:63

BICRS::BICRS
BICRS(std::string file, _t_value zero=0)
Base constructor.
Definition: BICRS.hpp:105

SparseMatrix< _t_value, ULI >::n
virtual unsigned long int n()
Queries the number of columns this matrix contains.
Definition: SparseMatrix.hpp:115

BICRS::vals
_t_value * vals
Stores the values of the individual nonzeros.
Definition: BICRS.hpp:84

Triplet
A single triplet value.
Definition: Triplet.hpp:52

BICRS::ntt
_i_value ntt
Caches n times two.
Definition: BICRS.hpp:87

BICRS::jumps
ULI jumps
Stores the number of row jumps.
Definition: BICRS.hpp:75

BICRS::r_end
ULI r_end
Stores the row end position.
Definition: BICRS.hpp:69