precond.h
#include "dg/algorithm.h"
#pragma once

#include <vector>
#include <utility>
#include <algorithm>
#include <cmath>

#include <thrust/host_vector.h>
#include <cusp/array1d.h>
#include <cusp/csr_matrix.h>

namespace dg
{

namespace create
{

namespace detail
{
template<class T>
void sparsify( cusp::array1d<int, cusp::host_memory>& row_offsets,
    cusp::array1d<int, cusp::host_memory>& column_indices,
    cusp::array1d<T, cusp::host_memory>& values,
    const int i,
    const thrust::host_vector<T>& zw,
    const std::vector<int>& iz_zw,
    unsigned nnzmax, T threshold)
{
    //std::cout << "Entries in zw\n";
    //for( auto idx : iz_zw)
    //    std::cout << "[ "<<idx << " "<<zw[idx]<<"]\n";

    // Take zw and write it into z modulo the drop rules
    std::vector<std::pair<double, int>> pairs;
    std::vector<std::pair<int, double>> accept;
    // 1. Always take the diagonal element
    accept.push_back( {i, zw[i]});
    for( auto idx : iz_zw)
        if( idx != i) //we already have diagonal
            pairs.push_back( { zw[idx], idx});
    //std::cout << "Pairs \n";
    //for( auto pair : pairs)
    //    std::cout << pair.first << " "<<pair.second<<std::endl;
    // sort by magnitude, largest first
    std::sort( pairs.begin(), pairs.end(), []( const auto& lhs, const auto& rhs){
        return fabs( lhs.first) > fabs( rhs.first);});
    //std::cout << "Pairs after sort\n";
    // 2. Take nnzmax-1 largest values of zw: sort zw by size
    // but 3. only if entry is greater than threshold
    for( int k=0; k<(int)nnzmax-1; k++)
    {
        if( k < (int)pairs.size() && fabs(pairs[k].first) > threshold)
        {
            //std::cout << pairs[k].first << " "<<pairs[k].second<<std::endl;
            accept.push_back({pairs[k].second, pairs[k].first});
        }
    }
    // sort by index
    std::sort( accept.begin(), accept.end());
    //std::cout << "Accepted entries in zw\n";
    //for( auto pair : accept)
    //    std::cout << "[ "<<pair.first << " "<<pair.second<<"]\n";

    //write into matrix
    row_offsets.push_back(row_offsets[i]);
    for( auto pair : accept)
    {
        //std::cout<< "Entry "<<pair.first<<" "<<pair.second<<"\n";
        column_indices.push_back( pair.first);
        values.push_back( pair.second);
        row_offsets[i+1]++;
    }
}
} //namespace detail

///@brief Left looking sparse inverse preconditioner for self-adjoint positive definite matrices
template<class T>
void sainv_precond(
    const cusp::csr_matrix<int, T, cusp::host_memory>& a,
    cusp::csr_matrix<int, T, cusp::host_memory>& s,
    thrust::host_vector<T>& d,
    const thrust::host_vector<T>& weights,
    unsigned nnzmax,
    T threshold)
{
    unsigned n = a.num_rows;
    //assert( a.num_rows == a.num_cols);

    d.resize( n, 0.);

    // Init z_0 = e_0 and d_0 = w_0 a_{00}
    for( int j = a.row_offsets[0]; j<a.row_offsets[1]; j++)
    {
        if( a.column_indices[j] == 0)
            d[0] = a.values[j]*weights[0];
    }
    if( fabs( d[0] ) < threshold)
        d[0] = threshold;
    //std::cout << "first diagonal "<<d[0]<<"\n";
    // row_offsets, column_indices, values build the output matrix s in CSR format
    cusp::array1d<int, cusp::host_memory> row_offsets, column_indices;
    cusp::array1d<T, cusp::host_memory> values;

    // first row of s is z_0 = e_0
    row_offsets.push_back(0);
    row_offsets.push_back(1);
    column_indices.push_back( 0);
    values.push_back( 1.0);

    // Main loop
    for( int i = 1; i<(int)n; i++)
    {
        thrust::host_vector<T> zw( n, 0.);
        std::vector<int> iz_zw; // flags nonzeros in zw
        //zw = e_i
        zw[i] = 1.0;
        iz_zw.push_back(i);
        std::vector<int> js; // row indices j < i whose dot product with zw may be nonzero
        // get column indices of row i that are smaller than i
        for( int k = a.row_offsets[i]; k<a.row_offsets[i+1]; k++)
        {
            if( a.column_indices[k] < i )
                js.push_back( a.column_indices[k]);
        }
        //std::cout << "Loop i = "<<i<<"\n";
        //std::cout<< "js\n";
        //for( auto idx : js)
        //    std::cout << idx << " \n";
        while( !js.empty())
        {
            auto it = std::min_element( js.begin(), js.end());
            int j = *it; // j < i in all cases
            js.erase( it);
            // weighted dot product w_j (A_j . zw), stored temporarily in d[i]
            d[i] = 0.0;
            for( int k = a.row_offsets[j]; k<a.row_offsets[j+1]; k++)
            {
                //std::cout << "Multiply k " << k<<" "<<a.column_indices[k]<<" "<< a.values[k]<<" j = "<< j << " weights "<<weights[j]<<" zw "<<zw[a.column_indices[k]]<<"\n";
                d[i] += weights[j]*a.values[k]*zw[ a.column_indices[k]];
            }
            //std::cout << "d[i] "<<d[i]<<"\n";
            T alpha = d[i]/d[j];
            //std::cout << "alpha ij "<< i <<" "<<j<<" "<<alpha<<"\n";
            if( fabs( alpha) > threshold)
            {
                // zw -= alpha * z_j (row j of the factor built so far)
                for( int k = row_offsets[j]; k<row_offsets[j+1]; k++)
                {
                    int zkk = column_indices[k];
                    //std::cout << "col = "<<zkk<<std::endl;
                    zw[ zkk] -= alpha * values[k];
                    // flag a new nonzero in zw if necessary
                    if (std::find(iz_zw.begin(), iz_zw.end(), zkk) == iz_zw.end()) {
                        iz_zw.push_back( zkk);
                    }
                    //std::cout << "col = "<<zkk<<std::endl;
                    // add column indices to set of dot products to compute
                    for( int l = a.row_offsets[zkk]; l < a.row_offsets[zkk+1]; l++)
                    {
                        //std::cout << "l = "<<l<<" "<<a.row_offsets[zkk]<< " "<<a.row_offsets[zkk+1]<<std::endl;
                        int col = a.column_indices[l];
                        if ( (std::find(js.begin(), js.end(), col) == js.end()) && (j<col) && (col < i) ) {
                            js.push_back( col);
                        }
                    }
                    //std::cout << "col = "<<zkk<<std::endl;
                }
            }
        }
        d[i] = 0.0;
        for( int k = a.row_offsets[i]; k<a.row_offsets[i+1]; k++)
            d[i] += a.values[k]*zw[ a.column_indices[k]]*weights[i];
        if( fabs(d[i]) < threshold)
            d[i] = threshold;
        //std::cout << "d[i] "<<d[i]<<"\n";
        //std::cout << "zw \n";
        //for(unsigned k=0; k<zw.size(); k++)
        //    std::cout << zw[k]<<"\n";
        // Apply drop rule to zw:
        detail::sparsify( row_offsets, column_indices, values, i, zw, iz_zw, nnzmax, threshold);
    }
    s.resize( n, n, values.size());
    s.column_indices = column_indices;
    s.row_offsets = row_offsets;
    s.values = values;
}
} //namespace create

} //namespace dg
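
Usage sketch (not part of precond.h): the following illustrative program assembles a small self-adjoint positive definite tridiagonal matrix in CSR format, calls dg::create::sainv_precond with unit weights, and prints the resulting pivots d. The matrix, the parameter choices nnzmax = 3 and threshold = 1e-10, and the assumption that the function is reachable through the dg/algorithm.h umbrella header (as suggested at the top of this page) are illustrative, not prescribed by the library.

#include <iostream>
#include "dg/algorithm.h" // assumed umbrella header providing dg::create::sainv_precond

int main()
{
    const unsigned n = 5;
    // 1d Laplacian-like matrix: 2 on the diagonal, -1 on the off-diagonals
    cusp::csr_matrix<int, double, cusp::host_memory> a( n, n, 3*n-2);
    unsigned q = 0;
    a.row_offsets[0] = 0;
    for( unsigned i=0; i<n; i++)
    {
        if( i > 0)   { a.column_indices[q] = i-1; a.values[q] = -1.; q++; }
        a.column_indices[q] = i; a.values[q] = 2.; q++;
        if( i < n-1) { a.column_indices[q] = i+1; a.values[q] = -1.; q++; }
        a.row_offsets[i+1] = q;
    }
    thrust::host_vector<double> weights( n, 1.), d;
    cusp::csr_matrix<int, double, cusp::host_memory> s;
    // keep at most 3 entries per row, drop entries below 1e-10 (illustrative values)
    dg::create::sainv_precond( a, s, d, weights, 3, 1e-10);
    // s now holds the sparsified triangular factor, d the approximate pivots
    for( unsigned i=0; i<n; i++)
        std::cout << "d["<<i<<"] = "<<d[i]<<"\n";
    return 0;
}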