KASKADE 7 development version
assemblerCore.hh
/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */
/*                                                                           */
/*  This file is part of the library KASKADE 7                               */
/*    https://www.zib.de/research/projects/kaskade7-finite-element-toolbox   */
/*                                                                           */
/*  Copyright (C) 2002-2024 Zuse Institute Berlin                            */
/*                                                                           */
/*  KASKADE 7 is distributed under the terms of the ZIB Academic License.    */
/*    see $KASKADE/academic.txt                                              */
/*                                                                           */
/* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * */

#ifndef ASSEMBLERCORE_HH
#define ASSEMBLERCORE_HH

#include <iostream>
#include <numeric>
#include <memory>
#include <mutex>
#include <tuple>
#include <new>
#include <type_traits>

#include <boost/version.hpp>
#include <boost/mpl/accumulate.hpp>
#include <boost/mpl/bool.hpp>
#include <boost/mpl/if.hpp>
#include <boost/timer/timer.hpp>

#include <boost/exception/diagnostic_information.hpp>
#include <boost/fusion/algorithm.hpp>
#include <boost/fusion/sequence.hpp>
#include <boost/fusion/include/find_if.hpp>

#include "dune/common/config.h"

#include "dune/common/fvector.hh"
#include "dune/common/fmatrix.hh"
#include "dune/geometry/type.hh"
#include "dune/grid/common/capabilities.hh"
#include "dune/istl/bcrsmatrix.hh"
#include "dune/istl/bdmatrix.hh"

#include "fem/firstless.hh"
#include "fem/fixfusion.hh"
#include "fem/functional_aux.hh"
#include "fem/gridmanager.hh"
#include "fem/quadrature.hh"
#include "fem/variables.hh"


#include "utilities/timing.hh"

61// this is omitted in boost/fusion/sequence/container/vector/detail/vector_n.hpp
62#undef N
63
namespace Kaskade
{

  static int const timerStatistics = 0x1;      // gather global execution time statistics
  static int const scatterStatistics = 0x2;
  static int const lockStatistics = 0x4;
  static int const localTimerStatistics = 0x0; // gather local (per element) time statistics

  static int const statistics = 0;

  //---------------------------------------------------------------------

  namespace AssemblyDetail {

    using namespace boost::fusion;


    class RowGroupManager
    {
    public:
      RowGroupManager();

      virtual ~RowGroupManager();

      // Noncopyable since we contain mutexes.
      RowGroupManager(RowGroupManager const& m) = delete;
      RowGroupManager& operator=(RowGroupManager const& m) = delete;

      void init(int nrg, size_t rows);

      void init(int nrg, std::vector<std::vector<size_t>> const& colIndex);

      void init(int nrg, std::vector<size_t> const& weight);

      std::pair<size_t,size_t> range(int n) const;

      std::mutex& mutex(int n) const;

      int size() const;


    private:
      // start indices of row groups
      std::vector<size_t> rowGroupStart;

      // Support for simultaneous write access to different row groups.
      std::mutex* mutexes;

      // deletes the mutexes
      void clear();
    };
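
    /* Usage sketch (illustrative, not part of this header; all names below are
       assumptions): a RowGroupManager partitions the rows [0,nRows) into groups
       that can be locked independently, so several threads can scatter into
       disjoint row ranges concurrently.

         RowGroupManager rowGroups;
         rowGroups.init(4,nRows);                   // 4 row groups of roughly equal size
         for (int g=0; g<rowGroups.size(); ++g)
         {
           auto [first,last] = rowGroups.range(g);  // half-open row range of group g
           std::lock_guard<std::mutex> lock(rowGroups.mutex(g));
           // ... scatter local contributions into global rows [first,last) ...
         }
    */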

    // ----------------------------------------------------------------------------------------------------

    template <class Policy, class RowVar, class ColVar, class SparseIdx>
    struct MatrixBlock
    {
      static int const rowId = RowVar::id;
      static int const colId = ColVar::id;
      static int const rowSpaceIndex = RowVar::spaceIndex;
      static int const colSpaceIndex = ColVar::spaceIndex;
      static bool const symmetric = Policy::template BlockInfo<rowId,colId>::symmetric;
      static bool const mirror = Policy::template BlockInfo<rowId,colId>::mirror;
      static bool const lumped = Policy::template BlockInfo<rowId,colId>::lumped;
      static bool const makePositive = Policy::template BlockInfo<rowId,colId>::makePositive;

      using SparseIndex = SparseIdx;
      typedef MatrixBlock<Policy,RowVar,ColVar,SparseIndex> Self;
      typedef typename Policy::Scalar Scalar;
      typedef typename Policy::Spaces Spaces;
      typedef Dune::FieldMatrix<Scalar,RowVar::m,ColVar::m> BlockType; // entry type of the sparse matrix
      typedef NumaBCRSMatrix<BlockType, SparseIndex> Matrix;

      typedef typename SpaceType<Spaces,RowVar::spaceIndex>::type RowSpace;
      typedef typename SpaceType<Spaces,ColVar::spaceIndex>::type ColSpace;
      typedef typename RowSpace::GridView GridView;
      typedef typename GridView::template Codim<0>::Iterator CellIterator;

      static int const dim = ColSpace::dim;

      MatrixBlock() {}

      MatrixBlock(MatrixBlock const& mb)
      : matrix(new Matrix(*mb.matrix))
      , isDense(mb.isDense)
      {}

      MatrixBlock& operator=(MatrixBlock const& mb)
      {
        *matrix = *mb.matrix;
        isDense = mb.isDense;
        return *this;
      }

      MatrixBlock& operator=(Scalar x)
      {
        assert(matrix.get());
        *matrix = x;
        return *this;
      }

      MatrixBlock& operator+=(MatrixBlock const& mb)
      {
        *matrix += *mb.matrix;
        return *this;
      }


      Matrix& globalMatrix()
      {
        assert(matrix.get());
        return *matrix;
      }

      Matrix const& globalMatrix() const
      {
        assert(matrix.get());
        return *matrix;
      }

      std::shared_ptr<Matrix const> globalMatrixPointer() const { return matrix; }


      template <class FaceOracle>
      void init(Spaces const& spaces, CellIterator first, CellIterator last,
                FaceOracle const& considerFace)
      {
        RowSpace const& rowSpace = *at_c<RowVar::spaceIndex>(spaces);
        ColSpace const& colSpace = *at_c<ColVar::spaceIndex>(spaces);

        // @todo: respect *dynamic* presence flag. static one is respected
        // on construction of sequence of matrix blocks. Respect symmetric flag.
        if (!Policy::template BlockInfo<rowId,colId>::present)
        {
          assert("Aieee! Nonpresent matrix block detected!\n"==0);
          abort();
        }

        boost::timer::cpu_timer timer;

        size_t nnz = 0;
        size_t const rows = rowSpace.degreesOfFreedom();
        size_t const cols = colSpace.degreesOfFreedom();

        // If mass lumping is desired, we just create a diagonal matrix.
        // Otherwise, we need to establish the connectivity pattern of
        // the ansatz functions.
        if (Policy::template BlockInfo<rowId,colId>::lumped)
        {
          assert(RowVar::spaceIndex==ColVar::spaceIndex && rows==cols);
          NumaCRSPatternCreator<SparseIndex> creator(rows,cols,false,1);
          for (size_t i=0; i<rows; ++i)
            creator.addElements(&i,&i+1,&i,&i+1);
          matrix.reset(new Matrix(creator)); // zero init
          nnz = rows;
        }
        else
        {
          // In case of global support of shape functions of one of the involved spaces (usually ConstantSpace),
          // the resulting matrix is dense. Use a shortcut to define the sparsity structure.
          bool const dense = RowSpace::Mapper::globalSupport || ColSpace::Mapper::globalSupport;


          // Allocate sparse matrix and define the sparsity structure. Estimate the required number of entries per row
          // for efficient preallocation.
          // Ws 2016-01-22: Zero nnz init is actually faster on P1 pattern, probably because otherwise the
          // chunks put a high burden on the memory system by requesting memory at the same time. This appears
          // to parallelize quite badly and hence is turned off in parallel mode.
          int preallocateEntriesPerRow = 0;
          if (NumaThreadPool::instance().nodes()==1) // sequential allocation in NumaCRSPatternCreator
          {
            int localSize = colSpace.mapper().globalIndices(0).size(); // # entries per row of local matrices (rough estimate)
            preallocateEntriesPerRow = dense? 0:            // for dense matrices we'll use a specialized version
                                       dim<=1? 2*localSize: // make room for (roughly) all elemental matrices appended...
                                       dim==2? 8*localSize: // ... this is overprovisioning, but faster due to less ...
                                               20*localSize; // ... allocations and data movement.
          }
          NumaCRSPatternCreator<SparseIndex> creator(rows,cols,symmetric,preallocateEntriesPerRow);

          if (statistics & timerStatistics)
            std::cout << "initial creator construction (" << rowId << "," << colId << "): " << timer.format();
          timer.start();


          if (dense)
          {
            creator.addAllElements();
            if (statistics & timerStatistics)
              std::cout << "entering indices for (" << rowId << "," << colId << "): " << timer.format();
            timer.start();
          }
          else
          {
            // Traditional local FE spaces - that's the hard case. We have to traverse the grid and pick up all
            // interactions of (local) basis functions.

            // Iteration over all cells. Note that the grid views of row and
            // column spaces need not cover the whole grid (e.g., in case of
            // local support). It would be best to iterate over the grid
            // view with smaller support, but for simplicity we choose the
            // row space.

            size_t const nCells = rowSpace.indexSet().size(0);

            std::vector<typename RowSpace::Mapper::GlobalIndexRange> rIndices(nCells,rowSpace.mapper().initGlobalIndexRange());
            std::vector<typename ColSpace::Mapper::GlobalIndexRange> cIndices(nCells,colSpace.mapper().initGlobalIndexRange());
            for (size_t i=0; i<nCells; ++i)
            {
              rIndices[i] = rowSpace.mapper().globalIndices(i);
              cIndices[i] = colSpace.mapper().globalIndices(i);
            }
            if (statistics & timerStatistics)
              std::cout << "gathering indices for (" << rowId << "," << colId << "): " << timer.format();
            timer.start();

            creator.addElements(rIndices,cIndices); // enter all entries in one go

            // We may need to assemble integrals on inner faces - then there are matrix entries coupling degrees of freedom
            // associated to different cells (e.g., in discontinuous Galerkin methods). Add these entries, too.
            if(Policy::considerInnerFaces)
            {
              GridView const& gridView = rowSpace.gridView();

              for (CellIterator ci=first; ci!=last; ++ci)
              {
                auto const& rIndices = rowSpace.mapper().globalIndices(*ci);

                for (auto const& face: intersections(gridView,*ci))
                {
                  // only true inner faces are considered, and only if requested
                  if (face.boundary() || !face.neighbor() || considerFace(face)==false)
                    continue;

                  auto const& cIndices = colSpace.mapper().globalIndices(face.outside());

                  creator.addElements(begin(rIndices),end(rIndices),
                                      begin(cIndices),end(cIndices));
                } // end iteration over faces
              }   // end iteration over cells
            }     // end Policy::considerInnerFaces

            if (statistics & timerStatistics)
              std::cout << "entering indices for (" << rowId << "," << colId << "): " << timer.format();
            timer.start();

            creator.balance();
            if (statistics & timerStatistics)
              std::cout << "balancing for (" << rowId << "," << colId << "): " << timer.format();
            timer.start();
          }

          // Now that the pattern creator is filled, create pattern and matrix.

          // Count number of nonzeros.
          nnz = creator.nonzeroes();

          // Create the matrix (zero initialization of entries).
          matrix.reset(new Matrix(creator));
          if (statistics & timerStatistics)
            std::cout << "creating pattern & matrix for (" << rowId << "," << colId << "): " << timer.format();
          timer.start();
        }

        // Check density (nnz > rows*cols/2). Be careful not to get
        // overflow for very large and sparse matrices, hence the rearranged test!
        if (std::min(rows,cols)>0)
          isDense = nnz/std::min(rows,cols) > std::max(rows,cols)/2;
        else
          isDense = false; // well, empty matrices are as sparse as one can hope for ;)

        if (statistics & timerStatistics)
          std::cout << "init cleanup for (" << rowId << "," << colId << "): " << timer.format() << "\n";
      }

      // Returns true if the matrix is essentially dense (more than 50% nonzeros).
      bool dense() const { return isDense; }

    private:
      std::shared_ptr<Matrix> matrix;
      bool isDense;
    };
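
    /* Worked example for the overflow-safe density check in init() above (a
       sketch with made-up numbers): for rows = cols = 2'000'000 and
       nnz = 10'000'000, the naive test nnz > rows*cols/2 would form the product
       4e12, which overflows 32-bit index types. The rearranged test compares
       nnz/min(rows,cols) = 5 against max(rows,cols)/2 = 1'000'000 and correctly
       classifies the matrix as sparse (up to integer rounding).

         size_t rows = 2000000, cols = 2000000, nnz = 10000000;
         bool isDense = nnz/std::min(rows,cols) > std::max(rows,cols)/2;  // false
    */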

    // ---------------------------------------------------------------------------------------

    // a boost::fusion predicate telling us whether the current matrix block has the given row and column indices.
    template <int row, int col>
    struct IsBlock
    {
      template <class MatrixBlock>
      struct apply
      {
        using type = std::conditional_t<MatrixBlock::rowId==row && MatrixBlock::colId==col,boost::mpl::true_,boost::mpl::false_>;
      };
    };
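
    /* Usage sketch (an assumption, showing the intended use of the predicate):
       locating the matrix block with given row and column ids in a fusion
       sequence of MatrixBlocks; 'blocks' is a hypothetical BlockArray instance.

         auto it = boost::fusion::find_if<IsBlock<0,0>>(blocks); // iterator to block (0,0)
         auto& A  = boost::fusion::deref(it).globalMatrix();
    */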

    // ---------------------------------------------------------------------------------------

    template <class Policy, class AnsatzVariables, class TestVariables, class SparseIndex>
    class BlockArray
    {
      // Retain only those blocks which are present in the functional
      struct PresenceFilter
      {
        template <class Block>
        struct apply
        {
          typedef boost::mpl::bool_<Policy::template BlockInfo<Block::rowId,Block::colId>::present> type;
        };
      };

      static auto create(AnsatzVariables a, TestVariables t)
      {
        auto joiner = [=](auto blocks, auto rowVar)
        {
          using RowVar = decltype(rowVar);
          auto thisRow = transform(a,[](auto avar){ return MatrixBlock<Policy,RowVar,decltype(avar),SparseIndex>(); });
          return join(blocks,thisRow);
        };
        auto allBlocks = accumulate(t,vector<>(),joiner);
        return as_vector(filter_if<PresenceFilter>(allBlocks));
      }

    public:
      typedef decltype(create(AnsatzVariables(),TestVariables())) type;
    };

498
499 //---------------------------------------------------------------------
500
504 template <class Policy, class RV>
505 struct RhsBlock
506 {
507 typedef typename std::remove_reference<RV>::type RowVar;
508
509 static int const rowId = RowVar::id;
510
511 typedef typename Policy::Scalar Scalar;
512 typedef typename Policy::Spaces Spaces;
513 typedef Dune::FieldVector<Scalar,RowVar::m> BlockType;
514 typedef typename Dune::BlockVector<BlockType> Rhs;
515 typedef RhsBlock<Policy,RowVar> Self;
516
517 static int const rowSpaceIndex = RowVar::spaceIndex;
518 typedef typename SpaceType<Spaces,RowVar::spaceIndex>::type RowSpace;
519 typedef typename RowSpace::GridView::template Codim<0>::Iterator CellIterator;
520
521
525 void init(Spaces const& spaces, CellIterator /*first*/, CellIterator /*last*/, int nrg)
526 {
527 RowSpace const& rowSpace = *at_c<RowVar::spaceIndex>(spaces);
528 size_t rows = rowSpace.degreesOfFreedom();
529
530 rowGroupManager = std::make_unique<RowGroupManager>();
531 rowGroupManager->init(nrg,rows);
532 }
533
534 RowGroupManager& rowGroup() { return *rowGroupManager; }
535
536 // A class storing a local element rhs vector and the corresponding indices
537 struct LocalVector
538 {
539 // just because the ranges are not default constructible
540 LocalVector(): ridx(RowSpace::Mapper::initSortedIndexRange()) {}
541
542 std::vector<BlockType> vector;
543
544 typedef typename RowSpace::Mapper::SortedIndexRange SortedRowIdx;
545
549 SortedRowIdx ridx;
550 };
551
552 // A structure for holding a sequence of several local vectors to be filled sequentially
553 // and to be scattered together.
554 struct LocalVectors
555 {
556 typedef Self RhsBlock;
557 typedef std::vector<BlockType> LocalVectorType;
558
559 LocalVectors(int n, RhsBlock& rb_): localVectors(n), currentLocalVector(0), rb(&rb_) {}
560
561 // Storage for local rhs vectors.
562 std::vector<LocalVector> localVectors;
563
564 // Which is the current local vector to be filled?
565 int currentLocalVector;
566
567 // Pointing back to its rhs block
568 RhsBlock* rb;
569 };
570
571 private:
572 std::unique_ptr<RowGroupManager> rowGroupManager;
573 };
574
    template <class Policy, class TestVariables>
    class RhsBlockArray
    {
      // Define a mapping from Variable to RhsBlock for Variable as row variable.
      // Retain only those blocks which are present in the functional
      struct PresenceFilter
      {
        template <class Block>
        struct apply
        {
          typedef boost::mpl::bool_<Policy::template RhsBlockInfo<Block::rowId>::present> type;
        };
      };

      static auto create(TestVariables t)
      {
        auto allBlocks = transform(t,[](auto tvar) { return RhsBlock<Policy,decltype(tvar)>(); });
        return as_vector(filter_if<PresenceFilter>(allBlocks));
      }

    public:
      typedef decltype(create(TestVariables())) type;
    };

    //---------------------------------------------------------------------

    template <class Policy>
    struct RhsLocalData
    {
      RhsLocalData(int n_): n(n_) {}

      template <class RhsBlock>
      typename RhsBlock::LocalVectors operator()(RhsBlock const& rb) const
      {
        // Since boost::fusion::transform provides only const references to the source sequence
        // elements, we need a const cast here :(
        return typename RhsBlock::LocalVectors(n,removeConst(rb));
      }

    private:
      int n;
    };

    struct MatrixLocalData
    {
      MatrixLocalData(size_t s_)
      : s(s_) {}

      template <class MatrixBlock>
      auto operator()(MatrixBlock const& mb) const
      {
        // When switching from boost 1.51 to 1.57, it seems that the filter_view only presents
        // const references to the elements (why?), but we need non-const ones. Taking a non-const
        // reference as argument leads to failure of overload resolution, omitting this
        // functor, and ultimately to an error. As a workaround, we take a const reference and cast
        // the constness away.
        return LocalMatrices<typename MatrixBlock::BlockType,
                             MatrixBlock::lumped,
                             typename MatrixBlock::RowSpace::Mapper::SortedIndexRange,
                             typename MatrixBlock::ColSpace::Mapper::SortedIndexRange,
                             MatrixBlock>(removeConst(mb).globalMatrix(),s);
      }

    private:
      size_t s;
    };

    //---------------------------------------------------------------------

    template <class Spaces>
    class GetMaxDerivativeBase
    {
    public:
      GetMaxDerivativeBase(Spaces const& spaces_, std::map<void const*,int>& deriv_): spaces(spaces_), deriv(deriv_) {}

    private:
      Spaces const& spaces;
      std::map<void const*,int>& deriv;

    protected:
      template <int spaceIndex>
      void enterSpace(int d) const
      {
        void const* space = at_c<spaceIndex>(spaces);
        auto i = deriv.find(space);
        if (i==deriv.end())
          deriv[space] = d;
        else
          i->second = std::max(i->second,d);
      }
    };

    template <class Functional, class Spaces>
    class GetMaxDerivativeMatrix: public GetMaxDerivativeBase<Spaces>
    {
    public:
      GetMaxDerivativeMatrix(Spaces const& spaces, std::map<void const*,int>& deriv): GetMaxDerivativeBase<Spaces>(spaces,deriv) {}

      template <class LocalMatrices>
      void operator()(LocalMatrices const&) const
      {
        using MatrixBlock = typename LocalMatrices::InfoType;
        int d = Functional::template D2<MatrixBlock::rowId,MatrixBlock::colId>::derivatives;
        this->template enterSpace<MatrixBlock::rowSpaceIndex>(d);
        this->template enterSpace<MatrixBlock::colSpaceIndex>(d);
      }
    };


    template <class Functional, class Spaces>
    class GetMaxDerivativeRhs: public GetMaxDerivativeBase<Spaces>
    {
    public:
      GetMaxDerivativeRhs(Spaces const& spaces, std::map<void const*,int>& deriv): GetMaxDerivativeBase<Spaces>(spaces,deriv) {}

      template <class RBlock>
      void operator()(RBlock const&) const
      {
        int d = Functional::template D1<RBlock::RhsBlock::rowId>::derivatives;
        this->template enterSpace<RBlock::RhsBlock::rowSpaceIndex>(d);
      }
    };

    template <class Functional, class Spaces, class LocalMatrices, class RBlocks>
    std::map<void const*,int> derivatives(Functional const& f, Spaces const& spaces, LocalMatrices const& localMatrices, RBlocks const& rblocks)
    {
      std::map<void const*,int> deriv; // map from space address to maximum occurring derivative

      for_each(localMatrices,GetMaxDerivativeMatrix<Functional,Spaces>(spaces,deriv));
      for_each(rblocks,GetMaxDerivativeRhs<Functional,Spaces>(spaces,deriv));
      return deriv;
    }
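
    /* Sketch of the result (illustrative): derivatives() maps each space
       address to the highest derivative order any assembled block requests
       from it. For a Laplace-type problem whose D1/D2 declare first
       derivatives, one obtains

         auto deriv = derivatives(f,spaces,localMatrices,localRhs);
         // deriv[spaceAddress] == 1  ->  evaluators of that space must provide gradients
    */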

    //---------------------------------------------------------------------

    template <class Evaluators, class TestVariables>
    struct ClearLocalRhs
    {
      ClearLocalRhs(Evaluators const& evaluators_):
        eval(evaluators_)
      {}

      template <class LocalVectors>
      void operator()(LocalVectors& lv) const
      {
        // Deletes all entries from the vector and inserts the needed number
        // of zero elements. Thus, finite elements with different numbers
        // of shape functions are supported. Memory reallocations
        // rarely occur.
        assert(lv.currentLocalVector < lv.localVectors.size());

        int const rSpaceIdx = result_of::value_at_c<TestVariables,LocalVectors::RhsBlock::rowId>::type::spaceIndex;

        auto& reval = at_c<rSpaceIdx>(eval); // evaluator

        auto& rc = lv.localVectors[lv.currentLocalVector]; // current local vector structure

        // set current local vector to correct size and value 0
        rc.vector.resize(reval.size());
        std::fill(rc.vector.begin(),rc.vector.end(),0);

        // retrieve sorted indices
        rc.ridx = reval.sortedIndices();
      }

      Evaluators const& eval;
    };

    template <class Evaluators, class AnsatzVariableSetDescription, class TestVariableSetDescription>
    struct NewLocalMatrix
    {
      NewLocalMatrix(Evaluators const& reval_, Evaluators const& ceval_)
      : reval(reval_), ceval(ceval_)
      {}

      template <class LocalMatrices>
      void operator()(LocalMatrices& lm) const
      {
        using MatrixBlock = typename LocalMatrices::InfoType;

        int const cSpaceIdx = spaceIndex<AnsatzVariableSetDescription,MatrixBlock::colId>;
        int const rSpaceIdx = spaceIndex<TestVariableSetDescription ,MatrixBlock::rowId>;

        lm.push_back(at_c<rSpaceIdx>(reval).sortedIndices(),at_c<cSpaceIdx>(ceval).sortedIndices());
      }

      Evaluators const& reval;
      Evaluators const& ceval;
    };


    //---------------------------------------------------------------------

    template <class TestVariableSetDescription, class Evaluators, class Real, class Cache>
    struct UpdateLocalRhs
    {
      UpdateLocalRhs(Evaluators const& evaluators_, Real integrationFactor_, Cache const& cache_)
      : evaluators(evaluators_)
      , integrationFactor(integrationFactor_)
      , cache(cache_)
      {}

      template <class LocalVectors>
      void operator()(LocalVectors& lv) const
      {
        typedef typename LocalVectors::RhsBlock RhsBlock;

        int const rSpaceIndex = spaceIndex<TestVariableSetDescription,RhsBlock::rowId>;
        auto& rc = lv.localVectors[lv.currentLocalVector].vector; // current local vector
        size_t const rows = rc.size();
        for (size_t i=0; i<rows; ++i)
        {
          // Check that the cache returns the correct type. The typedefs just serve for
          // creating readable error messages.
          using rhsEntryType = std::remove_reference_t<decltype(rc[i])>;
          using d1ResultType = decltype(cache.template d1<RhsBlock::rowId>(at_c<rSpaceIndex>(evaluators).evalData[i]));
          static_assert(std::is_same<rhsEntryType,d1ResultType>::value,
                        "Types don't match. Check return type of d1() in problem formulation.");

          rc[i] += integrationFactor * cache.template d1<RhsBlock::rowId>(at_c<rSpaceIndex>(evaluators).evalData[i]);
          assert(!std::isnan(rc[i][0])); // check that first entry in rhs vector is valid
        }
      }

      Evaluators const& evaluators;
      Real integrationFactor;
      Cache const& cache;
    };
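
    /* Sketch of the return-type requirement enforced by the static_assert
       above (hedged example; VariationalArg and rhsDensity are illustrative
       assumptions, not names from this library): for a scalar test variable
       (m == 1), d1() in the problem formulation has to return the rhs entry
       type Dune::FieldVector<Scalar,1>, e.g.

         template <int row>
         Dune::FieldVector<double,1> d1(VariationalArg const& arg) const
         {
           return rhsDensity * arg.value;   // matches the entry type of rc[i]
         }
    */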


    template <class AnsatzVariableSetDescription, class TestVariableSetDescription, class Evaluators, class Real, class Cache>
    struct UpdateLocalMatrix
    {
      UpdateLocalMatrix(Evaluators const& evaluators_, Real integrationFactor_, Cache const& cache_):
        evaluators(evaluators_), integrationFactor(integrationFactor_), cache(cache_)
      {}

      template <class LocalMatrices>
      void operator()(LocalMatrices& lm) const
      {
        using MatrixBlock = typename LocalMatrices::InfoType;

        // Get the evaluated ansatz (column) and test (row) functions
        int const rowId = MatrixBlock::rowId;
        int const colId = MatrixBlock::colId;
        int const rSpaceIndex = spaceIndex<TestVariableSetDescription,rowId>;
        int const cSpaceIndex = spaceIndex<AnsatzVariableSetDescription,colId>;
        auto const& rEval = at_c<rSpaceIndex>(evaluators).evalData;
        auto const& cEval = at_c<cSpaceIndex>(evaluators).evalData;

        auto& A = lm.back(); // the current local Galerkin matrix to contribute to

        // retrieve number of localized test and ansatz functions
        int const rows = A.ridx().size();
        int const cols = A.cidx().size();

        // loop over all combinations of localized ansatz and test functions
        for (int i=0; i<rows; ++i)
        {
          int begin = MatrixBlock::lumped? i: 0;
          int end = (MatrixBlock::symmetric||MatrixBlock::lumped)? i+1: cols;
          for (int j=begin; j<end; ++j)
          {
            static_assert(std::is_same<std::remove_reference_t<decltype(A(i,j))>,
                                       decltype(cache.template d2<rowId,colId>(rEval[i],cEval[j]))
                                      >::value, "Types don't match. Check return type of d2() in problem formulation.");
            A(i,j) += integrationFactor * cache.template d2<rowId,colId>(rEval[i], cEval[j]);
            assert(!std::isnan(A(i,j)[0][0])); // check that top left entry is valid
          }
        }
      }

      Evaluators const& evaluators;
      Real integrationFactor;
      Cache const& cache;
    };
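
    /* The loop bounds above in a nutshell (worked sketch): for a symmetric
       3x3 local block only the lower triangle is accumulated, for a lumped
       block only the diagonal.

         for (int i=0; i<3; ++i)
         {
           int begin = lumped? i : 0;
           int end   = (symmetric||lumped)? i+1 : 3;
           for (int j=begin; j<end; ++j)
             ;  // symmetric: visits only j<=i; lumped: visits only j==i
         }
    */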


    // TODO: factor common functionality out of both UpdateLocalMatrix classes
    template <class AnsatzVariableSetDescription, class TestVariableSetDescription,
              class Evaluators, class Real, class Cache>
    struct UpdateLocalMatrixFromInnerBoundaryCache
    {
      UpdateLocalMatrixFromInnerBoundaryCache(Evaluators const& insideEval, Evaluators const& outsideEval,
                                              Real integrationFactor_, Cache const& cache_, bool sameCell_)
      : insideEvaluator(insideEval)
      , outsideEvaluator(outsideEval)
      , integrationFactor(integrationFactor_)
      , cache(cache_)
      , sameCell(sameCell_)
      {}

      template <class LocalMatrices>
      void operator()(LocalMatrices& lm) const
      {
        using MatrixBlock = typename LocalMatrices::InfoType;

        int const rSpaceIndex = spaceIndex<TestVariableSetDescription, MatrixBlock::rowId>;
        int const cSpaceIndex = spaceIndex<AnsatzVariableSetDescription,MatrixBlock::colId>;

        auto& A = lm.localMatrices.back();

        // retrieve number of localized test and ansatz functions
        int const rows = A.ridx().size();
        int const cols = A.cidx().size();

        // loop over all combinations of localized ansatz and test functions
        for (int i=0; i<rows; ++i)
        {
          int begin = MatrixBlock::lumped? i: 0;
          int end = ((MatrixBlock::symmetric && sameCell)||MatrixBlock::lumped)? i+1: cols;
          for (int j=begin; j<end; ++j)
          {
            auto tmp = cache.template d2<MatrixBlock::rowId,MatrixBlock::colId>(
                           at_c<rSpaceIndex>(insideEvaluator).evalData[i],
                           at_c<cSpaceIndex>(outsideEvaluator).evalData[j], sameCell);
            A(i,j) += integrationFactor * tmp;
            assert(!std::isnan(A(i,j)[0][0])); // check that top left entry is valid
          }
        }
      }

      Evaluators const& insideEvaluator, outsideEvaluator;
      Real integrationFactor;
      Cache const& cache;
      bool sameCell;
    };
    //---------------------------------------------------------------------

    template <class GlobalRhs>
    struct ScatterLocalRhs
    {
      ScatterLocalRhs(GlobalRhs& globalRhs_, bool immediate_ = false):
        globalRhs(globalRhs_), immediate(immediate_)
      {}

      template <class LocalVectors>
      void operator()(LocalVectors& lv) const
      {
        auto& gRhs = at_c<LocalVectors::RhsBlock::rowId>(globalRhs.data);

        auto const& rowGroups = lv.rb->rowGroup();

        if (immediate || lv.currentLocalVector+1==lv.localVectors.size())
        {
          int const last = immediate ? lv.currentLocalVector : lv.localVectors.size();

          // step through all row groups and scatter all the included local vectors' components
          for (int rg=0; rg<rowGroups.size(); ++rg)
          {
            // obtain and lock the row group
            auto const [firstRow,lastRow] = rowGroups.range(rg);
            std::lock_guard lock(rowGroups.mutex(rg));

            // step through all local vectors
            for (int i=0; i<last; ++i)
            {
              auto& ri = lv.localVectors[i].vector;
              auto& ridx = lv.localVectors[i].ridx;

              assert(ri.size()==ridx.size());

              for (int r=0; r<ridx.size(); ++r)
              {
                size_t const rGlobalIndex = ridx[r].first;

                // check if this row is inside the row group
                if (firstRow<=rGlobalIndex && rGlobalIndex<lastRow)
                {
                  size_t const rLocalIndex = ridx[r].second;
                  gRhs[rGlobalIndex] += ri[rLocalIndex];
                }
              }
            }
          }

          // everything's scattered - clean up
          lv.currentLocalVector = 0;
        }
        else
          ++lv.currentLocalVector; // prepare next local vector for updating
      }

      GlobalRhs& globalRhs;
      bool immediate;
    };
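
    /* Buffering sketch (names are assumptions): operator() is called once per
       assembled cell. The first n-1 calls merely advance currentLocalVector;
       the n-th call (or immediate==true) locks each row group once and
       scatters all buffered local vectors, amortizing the locking cost over
       n cells.

         ScatterLocalRhs<GlobalRhs> scatter(globalRhs);  // buffered scattering
         for_each(localRhs,scatter);                     // once per cell
         for_each(localRhs,ScatterLocalRhs<GlobalRhs>(globalRhs,true)); // flush the rest
    */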

    //---------------------------------------------------------------------------------------------

    template <class Functional>
    struct SymmetrizeLocalMatrix
    {
      template <class LocalMatrices>
      void operator()(LocalMatrices& lm) const
      {
        using MatrixBlock = typename LocalMatrices::InfoType;

        // If a block is symmetric, only the lower part of the local
        // matrix is filled. Mirror it to the upper part for easy access in
        // the following loop. For lumped (purely diagonal) blocks, of course,
        // nothing needs to be done.
        if constexpr (!MatrixBlock::lumped && MatrixBlock::symmetric)
        {
          auto& m = lm.back();
          int const N = m.ridx().size();
          assert(N==m.cidx().size());

          // copy lower triangular part to upper triangular part, transposing
          // each entry
          for (int i=0; i<N-1; ++i)
            for (int j=i+1; j<N; ++j)
              m(i,j) = transpose(m(j,i));

          // If we are asked to enforce positive semidefiniteness of these local
          // matrices (symmetric and non-lumped), we do this using an eigendecomposition,
          // shifting all nonpositive eigenvalues to zero.
          if constexpr (MatrixBlock::makePositive)
          {
            assert(f);
            constexpr int row = MatrixBlock::rowId;
            constexpr int col = MatrixBlock::colId;

            // First we need to extract the local matrix.
            using Entry = typename MatrixBlock::BlockType;
            DynamicMatrix<Entry> Aloc(N,N);
            for (int j=0; j<N; ++j)
              for (int i=0; i<N; ++i)
                Aloc[i][j] = m(i,j);

            // now we set all negative eigenvalues to zero in the eigendecomposition
            bool changed = makePositiveSemiDefinite(Aloc,f->template makePositiveThreshold<row,col>());

            // now we copy the matrix back
            if (changed)
              for (int j=0; j<N; ++j)
                for (int i=0; i<N; ++i)
                  m(i,j) = Aloc[i][j];
          }
        }
      }

      Functional const* f;
    };
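
    /* Effect of the mirroring above (worked sketch): if for a symmetric block
       only m(1,0) of the off-diagonal entries has been assembled, afterwards

         m(0,1) = transpose(m(1,0));   // entrywise: m(0,1)[a][b] == m(1,0)[b][a]

       holds, so the local matrix is symmetric when read as a flat scalar matrix.
    */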

    //---------------------------------------------------------------------
    //---------------------------------------------------------------------

    template <class Functional>
    struct VariationalFunctionalPolicy
    {
      typedef typename Functional::Scalar Scalar;
      typedef typename Functional::AnsatzVars::Spaces Spaces;
      static constexpr bool considerInnerFaces = hasInnerBoundaryCache<Functional>;

      template <int rowId>
      struct RhsBlockInfo
      {
        static bool const present = Functional::template D1<rowId>::present;
      };


      template <int rowId, int colId>
      struct BlockInfo
      {
        static bool const present = Functional::template D2<rowId,colId>::present && rowId>=colId;
        static bool const symmetric = (rowId==colId || Functional::template D2<rowId,colId>::symmetric)
                                      && (result_of::value_at_c<typename Functional::TestVars::Variables,rowId>::type::spaceIndex
                                          == result_of::value_at_c<typename Functional::AnsatzVars::Variables,colId>::type::spaceIndex);
        static bool const mirror = rowId>colId;
        static bool const lumped = symmetric && Functional::template D2<rowId,colId>::lumped;
        static bool const makePositive = symmetric && Functional::template D2<rowId,colId>::makePositive;
      };

      Scalar functional() const { return fValue; }

      static constexpr bool hasValue = true;

      Scalar fValue;
    };
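
    /* Block layout sketch implied by BlockInfo above (illustrative, two
       variables, all D2 blocks present): for a variational functional only
       the lower block triangle is assembled and stored,

         stored blocks:  (0,0) (1,0) (1,1)
         mirrored:       (0,1) is recovered as the transpose of (1,0)

       which is what the 'present' and 'mirror' flags encode.
    */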

    template <class Functional>
    struct WeakFormulationPolicy
    {
      typedef typename Functional::Scalar Scalar;
      typedef typename Functional::AnsatzVars::Spaces Spaces;
      static constexpr bool considerInnerFaces = hasInnerBoundaryCache<Functional>;

      template <int rowId>
      struct RhsBlockInfo
      {
        static bool const present = Functional::template D1<rowId>::present;
      };


      template <int rowId, int colId>
      struct BlockInfo
      {
        static bool const present = Functional::template D2<rowId,colId>::present;
        static bool const symmetric = Functional::template D2<rowId,colId>::symmetric
                                      && (result_of::value_at_c<typename Functional::TestVars::Variables,rowId>::type::spaceIndex
                                          == result_of::value_at_c<typename Functional::AnsatzVars::Variables,colId>::type::spaceIndex);
        static bool const mirror = false;
        static bool const lumped = symmetric && Functional::template D2<rowId,colId>::lumped;
        static bool const makePositive = symmetric && Functional::template D2<rowId,colId>::makePositive;
      };

    public:
      static constexpr bool hasValue = false;

      Scalar fValue = 0;
    };
1158
1159
1164 template <class Problem>
1165 using FormulationPolicy = std::conditional_t<Problem::type==VariationalFunctional,
1166 VariationalFunctionalPolicy<Problem>,
1167 WeakFormulationPolicy<Problem>>;
1168
1169 // -------------------------------------------------------------------------------------------------------
1170
1175 struct TakeAllBlocks
1176 {
1177 template <int row> struct D1 { static bool const assemble = true; };
1178 template <int row, int col> struct D2 { static bool const assemble = true; };
1179 };
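
    /* A custom block filter in the same shape as TakeAllBlocks (sketch;
       DiagonalBlocks is a made-up name): assemble only the rhs of variable 0
       and the diagonal matrix blocks.

         struct DiagonalBlocks
         {
           template <int row>          struct D1 { static bool const assemble = row==0;   };
           template <int row, int col> struct D2 { static bool const assemble = row==col; };
         };
         // assembler.template assemble<DiagonalBlocks>(f,cellFilter,flags);
    */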

    // Mapping a block filter to an MPL predicate
    template <class BlockFilter>
    struct MatrixBlockFilter
    {
      template <class X>
      struct apply
      {
        typedef boost::mpl::bool_<BlockFilter::template D2<X::rowId,X::colId>::assemble> type;
      };
    };

    template <class> struct Fill;

    template <class Block, bool, bool>
    struct CopyBlock
    {
      template <class OtherBlock>
      static void apply(OtherBlock const&, std::unique_ptr<Block>&, bool, size_t){}
    };

    template <class Scalar, int n, class Allocator, bool symmetric>
    struct CopyBlock<Dune::BCRSMatrix<Dune::FieldMatrix<Scalar,n,n>,Allocator>,symmetric,true>
    {
      typedef Dune::BCRSMatrix<Dune::FieldMatrix<Scalar,n,n>,Allocator> Block;

      static void apply(Block const& from, std::unique_ptr<Block>& to, bool extractOnlyLowerTriangle, size_t nnz)
      {
        // copy
        if(extractOnlyLowerTriangle == symmetric)
        {
          to.reset(new Block(from));
          return;
        }

        // only lower triangle is stored in the assembler -> restore full matrix
        if( (!extractOnlyLowerTriangle && symmetric) || (extractOnlyLowerTriangle && !symmetric) )
        {
          std::vector<std::vector<size_t> > bcrsPattern(from.N());
          for(size_t i=0; i<from.N(); ++i)
            for(size_t j=0; j<=i; ++j)
            {
              if(from.exists(i,j))
              {
                bcrsPattern[i].push_back(j);
                if(i!=j && !extractOnlyLowerTriangle)
                  bcrsPattern[j].push_back(i);
              }
            }
          for(std::vector<size_t>& row : bcrsPattern) std::sort(row.begin(),row.end());

          to.reset(new Block(from.N(),from.M(),nnz,Block::row_wise));

          // init sparsity pattern
          for (typename Block::CreateIterator row=to->createbegin(); row!=to->createend(); ++row)
            for(size_t col : bcrsPattern[row.index()]) row.insert(col);

          // read data
          for(size_t row=0; row<bcrsPattern.size(); ++row)
            for(size_t col : bcrsPattern[row])
            {
              if(row >= col) (*to)[row][col] = from[row][col];
              else if(!extractOnlyLowerTriangle)
              {
                for(size_t i=0; i<n; ++i)
                  for(size_t j=0; j<n; ++j)
                    (*to)[row][col][i][j] = from[col][row][j][i];
              }
            }
        }
      }
    };


    template <class BCRSMat, int rowIndex, int columnIndex>
    struct BlockToBCRS
    {
      explicit BlockToBCRS(std::unique_ptr<BCRSMat>& m, bool extractOnlyLowerTriangle_, size_t nnz_)
      : mat(m), extractOnlyLowerTriangle(extractOnlyLowerTriangle_), nnz(nnz_)
      {}

      template <class MatrixBlock>
      void operator()(MatrixBlock const& mb) const
      {
        CopyBlock<BCRSMat,MatrixBlock::symmetric,MatrixBlock::rowId==rowIndex && MatrixBlock::colId==columnIndex>::apply(mb.globalMatrix(),mat,extractOnlyLowerTriangle,nnz);
      }

    private:
      std::unique_ptr<BCRSMat>& mat;
      bool extractOnlyLowerTriangle;
      size_t nnz;
    };


  } // End of namespace AssemblyDetail

  //---------------------------------------------------------------------
  //---------------------------------------------------------------------

  template <class GridView>
  class CachingBoundaryDetector
  {
    using Cell = Kaskade::Cell<GridView>;

  public:
    CachingBoundaryDetector(GridSignals& signals, GridView const& gridView_) :
      gridView(gridView_), indexSet(gridView.indexSet())
    {
      refConnection = signals.informAboutRefinement.connect(int(GridSignals::allocResources),
                                                            [=](GridSignals::Status when){this->update(when);});
    }

    CachingBoundaryDetector(GridView const& gridView_) :
      gridView(gridView_), indexSet(gridView.indexSet())
    {
    }

    bool hasBoundaryIntersections(Cell const& cell) const
    {
      assert(indexSet.size(0)==boundaryFlag.size()); // check for grid adaptation...
      return boundaryFlag[indexSet.index(cell)];
    }

  private:
    GridView const& gridView;
    typename GridView::IndexSet const& indexSet;
    std::vector<bool> boundaryFlag;
    boost::signals2::scoped_connection refConnection;

    void update(int const status)
    {
      using namespace Dune;

      if (status == GridSignals::AfterRefinement)
      {
        boundaryFlag.resize(indexSet.size(0));
        // TODO: run this loop in parallel (not so easy because of concurrent access to the bool vector...)
        for (auto const& cell: elements(gridView))
          boundaryFlag[indexSet.index(cell)] = cell.hasBoundaryIntersections();
      }
    }
  };

  class ForwardingBoundaryDetector
  {
  public:
    template <class GridView>
    ForwardingBoundaryDetector(GridSignals const&, GridView const&)
    {}

    template <class GridView>
    ForwardingBoundaryDetector(GridView const&)
    {}

    template <class Entity>
    bool hasBoundaryIntersections(Entity const& cell) const
    {
      return cell.hasBoundaryIntersections();
    }
  };

  class TrivialBoundaryDetector
  {
  public:
    template <class GridView>
    TrivialBoundaryDetector(GridSignals const&, GridView const&)
    {}

    template <class GridView>
    TrivialBoundaryDetector(GridView const&)
    {}

    template <class Entity>
    bool hasBoundaryIntersections(Entity const& cell) const
    {
      return true;
    }
  };
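
  /* Choosing a detector (sketch): the boundary detector is the third template
     parameter of the assembler, e.g.

       VariationalFunctionalAssembler<F,size_t,TrivialBoundaryDetector> assembler(spaces);

     CachingBoundaryDetector trades one flag per cell (updated on refinement)
     for fast hasBoundaryIntersections() queries; TrivialBoundaryDetector
     reports true for every cell and thus visits all faces.
  */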


  //---------------------------------------------------------------------

  //---------------------------------------------------------------------
  //---------------------------------------------------------------------

  namespace Assembler
  {
    enum { VALUE=0x1, RHS=0x2, MATRIX=0x4, EVERYTHING=0x7 };
  }
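
  /* Usage sketch: the flags form a bit mask, so partial (re)assembly is
     requested by or-ing them, e.g. recomputing only the functional value and
     the right hand side:

       assembler.assemble(f, Assembler::VALUE|Assembler::RHS);
  */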

  // ----------------------------------------------------------------------------------------------
  // ----------------------------------------------------------------------------------------------

  template <class F,
            class SparseIndex = size_t,
            class BoundaryDetector = CachingBoundaryDetector<typename F::AnsatzVars::GridView>,
            class QuadRule = Dune::QuadratureRule<typename F::AnsatzVars::Grid::ctype,
                                                  F::AnsatzVars::Grid::dimension>>
  class VariationalFunctionalAssembler
  : public AssemblyDetail::FormulationPolicy<F>
  {
  protected:
    typedef typename AssemblyDetail::FormulationPolicy<F> Policy;

  public:
    typedef VariationalFunctionalAssembler<F,SparseIndex,BoundaryDetector,QuadRule> Self;

    typedef F Functional;
    typedef typename Functional::AnsatzVars AnsatzVariableSetDescription;

    typedef typename Functional::TestVars TestVariableSetDescription;

    typedef typename AnsatzVariableSetDescription::Grid Grid;

    typedef typename AnsatzVariableSetDescription::GridView GridView;

    typedef typename AnsatzVariableSetDescription::Spaces Spaces;
    typedef typename AnsatzVariableSetDescription::IndexSet IndexSet;

    typedef typename Functional::Scalar field_type;


  protected:
    typedef typename AnsatzVariableSetDescription::Variables AnsatzVariables;
    typedef typename TestVariableSetDescription::Variables TestVariables;

    static_assert(std::is_same<typename AnsatzVariableSetDescription::Spaces, typename TestVariableSetDescription::Spaces>::value,
                  "VariableSetDescriptions for ansatz spaces and test spaces must provide the same space list.");
    static_assert(Functional::type==WeakFormulation || std::is_same<AnsatzVariableSetDescription,TestVariableSetDescription>::value,
                  "For problem type VariationalFunctional, ansatz and test variables must be the same.");

    // Whether we need to assemble on inner faces.
    constexpr static bool innerBoundaries = hasInnerBoundaryCache<Functional>;

  public:

    using MatrixBlockArray = typename AssemblyDetail::BlockArray<Policy,AnsatzVariables,TestVariables,SparseIndex>::type;

    typedef typename AssemblyDetail::RhsBlockArray<Policy,TestVariables>::type RhsBlockArray;

    typedef typename TestVariableSetDescription::template CoefficientVectorRepresentation<>::type RhsArray;

  private:
    VariationalFunctionalAssembler(GridManagerBase<Grid>& gridManager_, Spaces const& spaces)
    : spaces_(spaces),
      gridManager(gridManager_),
      gv(boost::fusion::at_c<0>(spaces)->gridView()),
      indexSet(gv.indexSet()),
      boundaryDetector(gridManager_.signals,gv),

      rowBlockFactor(2.0),
      localStorageSize(128000) // roughly 128 kB
    {
      static_assert(symmetryCheck<Functional,std::min(AnsatzVariableSetDescription::noOfVariables,
                                                      TestVariableSetDescription::noOfVariables)>,
                    "If a problem is of type VariationalFunctional, the present diagonal blocks need to be marked as symmetric in D2.");

        [this](GridSignals::Status when){this->reactToRefinement(when);});
    }


  public:
    VariationalFunctionalAssembler(Spaces const& spaces)
    : VariationalFunctionalAssembler(boost::fusion::deref(boost::fusion::begin(spaces))->gridManager(),spaces)
    {
    }

    // injected here for backward compatibility and convenience. TODO: Remove in the long run?
    static unsigned int const VALUE = Assembler::VALUE;
    static unsigned int const RHS = Assembler::RHS;
    static unsigned int const MATRIX = Assembler::MATRIX;
    static unsigned int const EVERYTHING = Assembler::EVERYTHING;

    Self& setNSimultaneousBlocks(int n)
    {
      nSimultaneousBlocks = n;
      return *this;
    }

    Self& setRowBlockFactor(double a)
    {
      rowBlockFactor = a;
      return *this;
    }

    Self& setLocalStorageSize(size_t s)
    {
      localStorageSize = s;
      return *this;
    }

    Self& setGatherTimings(bool gt)
    {
      gatherTimings = gt;
      return *this;
    }

    void assemble(F const& f, unsigned int flags=Assembler::EVERYTHING, int nThreads=0, bool verbose=false)
    {
      if (flags)
        assemble<AssemblyDetail::TakeAllBlocks>(f,[](auto const& cell) { return true; },
                                                flags,nThreads,verbose);
    }
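
    /* Call sketch for the block/cell filter overload below (material() is a
       made-up predicate): restrict assembly of the matrix to a subdomain
       while taking all blocks.

         assembler.template assemble<AssemblyDetail::TakeAllBlocks>(
             f,
             [&](auto const& cell) { return material(cell)==1; },  // cell filter
             Assembler::MATRIX, 4);                                // 4 parallel tasks
    */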

  protected:
    // Define iterator and entity type for stepping through all cells of the grid.
    typedef typename GridView::template Codim<0>::Iterator CellIterator;
    typedef typename CellIterator::Entity Entity;


  public:

    template <class BlockFilter, class CellFilter>
    void assemble(F const& f, CellFilter const& cellFilter, unsigned int flags=Assembler::EVERYTHING, int nTasks=0, bool verbose=false)
    {
      using namespace Dune;
      using namespace boost::fusion;
      using namespace AssemblyDetail;

      auto& timings = Timings::instance();
      ScopedTimingSection assemblyTiming("assembly",gatherTimings);

      if (gatherTimings) timings.start("get cell ranges");
      auto const& cellRanges = gridManager.cellRanges(gv);
      if (gatherTimings) timings.stop("get cell ranges");

      // Choose the number of tasks
      if (nTasks < 1)
        nTasks = NumaThreadPool::instance().cpus();

      {
        if (verbose)
          std::cout << "Grid is not thread safe. Reducing number of used threads to 1." << std::endl;
        nTasks = 1;
      }
      else
        if(verbose) std::cout << "#tasks:" << nTasks << " " << std::endl;
      assert(nTasks>=1);

      nTasks = std::min(nTasks,cellRanges.maxRanges());

      if (gatherTimings) timings.start("creating rhs/matrix data structures");
      // set entries to zero
      auto clearGlobalData = [](auto& x) { x = 0; };

      if (flags & RHS)
        for_each(getRhs().first.data,clearGlobalData);

      if (flags & MATRIX)
      {
        typedef filter_view<MatrixBlockArray,MatrixBlockFilter<BlockFilter>> MatrixBlockFilter;
        for_each(MatrixBlockFilter(getMatrix(f)),clearGlobalData);
      }
      if (gatherTimings) timings.stop("creating rhs/matrix data structures");

      // If there is only one task, things are somewhat simpler and more efficient...
      if (nTasks == 1)
      {
        ScopedTimingSection seqAssemblyTiming("perform sequential assembly",gatherTimings);
        Scalar retval =
          assembleCellRange<BlockFilter>(f,cellFilter,flags,gv.template begin<0>(),gv.template end<0>(),0);
        if (flags & VALUE)
          this->fValue = retval;
      }
      else
      {
        ScopedTimingSection parAssTime("perform parallel assembly",gatherTimings);
        // Partition the cells into ranges of almost equal size and do the assembly in parallel.
        std::vector<Scalar> values(nTasks,0.0);

        parallelFor([&cellRanges,this,&f,flags,&values,&cellFilter](int i, int n) {
                      auto range = cellRanges.range(n,i);
                      values[i] = this->assembleCellRange<BlockFilter>(f,cellFilter,flags,range.begin(),range.end(),i);
                    },
                    nTasks);

        // At the end, add all the functional values up
        if (flags & VALUE)
          this->fValue = std::accumulate(values.begin(),values.end(),0.0);
      }

      // announce validity of assembled data
      validparts |= flags;
    }

  private:


    template <class BlockFilter, class CellFilter>
    Scalar assembleCellRange(F const& f, CellFilter const& cellFilter,
                             unsigned int flags, CellIterator cell, CellIterator last, int threadNo)
    {
      using namespace Dune;
      using namespace boost::fusion;
      using namespace AssemblyDetail;

      // timer for gathering performance statistics
      boost::timer::cpu_timer scatterTimer, evalTimer, localTimer, setupTimer, totalTimer;
      if (statistics & localTimerStatistics)
      {
        evalTimer.stop();
        scatterTimer.stop();
        localTimer.stop();
      }
      // Obtain global data structures. Note that there is no race condition even if the
      // data is constructed on demand, as the required data structures have been created
      // and initialized before.
      MatrixBlockArray* globalMatrix    = flags & MATRIX? & getMatrix()     : nullptr;
      RhsArray*         globalRhs       = flags & RHS   ? & getRhs().first  : nullptr;
      RhsBlockArray*    globalRhsBlocks = flags & RHS   ? & getRhs().second : nullptr;


      using MatrixBlockFilter = filter_view<MatrixBlockArray,AssemblyDetail::MatrixBlockFilter<BlockFilter>>;

      // Local contribution to global value.
      Scalar fValue = 0;

      int const dim = Grid::dimension;
      typedef typename Grid::ctype CoordType;

      // Allocate local rhs vectors that can be reused on each
      // element. Since all variables may have different element types
      // (i.e. different numbers of components), this has to be one local
      // rhs per variable.
      auto localRhs = as_vector(transform(*globalRhsBlocks,RhsLocalData<Policy>(nSimultaneousBlocks))); // assemble several cells en bloc before scattering

      // We assemble local matrices into a buffer from where they are scattered simultaneously. The buffers
      // scatter automatically when they are full, such that access to previous local matrices is not possible.
      // For DG methods, there are several local matrices that are assembled simultaneously in a particular
      // access pattern, such that we use two buffers. The total buffer size is localStorageSize.
      using LocalMatrices = decltype(as_vector(transform(MatrixBlockFilter(*globalMatrix),MatrixLocalData(0))));
      LocalMatrices localMatrices, localNeighborMatrices;
      if (flags & MATRIX)
      {
        localMatrices = as_vector(transform(MatrixBlockFilter(*globalMatrix),
                                            MatrixLocalData(innerBoundaries? localStorageSize/2: localStorageSize)));
        localNeighborMatrices = as_vector(transform(MatrixBlockFilter(*globalMatrix),
                                                    MatrixLocalData(innerBoundaries? localStorageSize/2: 0)));
      }

      // element-local functional value
      Scalar floc = 0;

      // Shape function cache. Remember that every thread has to use its own cache, thus we create our own here.
      typedef ShapeFunctionCache<Grid,Scalar> SfCache;
      SfCache sfCache;

      // Quadrature rule caches. Remember that every thread has to use its own quadrature caches, thus we create our own here.
      QuadratureTraits<QuadRule> quadratureCache;
      QuadratureTraits<QuadratureRule<CoordType,dim-1>> faceQuadratureCache;

      // Evaluators for shape functions of all FE spaces. Remember that
      // every thread has to use its own collection of evaluators (for both the current cell and neighbouring cells in case
      // we assemble on inner boundaries)!
      auto evaluators = getEvaluators(spaces(),&sfCache,AssemblyDetail::derivatives(f,spaces(),localMatrices,localRhs));
      using Evaluators = decltype(evaluators);
      auto neighbourEvaluators = evaluators;
      // Create the "caches" responsible for evaluating the variational functional / weak formulation.
      // The inner boundary cache need not exist, thus we evaluate it as 0 if not present. The lambda function
      // is a trick to allow using constexpr if.
      auto domainCache = f.createDomainCache(flags);
      auto boundaryCache = f.createBoundaryCache(flags);
      auto innerBoundaryCache = [&](){ if constexpr (innerBoundaries) return f.createInnerBoundaryCache(flags);
                                       else return 0; }();
      // The symmetrizer functor. We pass the functional
      // such that run-time meta information, e.g., on enforcing positive definiteness,
      // can be used.
      SymmetrizeLocalMatrix<Functional> symmetrizeLocalMatrix{&f};

      // Dummy variable sets to be fed to boost::fusion algorithms.
      typename AnsatzVariableSetDescription::Variables ansatzVars;
      typename TestVariableSetDescription::Variables testVars;

      if (statistics & localTimerStatistics)
        setupTimer.stop();

      // Assemble representation: step through all elements, assemble
      // the local matrix and rhs, and scatter their entries into the
      // global data structures.
      if (statistics & localTimerStatistics)
        evalTimer.resume();

      while(cell!=last)
      {
        // If the cell is not of interest, skip it
        if (!cellFilter(*cell))
        {
          ++cell;
          continue;
        }

        // tell the problem on which cell we are
        domainCache.moveTo(*cell);

        // for all spaces involved, compute the shape functions and
        // their global indices, which are needed for evaluating the
        // functional's derivative.
        moveEvaluatorsToCell(evaluators,*cell,indexSet.index(*cell));
        int const shapeFunctionMaxOrder = maxOrder(evaluators);

        if (statistics & localTimerStatistics) localTimer.resume();
        if (statistics & localTimerStatistics) evalTimer.stop();

        // create new local matrices and right hand sides
        floc = 0;
        if (flags & RHS)
          for_each(localRhs,ClearLocalRhs<Evaluators,TestVariables>(evaluators));

        if (flags & MATRIX)
          for_each(localMatrices,NewLocalMatrix<Evaluators,AnsatzVariableSetDescription,
                                                TestVariableSetDescription>(evaluators,evaluators));

        // loop over all quadrature points and integrate the local stiffness matrix and rhs
        int const integrationOrderOnCell = f.integrationOrder(*cell,shapeFunctionMaxOrder,false);
        GeometryType gt = cell->type();

        QuadRule const qr = quadratureCache.rule(gt,integrationOrderOnCell);
        useQuadratureRuleInEvaluators(evaluators,qr,0);

        size_t nQuadPos = qr.size();
        for (size_t g=0; g<nQuadPos; ++g)
        {
          // position of the integration point
          FieldVector<CoordType,dim> const& quadPos = qr[g].position();

          // for all spaces involved, update the evaluators associated to this quadrature point
          moveEvaluatorsToIntegrationPoint(evaluators,quadPos,qr,g,0);

          // prepare evaluation of the functional
          domainCache.evaluateAt(quadPos,evaluators);

          CoordType weightTimesDetJac(cell->geometry().integrationElement(quadPos)); // determinant of the Jacobian
          assert(weightTimesDetJac > 0);
          // weight of the quadrature point
          weightTimesDetJac *= qr[g].weight();

          // step through all local matrix and rhs blocks and update their data
          if constexpr (Self::hasValue)
            if (flags & VALUE)
              floc += weightTimesDetJac*domainCache.d0();
          if (flags & RHS)
            for_each(localRhs,UpdateLocalRhs<TestVariableSetDescription,Evaluators,Scalar,
                                             typename F::DomainCache>(evaluators,weightTimesDetJac,domainCache));
          if (flags & MATRIX)
            for_each(localMatrices,UpdateLocalMatrix<AnsatzVariableSetDescription,TestVariableSetDescription,
                                                     Evaluators,Scalar,typename F::DomainCache>(
                                                       evaluators,weightTimesDetJac,domainCache));
        }


        // Handle Robin (Cauchy) type boundary conditions and interior face terms. Loop over all
        // faces (codim 1) that are exterior boundaries or are relevant due to interior face
        // terms and integrate the contribution. We assume that intersections on the domain
        // boundary always consist of the whole face (codim 1 subentity).
        if(innerBoundaries || boundaryDetector.hasBoundaryIntersections(*cell))
        {
          int const integrationOrderOnFace = f.integrationOrder(*cell,shapeFunctionMaxOrder,true);

          // This would be nice, but since there is no way to obtain an IntersectionIterator from an
          // Intersection, we'd need to pass the Intersection directly to boundaryCache.moveTo()
          // - which would be nicer, but is a breaking change. Consider this for the next major revision.
          //
          // for (auto const& face: intersections(gv,*cell))
          //
          // Instead, we use the old style.
          auto faceEnd = gv.iend(*cell);
          for (auto face=gv.ibegin(*cell); face!=faceEnd; ++face)
          {
            // @warning: make SURE the following does always hold: (i)
            // On boundary faces, there is exactly one intersection, and
            // this covers the whole face. (ii) When an intersection
            // covers the whole codim 1 subentity, its geometry in the
            // cell is the same as specified in the reference
            // element. Currently this is not guaranteed by the Dune
            // interface. Maybe there is a relation to the ominous
            // TwistUtility from Freiburg?

            bool const onBoundary = face->boundary();

            // Assemble only if needed.
            if (innerBoundaries || onBoundary)
            {
              GeometryType gt = face->type();
              QuadratureRule<CoordType,dim-1> const qr = faceQuadratureCache.rule(gt,integrationOrderOnFace);
              size_t const nQuadPos = qr.size();

              // Move the caches to the current face (and the neighbouring evaluators to the adjacent cell).
              if (onBoundary)
                boundaryCache.moveTo(face);
              else if constexpr (innerBoundaries) // the constexpr if just protects the otherwise ill-formed body
              {
                assert(face->neighbor());
                assert(gt == face->geometryInOutside().type());

                // If the problem claims the face is not relevant, skip assembly
                if (! f.considerFace(*face))
                  continue;

                innerBoundaryCache.moveTo(face);
                moveEvaluatorsToCell(neighbourEvaluators,face->outside());

                // for each neighbour (i.e. face), there is one local matrix that is computed by quadrature. Let's
                // create a new local matrix if needed. The row (test variable) is given by the current cell, and the
                // column (ansatz variable) is determined by the neighbour.
                if (flags & MATRIX)
                  for_each(localNeighborMatrices,
                           NewLocalMatrix<Evaluators,AnsatzVariableSetDescription,
                                          TestVariableSetDescription>(evaluators,neighbourEvaluators));
              }
1960
1961
1962 for (size_t g=0; g<nQuadPos; ++g)
1963 {
1964 // Evaluation by quadrature point index cannot be used on faces due to inconsistent numbering
1965 // of quadrature points relative to the cell (see below). Hence we don't need to announce the quadrature
1966 // rule to the evaluators here.
1967 // useQuadratureRuleInEvaluators(evaluators,qr,face->indexInInside());
1968
1969 // position of integration point
1970 Dune::FieldVector<CoordType,dim-1> quadPos = qr[g].position();
1971 CoordType weightTimesDetJac = qr[g].weight() * face->geometry().integrationElement(quadPos);
1972
1973 // evaluate values at integration points for all spaces
1974 // involved, update the evaluators associated to this
1975 // quadrature point
1976 //
1977 // TODO: check whether this call is
1978 // thread-safe. (currently as of 2010-02-11 this is not
1979 // guaranteed by the Dune interface for UG). Copying the
1980 // quadrature position instead of obtaining a const
1981 // reference minimizes the time window for concurrent
1982 // access.
1983 // Note that global() here returns the *cell-local* position.
1984 FieldVector<CoordType,dim> const quadPosInCell = face->geometryInInside().global(quadPos);
1985
1986 // Move evaluators to integration point
1987 // quadrature points on faces are not consistently indexed between adjacent cells (nor necessarily
1988 // placed symmetrically) - hence evaluating shape functions based on the quadrature point index is impossible
1989 // moveEvaluatorsToIntegrationPoint(evaluators,quadPosInCell,qr,g,face->indexInInside());
1990 moveEvaluatorsToIntegrationPoint(evaluators,quadPosInCell);
1991
1992 if (onBoundary) // assemble on domain boundary
1993 {
1994 boundaryCache.evaluateAt(quadPos,evaluators);
1995
1996 // step through all rhs blocks and update their local rhs
1997 if constexpr (Self::hasValue)
1998 if (flags & VALUE)
1999 floc += weightTimesDetJac*boundaryCache.d0();
2000 if (flags & RHS)
2001 for_each(localRhs,UpdateLocalRhs<TestVariableSetDescription,Evaluators,Scalar,
2002 typename F::BoundaryCache>(evaluators,weightTimesDetJac,boundaryCache));
2003 if (flags & MATRIX)
2004 for_each(localMatrices,UpdateLocalMatrix<AnsatzVariableSetDescription,TestVariableSetDescription,
2005 Evaluators,Scalar,typename F::BoundaryCache>(evaluators,weightTimesDetJac,boundaryCache));
2006
2007 } // done boundary faces
2008 else if constexpr (innerBoundaries) // assemble on inner boundary ("constexpr if"
2009 { // only because the body may be ill-formed)
2010 // Move in addition the neighboring evaluators to the correct evaluation point
2011 moveEvaluatorsToIntegrationPoint(neighbourEvaluators,face->geometryInOutside().global(quadPos));
2012
2013 innerBoundaryCache.evaluateAt(quadPos,evaluators,neighbourEvaluators);
2014
2015 // Update value. Remember that each face is visited twice, so we add here only our half.
2016 if constexpr (Self::hasValue)
2017 if (flags & VALUE)
2018 floc += 0.5 * weightTimesDetJac*innerBoundaryCache.d0();
2019
2020 using InnerBoundaryCache = typename Functional::InnerBoundaryCache;
2021
2022 // Step through all rhs blocks and update their local rhs. Remember that even though the face
2023 // is visited twice, these visits correspond to different rows (the row being associated
2024 // with the current center cell).
2025 // Hence we do not sum up the same values twice and have to omit the factor 0.5.
2026 if (flags & RHS)
2027 boost::fusion::for_each(localRhs,UpdateLocalRhs<TestVariableSetDescription,Evaluators,
2028 Scalar,InnerBoundaryCache>
2029 (evaluators,weightTimesDetJac,innerBoundaryCache));
2030
2031 // Update local matrices. As with the rhs, we have to omit the factor 0.5.
2032 if (flags & MATRIX)
2033 {
2034 // update diagonal block, contribution of coupling terms on cell (boolean true)
2035 boost::fusion::for_each(localMatrices,UpdateLocalMatrixFromInnerBoundaryCache<AnsatzVariableSetDescription,
2036 TestVariableSetDescription,Evaluators,Scalar,InnerBoundaryCache>
2037 (evaluators,evaluators,weightTimesDetJac,innerBoundaryCache,true));
2038 // update off-diagonal block, contribution of coupling terms with neighbouring cell (boolean false)
2039 boost::fusion::for_each(localNeighborMatrices,UpdateLocalMatrixFromInnerBoundaryCache<AnsatzVariableSetDescription,
2040 TestVariableSetDescription,Evaluators,Scalar,InnerBoundaryCache>
2041 (evaluators,neighbourEvaluators,weightTimesDetJac,innerBoundaryCache,false));
2042 }
2043 }
2044 }
2045 }
2046 } // done face loop
2047 } // done boundary conditions
2048
2049 // symmetrize local matrix (only the center cell matrices, not the off-diagonal neighbor matrices which are
2050 // not symmetric even for symmetric problems).
2051 if (flags & MATRIX)
2052 for_each(localMatrices,symmetrizeLocalMatrix);
2053
2054 if (statistics & localTimerStatistics) scatterTimer.resume();
2055 if (statistics & localTimerStatistics) localTimer.stop();
2056
2057 // Move to next cell.
2058 ++cell;
2059 // Scatter local data into global data (note that this occurs blockwise, i.e.
2060 // the actual scatter may be delayed). Local matrix buffers scatter automatically.
2061 fValue += floc;
2062 if (flags & RHS)
2063 for_each(localRhs,ScatterLocalRhs<RhsArray>(*globalRhs));
2064
2065 if (statistics & localTimerStatistics) evalTimer.resume(); // count cell iterator increment as well
2066 if (statistics & localTimerStatistics) scatterTimer.stop();
2067 } // end iteration over cells
2068
2069 if (statistics & localTimerStatistics) scatterTimer.resume();
2070 if (statistics & localTimerStatistics) evalTimer.stop();
2071
2072 // scattering of local vectors may not be complete (there may be local data left over in the buffers). Again, local matrices
2073 // scatter automatically on destruction.
2074 if (flags & RHS)
2075 for_each(localRhs,ScatterLocalRhs<RhsArray>(*globalRhs,true));
2076
2077 if (statistics & localTimerStatistics) scatterTimer.stop();
2078
2079 // report statistics
2080 if (statistics & localTimerStatistics)
2081 {
2082 std::cerr << "--------------\nThread " << threadNo << ":\n";
2083 double totalTime = setupTimer.elapsed().wall + evalTimer.elapsed().wall + scatterTimer.elapsed().wall + localTimer.elapsed().wall;
2084 std::cerr.precision(1);
2085 std::cerr.setf(std::ios_base::fixed,std::ios_base::floatfield);
2086 std::cerr << "Total time: " << 100* totalTimer.elapsed().wall / totalTime << "% -- " << totalTimer.format()
2087 << "Setup time: " << 100* setupTimer.elapsed().wall / totalTime << "% -- " << setupTimer.format()
2088 << "Eval times: " << 100* evalTimer.elapsed().wall / totalTime << "% -- " << evalTimer.format()
2089 << "Scatter times: " << 100* scatterTimer.elapsed().wall / totalTime << "% -- " << scatterTimer.format()
2090 << "Local times: " << 100 * localTimer.elapsed().wall / totalTime << "% -- " << localTimer.format();
2091 std::cerr << "--------------\n";
2092 }
2093
2094 return fValue;
2095 }
2096
2097 public:
2102 int valid() { return validparts; }
2103
2109 void flush(int flags=(VALUE|RHS|MATRIX))
2110 {
2111 validparts &= ~flags;  // bitwise complement (not logical not): clear only the flushed parts' validity bits
2112 if (flags & VALUE) this->fValue = 0;
2113 if (flags & RHS)
2114 {
2115 rhss.reset();
2116 rhsBlocks.reset();
2117 }
2118 if (flags & MATRIX) matrixBlocks.reset();
2119 }
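// Usage sketch (illustrative, not part of the header; "assembler" denotes an instance of
// this class, and the flag constants are the VALUE/RHS/MATRIX parts referenced above):
//
//   assembler.flush(Assembler::MATRIX);                   // drop only the assembled matrix
//   assert((assembler.valid() & Assembler::MATRIX) == 0); // matrix part no longer valid
//   assembler.flush();                                    // drop value, rhs, and matrix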
2120
2125 std::pair<size_t,size_t> size(int row, int col) const
2126 {
2127 return std::make_pair(TestVariableSetDescription::degreesOfFreedom(spaces(),row,row+1),
2128 AnsatzVariableSetDescription::degreesOfFreedom(spaces(),col,col+1));
2129 }
2130
2159 template <class Matrix>
2160 Matrix get(bool extractOnlyLowerTriangle=false,
2161 int rbegin=0, int rend=TestVariableSetDescription::noOfVariables,
2162 int cbegin=0, int cend=AnsatzVariableSetDescription::noOfVariables) const
2163 {
2164 // block sizes
2165 auto cSizes = AnsatzVariableSetDescription::variableDimensions(spaces());
2166 auto rSizes = TestVariableSetDescription::variableDimensions(spaces());
2167
2168 // row and column offsets
2169 std::vector<size_t> rowOff(rend-rbegin,0), colOff(cend-cbegin,0);
2170 std::partial_sum(rSizes.begin()+rbegin,rSizes.begin()+rend-1,rowOff.begin()+1);
2171 std::partial_sum(cSizes.begin()+cbegin,cSizes.begin()+cend-1,colOff.begin()+1);
2172
2173 return AssemblyDetail::Fill<Matrix>::apply(getMatrix(), rbegin, cbegin, rowOff, colOff,
2174 extractOnlyLowerTriangle,
2175 nnz(rbegin, rend, cbegin, cend,
2176 extractOnlyLowerTriangle),
2177 nrows(rbegin,rend), ncols(cbegin,cend));
2178 }
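// Usage sketch (illustrative): extracting the assembled blocks into a matrix type for
// which the assembler's fill machinery is specialized, e.g. (assuming the usual triplet
// support) Kaskade's MatrixAsTriplet:
//
//   using Triplet = MatrixAsTriplet<double>;
//   Triplet A = assembler.template get<Triplet>();      // all blocks, full pattern
//   Triplet L = assembler.template get<Triplet>(true);  // only the lower triangle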
2179
2187 template <int row, int col>
2188 auto const& get() const
2189 {
2190 return (*boost::fusion::find_if<AssemblyDetail::IsBlock<row,col>>(getMatrix())).globalMatrix();
2191 }
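// Sketch: read-only access to the raw global matrix of a single block (block indices
// illustrative):
//
//   auto const& A00 = assembler.get<0,0>();   // e.g. a Dune BCRS-type matrix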
2192
2198 template <class MatrixType, class BlockInformation>
2199 MatrixType get(bool extractOnlyLowerTriangle) const
2200 {
2201 using BI = BlockInformation;
2202 return get<MatrixType,BI::firstRow,BI::lastRow,BI::firstCol,BI::lastCol>(extractOnlyLowerTriangle);
2203 }
2204
2212 template <class DataOutIter>
2213 void toSequence(int rbegin, int rend, DataOutIter xi) const
2214 {
2215 // WARNING: this assumes that for_each processes the rhsArray in
2216 // correct order from front to back!
2217 for_each(getRhs().first.data,BlockToSequence<DataOutIter>(rbegin,rend,xi));
2218 }
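// Usage sketch (illustrative): flattening all rhs blocks into one contiguous array of
// scalar coefficients; the total length matches nrows() over the full block range:
//
//   std::vector<field_type> b(assembler.nrows());
//   assembler.toSequence(0, TestVariableSetDescription::noOfVariables, b.begin());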
2219
2220
2234 size_t nnz(size_t rbegin=0, size_t rend=TestVariableSetDescription::noOfVariables,
2235 size_t cbegin=0, size_t cend=AnsatzVariableSetDescription::noOfVariables, bool extractOnlyLowerTriangle=false) const
2236 {
2237 size_t n = 0;
2238 boost::fusion::for_each(getMatrix(),CountNonzeros(n,rbegin,rend,cbegin,cend,extractOnlyLowerTriangle));
2239 return n;
2240 }
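// Sketch: pre-sizing coordinate-format storage before extraction (illustrative):
//
//   size_t const nz = assembler.nnz();   // full block range, full pattern
//   std::vector<size_t> ri, ci;
//   std::vector<field_type> xi;
//   ri.reserve(nz); ci.reserve(nz); xi.reserve(nz);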
2241
2245 size_t nrows(int firstBlock=0, int lastBlock=TestVariableSetDescription::noOfVariables) const
2246 {
2247 return TestVariableSetDescription::degreesOfFreedom(spaces(),firstBlock,lastBlock);
2248 }
2249
2253 size_t ncols(int firstBlock=0, int lastBlock=AnsatzVariableSetDescription::noOfVariables) const
2254 {
2255 return AnsatzVariableSetDescription::degreesOfFreedom(spaces(),firstBlock,lastBlock);
2256 }
2257
2261 Spaces const& spaces() const
2262 {
2263 return spaces_;
2264 }
2265
2269 GridView const& gridView() const
2270 {
2271 return gv;
2272 }
2273
2285 MatrixBlockArray& getMatrix() const
2286 {
2287 if (!matrixBlocks)
2288 createMatrix([](auto const& face) { return true; });
2289 return *matrixBlocks;
2290 }
2291
2292 private:
2293 // Returns the matrix, creating it on the fly if necessary.
2294 MatrixBlockArray& getMatrix(F const& f)
2295 {
2296 if (!matrixBlocks)
2297 createMatrix([&](auto const& face)
2298 {
2299 if constexpr (innerBoundaries)
2300 return f.considerFace(face);
2301 else
2302 return true;
2303 });
2304
2305 return *matrixBlocks;
2306 }
2307
2308
2309 template <class FaceOracle>
2310 void createMatrix(FaceOracle const& considerFace) const
2311 {
2312 matrixBlocks.reset(new MatrixBlockArray());
2313 boost::fusion::for_each(*matrixBlocks,[&](auto& block)
2314 {
2315 block.init(this->spaces(),gv.template begin<0>(),gv.template end<0>(),
2316 considerFace);
2317 });
2318 }
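// The considerFace oracle passed to createMatrix decides, face by face, whether the
// sparsity pattern needs couplings between the two adjacent cells (required for inner
// boundary terms). A minimal sketch of such a predicate, using a hypothetical helper
// material() that classifies cells:
//
//   auto considerFace = [&](auto const& face)
//   { // couple neighbours only across material interfaces (illustrative criterion)
//     return material(face.inside()) != material(face.outside());
//   };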
2319
2320 public:
2326 template <int first=0, int last=TestVariableSetDescription::noOfVariables>
2327 typename TestVariableSetDescription::template CoefficientVectorRepresentation<first,last>::type rhs() const
2328 {
2329 using Rhs = typename TestVariableSetDescription::template CoefficientVectorRepresentation<first,last>::type;
2330 return Rhs(make_range<first,last>(getRhs().first.data));
2331 }
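// Usage sketch (illustrative): obtaining the assembled rhs coefficient vector, e.g. as
// the right hand side of a Newton step (the sign convention here is only a sketch):
//
//   auto b = assembler.rhs();   // coefficient vector over all test variable blocks
//   b *= -1;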
2332
2333 protected:
2334 std::pair<RhsArray&,RhsBlockArray&> getRhs() const
2335 {
2336 if (!rhss)
2337 {
2338 // construct global vectors
2339// old version, should be equivalent to the following line.
2340// rhss.reset(new RhsArray(Variables_Detail::VariableRangeCreator<TestVariables,ConstructCoefficientVector<Spaces>>
2341// ::apply(ConstructCoefficientVector<Spaces>(spaces()))));
2342 rhss.reset(new RhsArray(TestVariableSetDescription::template CoefficientVectorRepresentation<>::init(spaces())));
2343 // construct block infos
2344 rhsBlocks.reset(new RhsBlockArray());
2345 // Choose the number of row groups in the matrix blocks. The obvious choice would be 1 in sequential mode, but it
2346 // appears that a somewhat larger number is beneficial, probably due to better memory access locality. For multithreaded
2347 // mode, we choose a multiple (rowBlockFactor) of the number of hardware threads as the default, since then all
2348 // threads can (in principle) be active simultaneously.
2349 int nrg = std::max((int)(rowBlockFactor*boost::thread::hardware_concurrency()),4);
2350 boost::fusion::for_each(*rhsBlocks,[&](auto& block)
2351 {
2352 block.init(this->spaces(),gv.template begin<0>(),gv.template end<0>(),nrg);
2353 });
2354 }
2355
2356 return std::pair<RhsArray&,RhsBlockArray&>(*rhss,*rhsBlocks);
2357 }
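// Worked example for the nrg choice above (illustrative): with rowBlockFactor = 2 on a
// machine reporting 8 hardware threads, nrg = max((int)(2*8),4) = 16 row groups per block,
// so up to 16 threads can scatter into disjoint row ranges concurrently without contention.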
2358
2359
2360 // Resource management: delete matrix and rhs data structures as well as cell ranges on
2361 // refinement since they are no longer meaningful on the new grid.
2362 void reactToRefinement(GridSignals::Status const status)
2363 {
2364 if (status == GridSignals::BeforeRefinement)
2365 flush();
2366 }
2367
2368
2369 // resource management
2370 boost::signals2::scoped_connection refConnection;
2371
2374 GridView const& gv;
2375 GridManagerBase<Grid> const& gridManager;
2376
2377 mutable std::shared_ptr<MatrixBlockArray> matrixBlocks; // matrix block info including global matrices
2378 mutable std::shared_ptr<RhsArray> rhss; // global rhs vectors
2379 mutable std::shared_ptr<RhsBlockArray> rhsBlocks; // rhs block info
2380 BoundaryDetector boundaryDetector;
2382
2383
2387 bool gatherTimings = false; // if true, use default Kaskade timings
2388
2389
2390 template <class IdxOutIter, class DataOutIter>
2391 struct BlockToTriplet
2392 {
2393 BlockToTriplet(size_t rbegin_, size_t cbegin_, std::vector<size_t> const& rowOff_, std::vector<size_t> const& colOff_,
2394 IdxOutIter& ri_, IdxOutIter& ci_, DataOutIter& xi_, bool extractOnlyLowerTriangle_):
2395 rbegin(rbegin_), cbegin(cbegin_), rowOff(rowOff_), colOff(colOff_),
2396 ri(ri_), ci(ci_), xi(xi_), extractOnlyLowerTriangle(extractOnlyLowerTriangle_)
2397 {}
2398
2399 template <class MatrixBlock>
2400 void operator()(MatrixBlock const& mb) const
2401 {
2402 // Check if block is in requested range
2403 if (inRange(mb.rowId,mb.colId))
2405 rowOff[MatrixBlock::rowId-rbegin],colOff[MatrixBlock::colId-cbegin],
2406 mb.rowId==mb.colId && extractOnlyLowerTriangle,
2407 mb.symmetric);
2408 // For mirror blocks, the transposed block needs to be written
2409 // if the transposed block is in the requested
2410 // range. Transposition is implicitly achieved by swapping
2411 // column and row index output iterators.
2412 if (MatrixBlock::mirror && inRange(mb.colId,mb.rowId) && extractOnlyLowerTriangle==false)
2414 colOff[MatrixBlock::rowId-cbegin],rowOff[MatrixBlock::colId-rbegin],
2415 false,
2416 mb.symmetric);
2417 }
2418
2419 bool inRange(size_t r, size_t c) const
2420 {
2421 return r>=rbegin && r<rbegin+rowOff.size() && c>=cbegin && c<cbegin+colOff.size();
2422 }
2423
2424
2425 size_t rbegin, cbegin;
2426 std::vector<size_t> const& rowOff;
2427 std::vector<size_t> const& colOff;
2428 IdxOutIter& ri;
2429 IdxOutIter& ci;
2430 DataOutIter& xi;
2431 bool extractOnlyLowerTriangle;
2432 };
2433
2434 struct CountNonzeros
2435 {
2436 CountNonzeros(size_t& n_, size_t rbegin_, size_t rend_, size_t cbegin_, size_t cend_, bool onlyLowerTriangle_):
2437 n(n_), rbegin(rbegin_), rend(rend_), cbegin(cbegin_), cend(cend_), onlyLowerTriangle(onlyLowerTriangle_)
2438 {}
2439
2440 template <class MatrixBlock>
2441 void operator()(MatrixBlock const& mb) const
2442 {
2443 size_t myN = Matrix_to_Triplet<typename MatrixBlock::Matrix>::nnz(mb.globalMatrix(),
2444 (mb.rowId==mb.colId) && onlyLowerTriangle,
2445 mb.symmetric);
2446 // Check if block is in requested range
2447 if (inRange(MatrixBlock::rowId,MatrixBlock::colId))
2448 n += myN;
2449
2450 // For mirrored blocks, the transposed block needs to be
2451 // counted as well, provided onlyLowerTriangle is false
2452 // and the transposed block is in the requested
2453 // range.
2454 if (MatrixBlock::mirror && inRange(mb.colId,mb.rowId) && onlyLowerTriangle==false)
2455 n += myN;
2456 }
2457
2458 bool inRange(size_t r, size_t c) const
2459 {
2460 return r>=rbegin && r<rend && c>=cbegin && c<cend;
2461 }
2462
2463
2464
2465 size_t& n;
2466 size_t rbegin, rend, cbegin, cend;
2467 bool onlyLowerTriangle;
2468 };
2469
2470 template <class DataOutIter>
2471 struct BlockToSequence
2472 {
2473 BlockToSequence(int& rbegin_, int& rend_, DataOutIter& out_): rbegin(rbegin_), rend(rend_), out(out_) {}
2474 template <class VectorBlock> void operator()(VectorBlock const& v) const
2475 {
2476 if (rbegin<=0 && rend>0)
2477 out = vectorToSequence(v,out);
2478 --rbegin;
2479 --rend;
2480 }
2481 private:
2482 int& rbegin;
2483 int& rend;
2484 DataOutIter& out;
2485 };
2486
2487 };
2488
2489
2490 // End of VariationalFunctionalAssembler
2491 //---------------------------------------------------------------------
2492 //---------------------------------------------------------------------
2493} /* end of namespace Kaskade */
2494
2495#endif