TR-mbed/ConservativeSparseSparseProduct_8h_source.html

// This file is part of Eigen, a lightweight C++ template library

// for linear algebra.

//

// Copyright (C) 2008-2015 Gael Guennebaud <gael.guennebaud@inria.fr>

//

// This Source Code Form is subject to the terms of the Mozilla

// Public License v. 2.0. If a copy of the MPL was not distributed

// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.


#ifndef EIGEN_CONSERVATIVESPARSESPARSEPRODUCT_H

#define EIGEN_CONSERVATIVESPARSESPARSEPRODUCT_H


namespace Eigen {


namespace internal {


template<typename Lhs, typename Rhs, typename ResultType>

static void conservative_sparse_sparse_product_impl(const Lhs& lhs, const Rhs& rhs, ResultType& res, bool sortedInsertion = false)

{

  typedef typename remove_all<Lhs>::type::Scalar LhsScalar;

  typedef typename remove_all<Rhs>::type::Scalar RhsScalar;

  typedef typename remove_all<ResultType>::type::Scalar ResScalar;


  // make sure to call innerSize/outerSize since we fake the storage order.

  Index rows = lhs.innerSize();

  Index cols = rhs.outerSize();

  eigen_assert(lhs.outerSize() == rhs.innerSize());


  ei_declare_aligned_stack_constructed_variable(bool,   mask,     rows, 0);

  ei_declare_aligned_stack_constructed_variable(ResScalar, values,   rows, 0);

  ei_declare_aligned_stack_constructed_variable(Index,  indices,  rows, 0);


  std::memset(mask,0,sizeof(bool)*rows);


  evaluator<Lhs> lhsEval(lhs);

  evaluator<Rhs> rhsEval(rhs);


  // estimate the number of non zero entries

  // given a rhs column containing Y non zeros, we assume that the respective Y columns

  // of the lhs differs in average of one non zeros, thus the number of non zeros for

  // the product of a rhs column with the lhs is X+Y where X is the average number of non zero

  // per column of the lhs.

  // Therefore, we have nnz(lhs*rhs) = nnz(lhs) + nnz(rhs)

  Index estimated_nnz_prod = lhsEval.nonZerosEstimate() + rhsEval.nonZerosEstimate();


  res.setZero();

  res.reserve(Index(estimated_nnz_prod));

  // we compute each column of the result, one after the other

  for (Index j=0; j<cols; ++j)

  {


    res.startVec(j);

    Index nnz = 0;

    for (typename evaluator<Rhs>::InnerIterator rhsIt(rhsEval, j); rhsIt; ++rhsIt)

    {

      RhsScalar y = rhsIt.value();

      Index k = rhsIt.index();

      for (typename evaluator<Lhs>::InnerIterator lhsIt(lhsEval, k); lhsIt; ++lhsIt)

      {

        Index i = lhsIt.index();

        LhsScalar x = lhsIt.value();

        if(!mask[i])

        {

          mask[i] = true;

          values[i] = x * y;

          indices[nnz] = i;

          ++nnz;

        }

        else

          values[i] += x * y;

      }

    }

    if(!sortedInsertion)

    {

      // unordered insertion

      for(Index k=0; k<nnz; ++k)

      {

        Index i = indices[k];

        res.insertBackByOuterInnerUnordered(j,i) = values[i];

        mask[i] = false;

      }

    }

    else

    {

      // alternative ordered insertion code:

      const Index t200 = rows/11; // 11 == (log2(200)*1.39)

      const Index t = (rows*100)/139;


      // FIXME reserve nnz non zeros

      // FIXME implement faster sorting algorithms for very small nnz

      // if the result is sparse enough => use a quick sort

      // otherwise => loop through the entire vector

      // In order to avoid to perform an expensive log2 when the

      // result is clearly very sparse we use a linear bound up to 200.

      if((nnz<200 && nnz<t200) || nnz * numext::log2(int(nnz)) < t)

      {

        if(nnz>1) std::sort(indices,indices+nnz);

        for(Index k=0; k<nnz; ++k)

        {

          Index i = indices[k];

          res.insertBackByOuterInner(j,i) = values[i];

          mask[i] = false;

        }

      }

      else

      {

        // dense path

        for(Index i=0; i<rows; ++i)

        {

          if(mask[i])

          {

            mask[i] = false;

            res.insertBackByOuterInner(j,i) = values[i];

          }

        }

      }

    }

  }

  res.finalize();

}


} // end namespace internal


namespace internal {


// Dispatcher for sparse * sparse products evaluated into a sparse result.
// The three trailing integer parameters default to the storage order (RowMajor or ColMajor)
// derived from the RowMajorBit of traits<...>::Flags of the lhs, the rhs and the result type,
// in that order. This is a declaration only: the partial specializations on these three
// storage orders supply the static run(lhs, rhs, res) entry point.
template<typename Lhs, typename Rhs, typename ResultType,

  int LhsStorageOrder = (traits<Lhs>::Flags&RowMajorBit) ? RowMajor : ColMajor,

  int RhsStorageOrder = (traits<Rhs>::Flags&RowMajorBit) ? RowMajor : ColMajor,

  int ResStorageOrder = (traits<ResultType>::Flags&RowMajorBit) ? RowMajor : ColMajor>

struct conservative_sparse_sparse_product_selector;


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,ColMajor,ColMajor,ColMajor>

{

  typedef typename remove_all<Lhs>::type LhsCleaned;

  typedef typename LhsCleaned::Scalar Scalar;


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename ResultType::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorMatrix;

    typedef SparseMatrix<typename ResultType::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorMatrixAux;

    typedef typename sparse_eval<ColMajorMatrixAux,ResultType::RowsAtCompileTime,ResultType::ColsAtCompileTime,ColMajorMatrixAux::Flags>::type ColMajorMatrix;


    // If the result is tall and thin (in the extreme case a column vector)

    // then it is faster to sort the coefficients inplace instead of transposing twice.

    // FIXME, the following heuristic is probably not very good.

    if(lhs.rows()>rhs.cols())

    {

      ColMajorMatrix resCol(lhs.rows(),rhs.cols());

      // perform sorted insertion

      internal::conservative_sparse_sparse_product_impl<Lhs,Rhs,ColMajorMatrix>(lhs, rhs, resCol, true);

      res = resCol.markAsRValue();

    }

    else

    {

      ColMajorMatrixAux resCol(lhs.rows(),rhs.cols());

      // resort to transpose to sort the entries

      internal::conservative_sparse_sparse_product_impl<Lhs,Rhs,ColMajorMatrixAux>(lhs, rhs, resCol, false);

      RowMajorMatrix resRow(resCol);

      res = resRow.markAsRValue();

    }

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,RowMajor,ColMajor,ColMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Rhs::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorRhs;

    typedef SparseMatrix<typename ResultType::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorRes;

    RowMajorRhs rhsRow = rhs;

    RowMajorRes resRow(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<RowMajorRhs,Lhs,RowMajorRes>(rhsRow, lhs, resRow);

    res = resRow;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,ColMajor,RowMajor,ColMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Lhs::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorLhs;

    typedef SparseMatrix<typename ResultType::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorRes;

    RowMajorLhs lhsRow = lhs;

    RowMajorRes resRow(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<Rhs,RowMajorLhs,RowMajorRes>(rhs, lhsRow, resRow);

    res = resRow;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,RowMajor,RowMajor,ColMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename ResultType::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorMatrix;

    RowMajorMatrix resRow(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<Rhs,Lhs,RowMajorMatrix>(rhs, lhs, resRow);

    res = resRow;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,ColMajor,ColMajor,RowMajor>

{

  typedef typename traits<typename remove_all<Lhs>::type>::Scalar Scalar;


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename ResultType::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorMatrix;

    ColMajorMatrix resCol(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<Lhs,Rhs,ColMajorMatrix>(lhs, rhs, resCol);

    res = resCol;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,RowMajor,ColMajor,RowMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Lhs::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorLhs;

    typedef SparseMatrix<typename ResultType::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorRes;

    ColMajorLhs lhsCol = lhs;

    ColMajorRes resCol(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<ColMajorLhs,Rhs,ColMajorRes>(lhsCol, rhs, resCol);

    res = resCol;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,ColMajor,RowMajor,RowMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Rhs::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorRhs;

    typedef SparseMatrix<typename ResultType::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorRes;

    ColMajorRhs rhsCol = rhs;

    ColMajorRes resCol(lhs.rows(), rhs.cols());

    internal::conservative_sparse_sparse_product_impl<Lhs,ColMajorRhs,ColMajorRes>(lhs, rhsCol, resCol);

    res = resCol;

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct conservative_sparse_sparse_product_selector<Lhs,Rhs,ResultType,RowMajor,RowMajor,RowMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename ResultType::Scalar,RowMajor,typename ResultType::StorageIndex> RowMajorMatrix;

    typedef SparseMatrix<typename ResultType::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorMatrix;

    RowMajorMatrix resRow(lhs.rows(),rhs.cols());

    internal::conservative_sparse_sparse_product_impl<Rhs,Lhs,RowMajorMatrix>(rhs, lhs, resRow);

    // sort the non zeros:

    ColMajorMatrix resCol(resRow);

    res = resCol;

  }


};


} // end namespace internal


namespace internal {


template<typename Lhs, typename Rhs, typename ResultType>

static void sparse_sparse_to_dense_product_impl(const Lhs& lhs, const Rhs& rhs, ResultType& res)

{

  typedef typename remove_all<Lhs>::type::Scalar LhsScalar;

  typedef typename remove_all<Rhs>::type::Scalar RhsScalar;

  Index cols = rhs.outerSize();

  eigen_assert(lhs.outerSize() == rhs.innerSize());


  evaluator<Lhs> lhsEval(lhs);

  evaluator<Rhs> rhsEval(rhs);


  for (Index j=0; j<cols; ++j)

  {

    for (typename evaluator<Rhs>::InnerIterator rhsIt(rhsEval, j); rhsIt; ++rhsIt)

    {

      RhsScalar y = rhsIt.value();

      Index k = rhsIt.index();

      for (typename evaluator<Lhs>::InnerIterator lhsIt(lhsEval, k); lhsIt; ++lhsIt)

      {

        Index i = lhsIt.index();

        LhsScalar x = lhsIt.value();

        res.coeffRef(i,j) += x * y;

      }

    }

  }

}


} // end namespace internal


namespace internal {


// Dispatcher for sparse * sparse products accumulated into a dense result.
// The two trailing integer parameters default to the storage order (RowMajor or ColMajor)
// derived from the RowMajorBit of traits<...>::Flags of the lhs and of the rhs, in that order.
// This is a declaration only: the partial specializations on these two storage orders supply
// the static run(lhs, rhs, res) entry point.
template<typename Lhs, typename Rhs, typename ResultType,

  int LhsStorageOrder = (traits<Lhs>::Flags&RowMajorBit) ? RowMajor : ColMajor,

  int RhsStorageOrder = (traits<Rhs>::Flags&RowMajorBit) ? RowMajor : ColMajor>

struct sparse_sparse_to_dense_product_selector;


// Dense-result selector specialization: column-major lhs, column-major rhs.
template<typename Lhs, typename Rhs, typename ResultType>


struct sparse_sparse_to_dense_product_selector<Lhs,Rhs,ResultType,ColMajor,ColMajor>

{


  // Forwards lhs, rhs and res unchanged to sparse_sparse_to_dense_product_impl;
  // no operand conversion is performed in this specialization.
  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    internal::sparse_sparse_to_dense_product_impl<Lhs,Rhs,ResultType>(lhs, rhs, res);

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct sparse_sparse_to_dense_product_selector<Lhs,Rhs,ResultType,RowMajor,ColMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Lhs::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorLhs;

    ColMajorLhs lhsCol(lhs);

    internal::sparse_sparse_to_dense_product_impl<ColMajorLhs,Rhs,ResultType>(lhsCol, rhs, res);

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct sparse_sparse_to_dense_product_selector<Lhs,Rhs,ResultType,ColMajor,RowMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    typedef SparseMatrix<typename Rhs::Scalar,ColMajor,typename ResultType::StorageIndex> ColMajorRhs;

    ColMajorRhs rhsCol(rhs);

    internal::sparse_sparse_to_dense_product_impl<Lhs,ColMajorRhs,ResultType>(lhs, rhsCol, res);

  }


};


template<typename Lhs, typename Rhs, typename ResultType>


struct sparse_sparse_to_dense_product_selector<Lhs,Rhs,ResultType,RowMajor,RowMajor>

{


  static void run(const Lhs& lhs, const Rhs& rhs, ResultType& res)

  {

    Transpose<ResultType> trRes(res);

    internal::sparse_sparse_to_dense_product_impl<Rhs,Lhs,Transpose<ResultType> >(rhs, lhs, trRes);

  }


};


} // end namespace internal


} // end namespace Eigen


#endif // EIGEN_CONSERVATIVESPARSESPARSEPRODUCT_H

i
int i
Definition BiCGSTAB_step_by_step.cpp:9

eigen_assert
#define eigen_assert(x)
Definition Macros.h:1037

ei_declare_aligned_stack_constructed_variable
#define ei_declare_aligned_stack_constructed_variable(TYPE, NAME, SIZE, BUFFER)
Definition Memory.h:768

res
cout<< "Here is the matrix m:"<< endl<< m<< endl;Matrix< ptrdiff_t, 3, 1 > res
Definition PartialRedux_count.cpp:3

rows
int rows
Definition Tutorial_commainit_02.cpp:1

cols
int cols
Definition Tutorial_commainit_02.cpp:1

Scalar
SCALAR Scalar
Definition bench_gemm.cpp:46

Eigen::Triplet< double >

x
set noclip points set clip one set noclip two set bar set border lt lw set xdata set ydata set zdata set x2data set y2data set boxwidth set dummy x
Definition gnuplot_common_settings.hh:12

Eigen::ColMajor
@ ColMajor
Definition Constants.h:319

Eigen::RowMajor
@ RowMajor
Definition Constants.h:321

Eigen::RowMajorBit
const unsigned int RowMajorBit
Definition Constants.h:66

int
return int(ret)+1

Eigen::internal::y
const Scalar & y
Definition MathFunctions.h:821

Eigen::internal::Lhs
@ Lhs
Definition TensorContractionMapper.h:19

Eigen::internal::Rhs
@ Rhs
Definition TensorContractionMapper.h:18

Eigen::numext::log2
int log2(int x)
Definition MathFunctions.h:1441

Eigen
Namespace containing all symbols from the Eigen library.
Definition bench_norm.cpp:85

Eigen::Index
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The Index type as used for the API.
Definition Meta.h:74

internal
Definition BandTriangularSolver.h:13

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, RowMajor, ColMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:224

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, RowMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:238

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, RowMajor, RowMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:252

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, RowMajor, ColMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:169

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, RowMajor, RowMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:197

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor, RowMajor >::Scalar
traits< typenameremove_all< Lhs >::type >::Scalar Scalar
Definition ConservativeSparseSparseProduct.h:210

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:212

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:139

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor, ColMajor >::Scalar
LhsCleaned::Scalar Scalar
Definition ConservativeSparseSparseProduct.h:137

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor, ColMajor >::LhsCleaned
remove_all< Lhs >::type LhsCleaned
Definition ConservativeSparseSparseProduct.h:136

Eigen::internal::conservative_sparse_sparse_product_selector< Lhs, Rhs, ResultType, ColMajor, RowMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:183

Eigen::internal::conservative_sparse_sparse_product_selector
Definition ConservativeSparseSparseProduct.h:131

Eigen::internal::sparse_sparse_to_dense_product_selector< Lhs, Rhs, ResultType, ColMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:329

Eigen::internal::sparse_sparse_to_dense_product_selector< Lhs, Rhs, ResultType, ColMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:309

Eigen::internal::sparse_sparse_to_dense_product_selector< Lhs, Rhs, ResultType, RowMajor, ColMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:318

Eigen::internal::sparse_sparse_to_dense_product_selector< Lhs, Rhs, ResultType, RowMajor, RowMajor >::run
static void run(const Lhs &lhs, const Rhs &rhs, ResultType &res)
Definition ConservativeSparseSparseProduct.h:340

Eigen::internal::sparse_sparse_to_dense_product_selector
Definition ConservativeSparseSparseProduct.h:304

Eigen::internal::traits
Definition ForwardDeclarations.h:17

j
std::ptrdiff_t j
Definition tut_arithmetic_redux_minmax.cpp:2