TR-mbed/TensorInflation_8h_source.html

// This file is part of Eigen, a lightweight C++ template library

// for linear algebra.

//

// Copyright (C) 2015 Ke Yang <yangke@gmail.com>

//

// This Source Code Form is subject to the terms of the Mozilla

// Public License v. 2.0. If a copy of the MPL was not distributed

// with this file, You can obtain one at http://mozilla.org/MPL/2.0/.


#ifndef EIGEN_CXX11_TENSOR_TENSOR_INFLATION_H

#define EIGEN_CXX11_TENSOR_TENSOR_INFLATION_H


namespace Eigen {


namespace internal {

// Compile-time traits of TensorInflationOp. Apart from Scalar and Nested,
// which are read from the wrapped expression type itself, every entry is
// forwarded from the traits of the wrapped expression.
template<typename Strides, typename XprType>
struct traits<TensorInflationOp<Strides, XprType> > : public traits<XprType>
{
  // Traits of the expression being inflated.
  typedef traits<XprType> XprTraits;

  // Entries forwarded from the wrapped expression's traits.
  typedef typename XprTraits::StorageKind StorageKind;
  typedef typename XprTraits::Index Index;
  typedef typename XprTraits::PointerType PointerType;

  // Entries read directly from the wrapped expression type.
  typedef typename XprType::Scalar Scalar;
  typedef typename XprType::Nested Nested;
  typedef typename remove_reference<Nested>::type _Nested;

  // The number of dimensions and the storage layout are those of the
  // wrapped expression.
  static const int NumDimensions = XprTraits::NumDimensions;
  static const int Layout = XprTraits::Layout;
};


// For dense storage, the evaluated form of a TensorInflationOp is a const
// reference to the operation itself.
template<typename Strides, typename XprType>
struct eval<TensorInflationOp<Strides, XprType>, Eigen::Dense> {
  typedef TensorInflationOp<Strides, XprType> const& type;
};


// Nesting rule for TensorInflationOp: the nested type is the operation type
// itself (a plain value type, not a reference).
template<typename Strides, typename XprType>
struct nested<TensorInflationOp<Strides, XprType>, 1,
              typename eval<TensorInflationOp<Strides, XprType> >::type> {
  typedef TensorInflationOp<Strides, XprType> type;
};


}  // end namespace internal


// Read-only expression node that pairs a tensor expression with a set of
// per-dimension inflation strides. The node only stores its operand and a
// copy of the strides; the coefficients are produced by the matching
// TensorEvaluator specialization.
template<typename Strides, typename XprType>
class TensorInflationOp : public TensorBase<TensorInflationOp<Strides, XprType>, ReadOnlyAccessors>
{
  public:
    // Types taken from the traits / nested specializations of this op.
    typedef typename Eigen::internal::traits<TensorInflationOp>::Scalar Scalar;
    typedef typename Eigen::internal::traits<TensorInflationOp>::StorageKind StorageKind;
    typedef typename Eigen::internal::traits<TensorInflationOp>::Index Index;
    typedef typename Eigen::internal::nested<TensorInflationOp>::type Nested;

    // Types derived from the scalar type and from the wrapped expression.
    typedef typename Eigen::NumTraits<Scalar>::Real RealScalar;
    typedef typename XprType::CoeffReturnType CoeffReturnType;

    // Builds the node from the expression to inflate and the strides to
    // apply. The strides are copied into the node.
    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
    TensorInflationOp(const XprType& expr, const Strides& strides)
        : m_xpr(expr),
          m_strides(strides)
    {}

    // Inflation strides supplied at construction.
    EIGEN_DEVICE_FUNC
    const Strides& strides() const
    {
      return m_strides;
    }

    // The expression being inflated.
    EIGEN_DEVICE_FUNC
    const typename internal::remove_all<typename XprType::Nested>::type&
    expression() const
    {
      return m_xpr;
    }

  protected:
    typename XprType::Nested m_xpr;  // operand, stored as its Nested type
    const Strides m_strides;         // copy of the inflation strides
};


// Eval as rvalue
//
// Read-only evaluator for TensorInflationOp. Along every dimension, input
// coefficient k is placed at output position k * stride, so a non-empty input
// extent d becomes (d - 1) * stride + 1. Output positions that are not a
// multiple of the stride ("holes") evaluate to Scalar(0).
template<typename Strides, typename ArgType, typename Device>
struct TensorEvaluator<const TensorInflationOp<Strides, ArgType>, Device>
{
  typedef TensorInflationOp<Strides, ArgType> XprType;
  typedef typename XprType::Index Index;
  static const int NumDims = internal::array_size<typename TensorEvaluator<ArgType, Device>::Dimensions>::value;
  typedef DSizes<Index, NumDims> Dimensions;
  typedef typename XprType::Scalar Scalar;
  typedef typename XprType::CoeffReturnType CoeffReturnType;
  typedef typename PacketType<CoeffReturnType, Device>::type PacketReturnType;
  static const int PacketSize = PacketType<CoeffReturnType, Device>::size;
  typedef StorageMemory<CoeffReturnType, Device> Storage;
  typedef typename Storage::Type EvaluatorPointerType;

  enum {
    IsAligned = /*TensorEvaluator<ArgType, Device>::IsAligned*/ false,
    PacketAccess = TensorEvaluator<ArgType, Device>::PacketAccess,
    BlockAccess = false,
    PreferBlockAccess = false,
    Layout = TensorEvaluator<ArgType, Device>::Layout,
    CoordAccess = false,  // to be implemented
    RawAccess = false
  };

  //===- Tensor block evaluation strategy (see TensorBlock.h) -------------===//
  typedef internal::TensorBlockNotImplemented TensorBlock;
  //===--------------------------------------------------------------------===//

  // Builds the evaluator of the wrapped expression, then precomputes the
  // inflated dimensions, one fast divisor per inflation stride, and the
  // linear-index strides of both the input and the output for the active
  // Layout.
  EIGEN_STRONG_INLINE TensorEvaluator(const XprType& op, const Device& device)
      : m_impl(op.expression(), device), m_strides(op.strides())
  {
    m_dimensions = m_impl.dimensions();
    // Expand each dimension to the inflated dimension. An empty dimension
    // stays empty: without the guard, (0 - 1) * stride + 1 would yield a
    // negative extent for any stride greater than 1.
    for (int i = 0; i < NumDims; ++i) {
      if (m_dimensions[i] != 0) {
        m_dimensions[i] = (m_dimensions[i] - 1) * op.strides()[i] + 1;
      }
    }

    // Remember the strides for fast division.
    for (int i = 0; i < NumDims; ++i) {
      m_fastStrides[i] = internal::TensorIntDivisor<Index>(m_strides[i]);
    }

    const typename TensorEvaluator<ArgType, Device>::Dimensions& input_dims = m_impl.dimensions();
    if (static_cast<int>(Layout) == static_cast<int>(ColMajor)) {
      // Column-major: dimension 0 is contiguous.
      m_outputStrides[0] = 1;
      m_inputStrides[0] = 1;
      for (int i = 1; i < NumDims; ++i) {
        m_outputStrides[i] = m_outputStrides[i-1] * m_dimensions[i-1];
        m_inputStrides[i] = m_inputStrides[i-1] * input_dims[i-1];
      }
    } else {  // RowMajor
      // Row-major: the last dimension is contiguous.
      m_outputStrides[NumDims-1] = 1;
      m_inputStrides[NumDims-1] = 1;
      for (int i = NumDims - 2; i >= 0; --i) {
        m_outputStrides[i] = m_outputStrides[i+1] * m_dimensions[i+1];
        m_inputStrides[i] = m_inputStrides[i+1] * input_dims[i+1];
      }
    }
  }

  // Inflated (output) dimensions.
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Dimensions& dimensions() const { return m_dimensions; }

  // Forwards to the wrapped evaluator with a NULL destination and always
  // returns true; the destination pointer passed in is ignored.
  EIGEN_STRONG_INLINE bool evalSubExprsIfNeeded(EvaluatorPointerType /*data*/) {
    m_impl.evalSubExprsIfNeeded(NULL);
    return true;
  }

  // Releases whatever the wrapped evaluator holds.
  EIGEN_STRONG_INLINE void cleanup() {
    m_impl.cleanup();
  }

  // Computes the input index given the output index. Returns true if the output
  // index doesn't fall into a hole.
  //
  // The linear output index is decomposed one dimension at a time, starting
  // from the dimension with the largest output stride. As soon as one
  // coordinate is not a multiple of its inflation stride the function returns
  // false; *inputIndex then holds a partial sum and must not be used.
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE bool getInputIndex(Index index, Index* inputIndex) const
  {
    eigen_assert(index < dimensions().TotalSize());
    *inputIndex = 0;
    if (static_cast<int>(Layout) == static_cast<int>(ColMajor)) {
      EIGEN_UNROLL_LOOP
      for (int i = NumDims - 1; i > 0; --i) {
        // Output coordinate along dimension i.
        const Index idx = index / m_outputStrides[i];
        // Candidate input coordinate. It is computed once and reused below:
        // when the hole test passes, quotient * stride == idx, so quotient is
        // exactly idx / stride.
        const Index quotient = idx / m_fastStrides[i];
        if (idx != quotient * m_strides[i]) {
          return false;
        }
        *inputIndex += quotient * m_inputStrides[i];
        index -= idx * m_outputStrides[i];
      }
      // Innermost dimension: both the input and the output stride are 1.
      const Index quotient = index / m_fastStrides[0];
      if (index != quotient * m_strides[0]) {
        return false;
      }
      *inputIndex += quotient;
      return true;
    } else {
      EIGEN_UNROLL_LOOP
      for (int i = 0; i < NumDims - 1; ++i) {
        // Output coordinate along dimension i.
        const Index idx = index / m_outputStrides[i];
        // Candidate input coordinate, reused once the hole test has passed.
        const Index quotient = idx / m_fastStrides[i];
        if (idx != quotient * m_strides[i]) {
          return false;
        }
        *inputIndex += quotient * m_inputStrides[i];
        index -= idx * m_outputStrides[i];
      }
      // Innermost dimension: both the input and the output stride are 1.
      const Index quotient = index / m_fastStrides[NumDims-1];
      if (index != quotient * m_strides[NumDims-1]) {
        return false;
      }
      *inputIndex += quotient;
    }
    return true;
  }

  // Coefficient at linear output index `index`: the matching input
  // coefficient, or Scalar(0) when the index falls into a hole.
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index) const
  {
    Index inputIndex = 0;
    if (getInputIndex(index, &inputIndex)) {
      return m_impl.coeff(inputIndex);
    } else {
      return Scalar(0);
    }
  }

  // TODO(yangke): optimize this function so that we can detect and produce
  // all-zero packets
  //
  // Gathers PacketSize consecutive output coefficients through coeff() into
  // an aligned temporary and loads them as a single packet. LoadMode is not
  // used by this implementation.
  template<int LoadMode>
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketReturnType packet(Index index) const
  {
    EIGEN_STATIC_ASSERT((PacketSize > 1), YOU_MADE_A_PROGRAMMING_MISTAKE)
    eigen_assert(index+PacketSize-1 < dimensions().TotalSize());

    EIGEN_ALIGN_MAX typename internal::remove_const<CoeffReturnType>::type values[PacketSize];
    EIGEN_UNROLL_LOOP
    for (int i = 0; i < PacketSize; ++i) {
      values[i] = coeff(index+i);
    }
    PacketReturnType rslt = internal::pload<PacketReturnType>(values);
    return rslt;
  }

  // Cost estimate per output coefficient: the wrapped evaluator's cost plus
  // the index arithmetic performed for each dimension. The first TensorOpCost
  // argument is sizeof(CoeffReturnType) scaled by the input/output size
  // ratio. An empty output returns a default-constructed TensorOpCost, which
  // also avoids dividing by zero.
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
    const double compute_cost = NumDims * (3 * TensorOpCost::DivCost<Index>() +
                                           3 * TensorOpCost::MulCost<Index>() +
                                           2 * TensorOpCost::AddCost<Index>());
    const double input_size = m_impl.dimensions().TotalSize();
    const double output_size = m_dimensions.TotalSize();
    if (output_size == 0)
      return TensorOpCost();
    return m_impl.costPerCoeff(vectorized) +
           TensorOpCost(sizeof(CoeffReturnType) * input_size / output_size, 0,
                        compute_cost, vectorized, PacketSize);
  }

  // No raw buffer is exposed (RawAccess is false), so this is always NULL.
  EIGEN_DEVICE_FUNC EvaluatorPointerType data() const { return NULL; }

#ifdef EIGEN_USE_SYCL
  // binding placeholder accessors to a command group handler for SYCL
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE void bind(cl::sycl::handler &cgh) const {
    m_impl.bind(cgh);
  }
#endif

 protected:
  Dimensions m_dimensions;                  // inflated (output) dimensions
  array<Index, NumDims> m_outputStrides;    // linear-index strides of the output
  array<Index, NumDims> m_inputStrides;     // linear-index strides of the input
  TensorEvaluator<ArgType, Device> m_impl;  // evaluator of the wrapped expression
  const Strides m_strides;                  // copy of the inflation strides
  array<internal::TensorIntDivisor<Index>, NumDims> m_fastStrides;  // fast divisors, one per inflation stride
};


} // end namespace Eigen


#endif // EIGEN_CXX11_TENSOR_TENSOR_INFLATION_H

i
int i
Definition BiCGSTAB_step_by_step.cpp:9

EIGEN_ALIGN_MAX
#define EIGEN_ALIGN_MAX
Definition ConfigureVectorization.h:157

EIGEN_UNROLL_LOOP
#define EIGEN_UNROLL_LOOP
Definition Macros.h:1461

EIGEN_DEVICE_FUNC
#define EIGEN_DEVICE_FUNC
Definition Macros.h:976

eigen_assert
#define eigen_assert(x)
Definition Macros.h:1037

EIGEN_STRONG_INLINE
#define EIGEN_STRONG_INLINE
Definition Macros.h:917

EIGEN_STATIC_ASSERT
#define EIGEN_STATIC_ASSERT(CONDITION, MSG)
Definition StaticAssert.h:127

Eigen::CwiseBinaryOp
Generic expression where a coefficient-wise binary operator is applied to two expressions.
Definition CwiseBinaryOp.h:84

Eigen::TensorBase
The tensor base class.
Definition TensorBase.h:973

Eigen::TensorInflationOp
Definition TensorInflation.h:53

Eigen::TensorInflationOp::TensorInflationOp
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorInflationOp(const XprType &expr, const Strides &strides)
Definition TensorInflation.h:62

Eigen::TensorInflationOp::Scalar
Eigen::internal::traits< TensorInflationOp >::Scalar Scalar
Definition TensorInflation.h:55

Eigen::TensorInflationOp::RealScalar
Eigen::NumTraits< Scalar >::Real RealScalar
Definition TensorInflation.h:56

Eigen::TensorInflationOp::CoeffReturnType
XprType::CoeffReturnType CoeffReturnType
Definition TensorInflation.h:57

Eigen::TensorInflationOp::m_xpr
XprType::Nested m_xpr
Definition TensorInflation.h:73

Eigen::TensorInflationOp::expression
EIGEN_DEVICE_FUNC const internal::remove_all< typename XprType::Nested >::type & expression() const
Definition TensorInflation.h:70

Eigen::TensorInflationOp::strides
EIGEN_DEVICE_FUNC const Strides & strides() const
Definition TensorInflation.h:66

Eigen::TensorInflationOp::Nested
Eigen::internal::nested< TensorInflationOp >::type Nested
Definition TensorInflation.h:58

Eigen::TensorInflationOp::m_strides
const Strides m_strides
Definition TensorInflation.h:74

Eigen::TensorInflationOp::StorageKind
Eigen::internal::traits< TensorInflationOp >::StorageKind StorageKind
Definition TensorInflation.h:59

Eigen::TensorInflationOp::Index
Eigen::internal::traits< TensorInflationOp >::Index Index
Definition TensorInflation.h:60

Eigen::TensorOpCost
Definition TensorCostModel.h:25

Eigen::Triplet< double >

Eigen::array
Definition EmulateArray.h:21

Eigen::internal::TensorBlockNotImplemented
Definition TensorBlock.h:617

Eigen::internal::TensorLazyEvaluatorWritable
Definition TensorRef.h:81

Eigen::ColMajor
@ ColMajor
Definition Constants.h:319

Eigen
Namespace containing all symbols from the Eigen library.
Definition bench_norm.cpp:85

internal
Definition BandTriangularSolver.h:13

Eigen::DSizes
Definition TensorDimensions.h:263

Eigen::Dense
Definition Constants.h:507

Eigen::PacketType
Definition TensorMeta.h:50

Eigen::StorageMemory
Definition TensorForwardDeclarations.h:37

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::cleanup
EIGEN_STRONG_INLINE void cleanup()
Definition TensorInflation.h:144

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::Dimensions
DSizes< Index, NumDims > Dimensions
Definition TensorInflation.h:84

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::dimensions
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Dimensions & dimensions() const
Definition TensorInflation.h:138

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::Storage
StorageMemory< CoeffReturnType, Device > Storage
Definition TensorInflation.h:89

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_inputStrides
array< Index, NumDims > m_inputStrides
Definition TensorInflation.h:239

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_strides
const Strides m_strides
Definition TensorInflation.h:241

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::EvaluatorPointerType
Storage::Type EvaluatorPointerType
Definition TensorInflation.h:90

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::Index
XprType::Index Index
Definition TensorInflation.h:82

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_dimensions
Dimensions m_dimensions
Definition TensorInflation.h:237

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::data
EIGEN_DEVICE_FUNC EvaluatorPointerType data() const
Definition TensorInflation.h:227

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::getInputIndex
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE bool getInputIndex(Index index, Index *inputIndex) const
Definition TensorInflation.h:150

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::PacketReturnType
PacketType< CoeffReturnType, Device >::type PacketReturnType
Definition TensorInflation.h:87

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::coeff
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index) const
Definition TensorInflation.h:187

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::XprType
TensorInflationOp< Strides, ArgType > XprType
Definition TensorInflation.h:81

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::evalSubExprsIfNeeded
EIGEN_STRONG_INLINE bool evalSubExprsIfNeeded(EvaluatorPointerType)
Definition TensorInflation.h:140

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::TensorBlock
internal::TensorBlockNotImplemented TensorBlock
Definition TensorInflation.h:103

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::Scalar
XprType::Scalar Scalar
Definition TensorInflation.h:85

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_outputStrides
array< Index, NumDims > m_outputStrides
Definition TensorInflation.h:238

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::CoeffReturnType
XprType::CoeffReturnType CoeffReturnType
Definition TensorInflation.h:86

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_fastStrides
array< internal::TensorIntDivisor< Index >, NumDims > m_fastStrides
Definition TensorInflation.h:242

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::m_impl
TensorEvaluator< ArgType, Device > m_impl
Definition TensorInflation.h:240

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::packet
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketReturnType packet(Index index) const
Definition TensorInflation.h:200

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::costPerCoeff
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const
Definition TensorInflation.h:214

Eigen::TensorEvaluator< const TensorInflationOp< Strides, ArgType >, Device >::TensorEvaluator
EIGEN_STRONG_INLINE TensorEvaluator(const XprType &op, const Device &device)
Definition TensorInflation.h:106

Eigen::TensorEvaluator
A cost model used to limit the number of threads used for evaluating tensor expression.
Definition TensorEvaluator.h:29

Eigen::TensorEvaluator::Scalar
Derived::Scalar Scalar
Definition TensorEvaluator.h:31

Eigen::TensorEvaluator::dimensions
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE const Dimensions & dimensions() const
Definition TensorEvaluator.h:73

Eigen::TensorEvaluator::coeff
EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index) const
Definition TensorEvaluator.h:94

Eigen::TensorEvaluator::BlockAccess
@ BlockAccess
Definition TensorEvaluator.h:48

Eigen::TensorEvaluator::PreferBlockAccess
@ PreferBlockAccess
Definition TensorEvaluator.h:49

Eigen::TensorEvaluator::PacketAccess
@ PacketAccess
Definition TensorEvaluator.h:47

Eigen::TensorEvaluator::Layout
@ Layout
Definition TensorEvaluator.h:50

Eigen::TensorEvaluator::IsAligned
@ IsAligned
Definition TensorEvaluator.h:46

Eigen::TensorEvaluator::Dimensions
Derived::Dimensions Dimensions
Definition TensorEvaluator.h:34

Eigen::TensorEvaluator::PacketSize
static const int PacketSize
Definition TensorEvaluator.h:36

Eigen::internal::eval< TensorInflationOp< Strides, XprType >, Eigen::Dense >::type
const TensorInflationOp< Strides, XprType > & type
Definition TensorInflation.h:40

Eigen::internal::eval
Definition XprHelper.h:332

Eigen::internal::nested< TensorInflationOp< Strides, XprType >, 1, typename eval< TensorInflationOp< Strides, XprType > >::type >::type
TensorInflationOp< Strides, XprType > type
Definition TensorInflation.h:46

Eigen::internal::nested
Definition TensorTraits.h:175

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::XprTraits
traits< XprType > XprTraits
Definition TensorInflation.h:27

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::PointerType
XprTraits::PointerType PointerType
Definition TensorInflation.h:34

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::Scalar
XprType::Scalar Scalar
Definition TensorInflation.h:26

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::StorageKind
XprTraits::StorageKind StorageKind
Definition TensorInflation.h:28

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::Nested
XprType::Nested Nested
Definition TensorInflation.h:30

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::Index
XprTraits::Index Index
Definition TensorInflation.h:29

Eigen::internal::traits< TensorInflationOp< Strides, XprType > >::_Nested
remove_reference< Nested >::type _Nested
Definition TensorInflation.h:31

Eigen::internal::traits
Definition ForwardDeclarations.h:17