#ifndef EIGEN_CXX11_TENSOR_TENSOR_FORCED_EVAL_H
#define EIGEN_CXX11_TENSOR_TENSOR_FORCED_EVAL_H

namespace Eigen {
namespace internal {
template<typename XprType>
struct traits<TensorForcedEvalOp<XprType> >
{
  // Type promotion to handle the case where the types of the lhs and the rhs are different.
  typedef typename XprType::Scalar Scalar;
  typedef traits<XprType> XprTraits;
  typedef typename XprTraits::StorageKind StorageKind;
  typedef typename XprTraits::Index Index;
  typedef typename XprType::Nested Nested;
  typedef std::remove_reference_t<Nested> Nested_;
  static constexpr int NumDimensions = XprTraits::NumDimensions;
  static constexpr int Layout = XprTraits::Layout;
  typedef typename XprTraits::PointerType PointerType;

  enum { Flags = 0 };
};
template<typename XprType>
struct eval<TensorForcedEvalOp<XprType>, Eigen::Dense>
{
  typedef const TensorForcedEvalOp<XprType>& type;
};
template<typename XprType>
struct nested<TensorForcedEvalOp<XprType>, 1, typename eval<TensorForcedEvalOp<XprType> >::type>
{
  typedef TensorForcedEvalOp<XprType> type;
};

}  // end namespace internal
template<typename XprType>
class TensorForcedEvalOp : public TensorBase<TensorForcedEvalOp<XprType>, ReadOnlyAccessors>
{
  public:
    typedef typename Eigen::internal::traits<TensorForcedEvalOp>::Scalar Scalar;
    typedef typename Eigen::NumTraits<Scalar>::Real RealScalar;
    typedef std::remove_const_t<typename XprType::CoeffReturnType> CoeffReturnType;
    typedef typename Eigen::internal::nested<TensorForcedEvalOp>::type Nested;
    typedef typename Eigen::internal::traits<TensorForcedEvalOp>::StorageKind StorageKind;
    typedef typename Eigen::internal::traits<TensorForcedEvalOp>::Index Index;

    EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorForcedEvalOp(const XprType& expr)
        : m_xpr(expr) {}

    EIGEN_DEVICE_FUNC const internal::remove_all_t<typename XprType::Nested>& expression() const {
      return m_xpr;
    }

  protected:
    typename XprType::Nested m_xpr;
};
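// Usage sketch: TensorForcedEvalOp is normally created through TensorBase::eval(), which
// forces the wrapped sub-expression to be materialized into a temporary buffer before the
// enclosing expression is evaluated. The tensor sizes and the broadcast below are
// illustrative only.
//
//   #include <unsupported/Eigen/CXX11/Tensor>
//
//   Eigen::Tensor<float, 2> a(64, 64), b(64, 64);
//   a.setRandom();
//   b.setRandom();
//
//   // Without eval(), (a + b) would be recomputed for every coefficient the broadcast
//   // reads; with eval(), it is computed once into a temporary and re-read from there.
//   Eigen::array<Eigen::Index, 2> bcast = {2, 2};
//   Eigen::Tensor<float, 2> c = (a + b).eval().broadcast(bcast);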
namespace internal {

template <typename Device, typename CoeffReturnType>
struct non_integral_type_placement_new {
  template <typename StorageType>
  EIGEN_STRONG_INLINE void operator()(Index numValues, StorageType m_buffer) {
    // Non-arithmetic coefficient types must be constructed in the raw buffer before use;
    // arithmetic types are left uninitialized, since their default construction is a no-op.
    if (!internal::is_arithmetic<CoeffReturnType>::value) {
      for (Index i = 0; i < numValues; ++i) new (m_buffer + i) CoeffReturnType();
    }
  }
};

// SYCL device code does not support placement new, so the buffer is left as allocated.
template <typename CoeffReturnType>
struct non_integral_type_placement_new<Eigen::SyclDevice, CoeffReturnType> {
  template <typename StorageType>
  EIGEN_STRONG_INLINE void operator()(Index, StorageType) {}
};

}  // end namespace internal
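// Minimal standalone sketch of the placement-new pattern used above, in plain C++
// (std::string stands in for any non-arithmetic CoeffReturnType; the function name is
// illustrative):
//
//   #include <new>
//   #include <string>
//
//   // Construct n default-initialized objects in raw, already-allocated storage.
//   void construct_in_place(std::string* raw, long n) {
//     for (long i = 0; i < n; ++i) new (raw + i) std::string();
//   }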
template<typename ArgType_, typename Device>
struct TensorEvaluator<const TensorForcedEvalOp<ArgType_>, Device>
{
  typedef const internal::remove_all_t<ArgType_> ArgType;
  typedef TensorForcedEvalOp<ArgType> XprType;
  typedef typename TensorEvaluator<ArgType, Device>::Dimensions Dimensions;
  typedef typename XprType::Index Index;
  typedef typename XprType::CoeffReturnType CoeffReturnType;
  typedef typename PacketType<CoeffReturnType, Device>::type PacketReturnType;
  typedef typename Eigen::internal::traits<XprType>::PointerType TensorPointerType;
  typedef StorageMemory<CoeffReturnType, Device> Storage;
  typedef typename Storage::Type EvaluatorPointerType;

  enum {
    IsAligned         = true,
    PacketAccess      = (PacketType<CoeffReturnType, Device>::size > 1),
    BlockAccess       = internal::is_arithmetic<CoeffReturnType>::value,
    PreferBlockAccess = false,
    RawAccess         = true
  };

  static constexpr int NumDims = internal::traits<ArgType>::NumDimensions;
  static constexpr int Layout = TensorEvaluator<ArgType, Device>::Layout;
  static constexpr int PacketSize = PacketType<CoeffReturnType, Device>::size;

  typedef internal::TensorBlockDescriptor<NumDims, Index> TensorBlockDesc;
  typedef internal::TensorBlockScratchAllocator<Device> TensorBlockScratch;
  typedef typename internal::TensorMaterializedBlock<CoeffReturnType, NumDims,
                                                     Layout, Index> TensorBlock;

  TensorEvaluator(const XprType& op, const Device& device)
      : m_impl(op.expression(), device), m_op(op.expression()),
        m_device(device), m_buffer(NULL) {}

  EIGEN_DEVICE_FUNC const Dimensions& dimensions() const { return m_impl.dimensions(); }

  EIGEN_STRONG_INLINE bool evalSubExprsIfNeeded(EvaluatorPointerType) {
    const Index numValues = internal::array_prod(m_impl.dimensions());
    m_buffer = m_device.get((CoeffReturnType*)m_device.allocate_temp(
        numValues * sizeof(CoeffReturnType)));

    // Non-trivial coefficient types must be constructed in the freshly allocated buffer.
    internal::non_integral_type_placement_new<Device, CoeffReturnType>()(numValues, m_buffer);

    typedef TensorEvalToOp<const std::remove_const_t<ArgType> > EvalTo;
    EvalTo evalToTmp(m_device.get(m_buffer), m_op);

    internal::TensorExecutor<
        const EvalTo, std::remove_const_t<Device>,
        /*Vectorizable=*/internal::IsVectorizable<Device, const ArgType>::value,
        /*Tiling=*/internal::IsTileable<Device, const ArgType>::value>::run(evalToTmp, m_device);

    return true;
  }
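  // At user level, the synchronous path above is equivalent to evaluating the wrapped
  // expression into a freshly allocated tensor (illustrative sketch; `expr`, `rows`,
  // `cols`, and the device `dev` are placeholders):
  //
  //   Eigen::Tensor<float, 2> tmp(rows, cols);   // plays the role of m_buffer
  //   tmp.device(dev) = expr;                    // TensorEvalToOp + TensorExecutor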
#ifdef EIGEN_USE_THREADS
  template <typename EvalSubExprsCallback>
  EIGEN_STRONG_INLINE void evalSubExprsIfNeededAsync(
      EvaluatorPointerType, EvalSubExprsCallback done) {
    const Index numValues = internal::array_prod(m_impl.dimensions());
    m_buffer = m_device.get((CoeffReturnType*)m_device.allocate_temp(
        numValues * sizeof(CoeffReturnType)));
    typedef TensorEvalToOp<const std::remove_const_t<ArgType> > EvalTo;
    EvalTo evalToTmp(m_device.get(m_buffer), m_op);

    // Signal completion through the caller-provided callback once the executor is done.
    auto on_done = std::bind([](EvalSubExprsCallback done_) { done_(true); },
                             std::move(done));
    internal::TensorAsyncExecutor<
        const EvalTo, std::remove_const_t<Device>, decltype(on_done),
        internal::IsVectorizable<Device, const ArgType>::value,
        internal::IsTileable<Device, const ArgType>::value>::
        runAsync(evalToTmp, m_device, std::move(on_done));
  }
#endif
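  // Hedged sketch of driving this asynchronous path from user code, assuming the
  // callback-taking device() overload available with EIGEN_USE_THREADS (`expr`, `rows`,
  // and `cols` are placeholders):
  //
  //   Eigen::ThreadPool pool(4);
  //   Eigen::ThreadPoolDevice dev(&pool, 4);
  //   Eigen::Tensor<float, 2> out(rows, cols);
  //   Eigen::Barrier done(1);
  //   out.device(dev, [&done]() { done.Notify(); }) = expr.eval();
  //   done.Wait();  // block until the async evaluation has completed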
  EIGEN_STRONG_INLINE void cleanup() {
    m_device.deallocate_temp(m_buffer);
    m_buffer = NULL;
  }

  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index) const {
    return m_buffer[index];
  }

  template<int LoadMode>
  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketReturnType packet(Index index) const {
    return internal::ploadt<PacketReturnType, LoadMode>(m_buffer + index);
  }

  EIGEN_DEVICE_FUNC internal::TensorBlockResourceRequirements getResourceRequirements() const {
    return internal::TensorBlockResourceRequirements::any();
  }

  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorBlock
  block(TensorBlockDesc& desc, TensorBlockScratch& scratch, bool /*root_of_expr_ast*/ = false) const {
    eigen_assert(m_buffer != NULL);
    return TensorBlock::materialize(m_buffer, m_impl.dimensions(), desc, scratch);
  }

  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(bool vectorized) const {
    return TensorOpCost(sizeof(CoeffReturnType), 0, 0, vectorized, PacketSize);
  }

  EIGEN_DEVICE_FUNC EvaluatorPointerType data() const { return m_buffer; }

 private:
  TensorEvaluator<ArgType, Device> m_impl;
  const ArgType m_op;
  const Device EIGEN_DEVICE_REF m_device;
  EvaluatorPointerType m_buffer;
};

}  // end namespace Eigen

#endif  // EIGEN_CXX11_TENSOR_TENSOR_FORCED_EVAL_H