10#ifndef EIGEN_CXX11_TENSOR_TENSOR_FORCED_EVAL_H
11#define EIGEN_CXX11_TENSOR_TENSOR_FORCED_EVAL_H
14#include "./InternalHeaderCheck.h"
21template <
typename XprType>
22struct traits<TensorForcedEvalOp<XprType>> {
24 typedef typename XprType::Scalar Scalar;
25 typedef traits<XprType> XprTraits;
26 typedef typename traits<XprType>::StorageKind StorageKind;
27 typedef typename traits<XprType>::Index
Index;
28 typedef typename XprType::Nested Nested;
29 typedef std::remove_reference_t<Nested> Nested_;
30 static constexpr int NumDimensions = XprTraits::NumDimensions;
31 static constexpr int Layout = XprTraits::Layout;
32 typedef typename XprTraits::PointerType PointerType;
37template <
typename XprType>
38struct eval<TensorForcedEvalOp<XprType>, Eigen::Dense> {
39 typedef const TensorForcedEvalOp<XprType>& type;
42template <
typename XprType>
43struct nested<TensorForcedEvalOp<XprType>, 1, typename eval<TensorForcedEvalOp<XprType>>::type> {
44 typedef TensorForcedEvalOp<XprType> type;
54template <
typename XprType>
55class TensorForcedEvalOp :
public TensorBase<TensorForcedEvalOp<XprType>, ReadOnlyAccessors> {
57 typedef typename Eigen::internal::traits<TensorForcedEvalOp>::Scalar Scalar;
59 typedef std::remove_const_t<typename XprType::CoeffReturnType> CoeffReturnType;
60 typedef typename Eigen::internal::nested<TensorForcedEvalOp>::type Nested;
61 typedef typename Eigen::internal::traits<TensorForcedEvalOp>::StorageKind StorageKind;
62 typedef typename Eigen::internal::traits<TensorForcedEvalOp>::Index Index;
64 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorForcedEvalOp(
const XprType& expr) : m_xpr(expr) {}
66 EIGEN_DEVICE_FUNC
const internal::remove_all_t<typename XprType::Nested>& expression()
const {
return m_xpr; }
69 typename XprType::Nested m_xpr;
73template <
typename Device,
typename CoeffReturnType>
74struct non_integral_type_placement_new {
75 template <
typename StorageType>
76 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
void operator()(
Index numValues, StorageType m_buffer) {
78 if (!internal::is_arithmetic<CoeffReturnType>::value) {
87template <
typename CoeffReturnType>
88struct non_integral_type_placement_new<Eigen::SyclDevice, CoeffReturnType> {
89 template <
typename StorageType>
90 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
void operator()(
Index, StorageType) {}
94template <
typename Device>
95class DeviceTempPointerHolder {
97 DeviceTempPointerHolder(
const Device& device,
size_t size)
98 : device_(device), size_(size), ptr_(device.allocate_temp(size)) {}
100 ~DeviceTempPointerHolder() {
101 device_.deallocate_temp(ptr_);
106 void* ptr() {
return ptr_; }
114template <
typename ArgType_,
typename Device>
116 typedef const internal::remove_all_t<ArgType_> ArgType;
117 typedef TensorForcedEvalOp<ArgType> XprType;
118 typedef typename ArgType::Scalar Scalar;
119 typedef typename TensorEvaluator<ArgType, Device>::Dimensions Dimensions;
120 typedef typename XprType::Index Index;
121 typedef typename XprType::CoeffReturnType CoeffReturnType;
122 typedef typename PacketType<CoeffReturnType, Device>::type PacketReturnType;
123 static constexpr int PacketSize = PacketType<CoeffReturnType, Device>::size;
124 typedef typename Eigen::internal::traits<XprType>::PointerType TensorPointerType;
125 typedef StorageMemory<CoeffReturnType, Device> Storage;
126 typedef typename Storage::Type EvaluatorPointerType;
130 PacketAccess = (PacketType<CoeffReturnType, Device>::size > 1),
131 BlockAccess = internal::is_arithmetic<CoeffReturnType>::value,
132 PreferBlockAccess =
false,
136 static constexpr int Layout = TensorEvaluator<ArgType, Device>::Layout;
137 static constexpr int NumDims = internal::traits<ArgType>::NumDimensions;
140 typedef internal::TensorBlockDescriptor<NumDims, Index> TensorBlockDesc;
141 typedef internal::TensorBlockScratchAllocator<Device> TensorBlockScratch;
143 typedef typename internal::TensorMaterializedBlock<CoeffReturnType, NumDims, Layout, Index> TensorBlock;
146 TensorEvaluator(
const XprType& op,
const Device& device)
147 : m_impl(op.expression(), device),
148 m_op(op.expression()),
150 m_buffer_holder(nullptr),
153 ~TensorEvaluator() { cleanup(); }
155 EIGEN_DEVICE_FUNC
const Dimensions& dimensions()
const {
return m_impl.dimensions(); }
157 EIGEN_STRONG_INLINE
bool evalSubExprsIfNeeded(EvaluatorPointerType) {
158 const Index numValues = internal::array_prod(m_impl.dimensions());
159 m_buffer_holder = std::make_shared<DeviceTempPointerHolder<Device>>(m_device, numValues *
sizeof(CoeffReturnType));
160 m_buffer =
static_cast<EvaluatorPointerType
>(m_buffer_holder->ptr());
162 internal::non_integral_type_placement_new<Device, CoeffReturnType>()(numValues, m_buffer);
164 typedef TensorEvalToOp<const std::remove_const_t<ArgType>> EvalTo;
165 EvalTo evalToTmp(m_device.get(m_buffer), m_op);
167 internal::TensorExecutor<const EvalTo, std::remove_const_t<Device>,
168 internal::IsVectorizable<Device, const ArgType>::value,
169 internal::IsTileable<Device, const ArgType>::value>::run(evalToTmp, m_device);
174#ifdef EIGEN_USE_THREADS
175 template <
typename EvalSubExprsCallback>
176 EIGEN_STRONG_INLINE
void evalSubExprsIfNeededAsync(EvaluatorPointerType, EvalSubExprsCallback done) {
177 const Index numValues = internal::array_prod(m_impl.dimensions());
178 m_buffer_holder = std::make_shared<DeviceTempPointerHolder<Device>>(m_device, numValues *
sizeof(CoeffReturnType));
179 m_buffer =
static_cast<EvaluatorPointerType
>(m_buffer_holder->ptr());
181 typedef TensorEvalToOp<const std::remove_const_t<ArgType>> EvalTo;
182 EvalTo evalToTmp(m_device.get(m_buffer), m_op);
184 auto on_done = std::bind([](EvalSubExprsCallback done_) { done_(
true); }, std::move(done));
185 internal::TensorAsyncExecutor<
186 const EvalTo, std::remove_const_t<Device>,
decltype(on_done),
187 internal::IsVectorizable<Device, const ArgType>::value,
188 internal::IsTileable<Device, const ArgType>::value>::runAsync(evalToTmp, m_device,
193 EIGEN_STRONG_INLINE
void cleanup() {
194 m_buffer_holder =
nullptr;
198 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index)
const {
return m_buffer[index]; }
200 template <
int LoadMode>
201 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE PacketReturnType packet(Index index)
const {
202 return internal::ploadt<PacketReturnType, LoadMode>(m_buffer + index);
205 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE internal::TensorBlockResourceRequirements getResourceRequirements()
const {
206 return internal::TensorBlockResourceRequirements::any();
209 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorBlock block(TensorBlockDesc& desc, TensorBlockScratch& scratch,
210 bool =
false)
const {
211 eigen_assert(m_buffer !=
nullptr);
212 return TensorBlock::materialize(m_buffer, m_impl.dimensions(), desc, scratch);
215 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost costPerCoeff(
bool vectorized)
const {
216 return TensorOpCost(
sizeof(CoeffReturnType), 0, 0, vectorized, PacketSize);
219 EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE EvaluatorPointerType data()
const {
return m_buffer; }
222 TensorEvaluator<ArgType, Device> m_impl;
224 const Device EIGEN_DEVICE_REF m_device;
225 std::shared_ptr<DeviceTempPointerHolder<Device>> m_buffer_holder;
226 EvaluatorPointerType m_buffer;
The tensor base class.
Definition TensorForwardDeclarations.h:68
Tensor reshaping class.
Definition TensorForcedEval.h:55
Namespace containing all symbols from the Eigen library.
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The tensor evaluator class.
Definition TensorEvaluator.h:30