11#ifndef EIGEN_CXX11_TENSOR_TENSOR_ARG_MAX_H
12#define EIGEN_CXX11_TENSOR_TENSOR_ARG_MAX_H
// Traits for TensorIndexTupleOp<XprType>: inherits traits<XprType> and
// redefines the members listed below.
// NOTE(review): the braces of this struct are not visible in this listing.
17template<
typename XprType>
18struct traits<TensorIndexTupleOp<XprType> > :
public traits<XprType>
20 typedef traits<XprType> XprTraits;
21 typedef typename XprTraits::StorageKind StorageKind;
22 typedef typename XprTraits::Index
Index;
// The scalar type is a Tuple of (Index, scalar of the wrapped expression).
23 typedef Tuple<Index, typename XprTraits::Scalar> Scalar;
24 typedef typename XprType::Nested Nested;
25 typedef typename remove_reference<Nested>::type _Nested;
// Rank and layout are taken unchanged from the wrapped expression's traits.
26 static const int NumDimensions = XprTraits::NumDimensions;
27 static const int Layout = XprTraits::Layout;
// eval specialization for TensorIndexTupleOp with Eigen::Dense storage.
// `type` is a const TensorIndexTupleOp<XprType> followed by the
// EIGEN_DEVICE_REF macro (defined elsewhere; presumably a reference
// qualifier -- TODO confirm).
30template<
typename XprType>
31struct eval<TensorIndexTupleOp<XprType>, Eigen::Dense>
33 typedef const TensorIndexTupleOp<XprType>EIGEN_DEVICE_REF type;
// nested specialization for TensorIndexTupleOp: the nested type is the plain
// TensorIndexTupleOp<XprType> type itself (no reference or const qualifier).
36template<
typename XprType>
37struct nested<TensorIndexTupleOp<XprType>, 1,
38 typename eval<TensorIndexTupleOp<XprType> >::type>
40 typedef TensorIndexTupleOp<XprType> type;
// Expression node that wraps an expression of type XprType and exposes
// coefficients as Tuple<Index, value>. It derives from TensorBase with
// ReadOnlyAccessors.
50template<
typename XprType>
51class TensorIndexTupleOp :
public TensorBase<TensorIndexTupleOp<XprType>, ReadOnlyAccessors>
54 typedef typename Eigen::internal::traits<TensorIndexTupleOp>::Scalar Scalar;
56 typedef typename Eigen::internal::nested<TensorIndexTupleOp>::type Nested;
57 typedef typename Eigen::internal::traits<TensorIndexTupleOp>::StorageKind StorageKind;
58 typedef typename Eigen::internal::traits<TensorIndexTupleOp>::Index Index;
// A coefficient pairs an Index with the wrapped expression's CoeffReturnType.
59 typedef Tuple<Index, typename XprType::CoeffReturnType> CoeffReturnType;
// Constructor taking the expression to wrap.
// NOTE(review): the initializer list/body is not visible in this listing;
// presumably it initializes m_xpr from expr -- confirm.
61 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorIndexTupleOp(
const XprType& expr)
// Returns the stored wrapped expression (m_xpr) by const reference.
65 const typename internal::remove_all<typename XprType::Nested>::type&
66 expression()
const {
return m_xpr; }
// The wrapped expression, held as XprType::Nested.
69 typename XprType::Nested m_xpr;
// Evaluator that pairs each coefficient of an inner evaluator (m_impl, over
// ArgType) with its index.
// NOTE(review): the struct header and the XprType / CoeffReturnType typedefs
// used below are not visible in this listing; the constructor name indicates
// this is a TensorEvaluator specialization, presumably for
// const TensorIndexTupleOp<ArgType> -- confirm against the full file.
73template<
typename ArgType,
typename Device>
77 typedef typename XprType::Index
Index;
78 typedef typename XprType::Scalar
Scalar;
// Dimensions are those of the inner evaluator over ArgType.
81 typedef typename TensorEvaluator<ArgType, Device>::Dimensions
Dimensions;
82 static const int NumDims = internal::array_size<Dimensions>::value;
83 typedef StorageMemory<CoeffReturnType, Device> Storage;
84 typedef typename Storage::Type EvaluatorPointerType;
// Enumerators forwarded from the inner evaluator (the surrounding enum
// declaration and its other enumerators are not visible here).
90 PreferBlockAccess = TensorEvaluator<ArgType, Device>::PreferBlockAccess,
91 Layout = TensorEvaluator<ArgType, Device>::Layout,
// Block evaluation is declared as not implemented for this evaluator.
97 typedef internal::TensorBlockNotImplemented TensorBlock;
// Builds the inner evaluator from the wrapped expression and the device.
100 EIGEN_STRONG_INLINE TensorEvaluator(
const XprType& op,
const Device& device)
101 : m_impl(op.expression(), device) { }
// Returns the inner evaluator's dimensions unchanged.
103 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
const Dimensions& dimensions()
const {
104 return m_impl.dimensions();
// The pointer argument is unnamed and unused; the call is forwarded to the
// inner evaluator with NULL. The return statement is not visible here.
107 EIGEN_STRONG_INLINE
bool evalSubExprsIfNeeded(EvaluatorPointerType ) {
108 m_impl.evalSubExprsIfNeeded(NULL);
// NOTE(review): body not visible in this listing.
111 EIGEN_STRONG_INLINE
void cleanup() {
// Returns a tuple built from the requested index and the inner evaluator's
// coefficient at that same index.
115 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index)
const
117 return CoeffReturnType(index, m_impl.coeff(index));
// Inner evaluator's per-coefficient cost plus TensorOpCost(0, 0, 1)
// (third argument presumably compute cycles -- TODO confirm).
120 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost
121 costPerCoeff(
bool vectorized)
const {
122 return m_impl.costPerCoeff(vectorized) + TensorOpCost(0, 0, 1);
// Always returns NULL.
125 EIGEN_DEVICE_FUNC EvaluatorPointerType data()
const {
return NULL; }
// SYCL handler binding hook. NOTE(review): body not visible in this listing.
128 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
void bind(cl::sycl::handler &cgh)
const {
// Evaluator of the wrapped argument expression.
134 TensorEvaluator<ArgType, Device> m_impl;
// Traits for TensorTupleReducerOp<ReduceOp, Dims, XprType>: inherits
// traits<XprType> and redefines the members listed below.
145template<
typename ReduceOp,
typename Dims,
typename XprType>
146struct traits<TensorTupleReducerOp<ReduceOp, Dims, XprType> > :
public traits<XprType>
148 typedef traits<XprType> XprTraits;
149 typedef typename XprTraits::StorageKind StorageKind;
150 typedef typename XprTraits::Index Index;
// The scalar type of this expression is the index type itself.
151 typedef Index Scalar;
152 typedef typename XprType::Nested Nested;
153 typedef typename remove_reference<Nested>::type _Nested;
// Rank is the input rank minus the number of entries in Dims.
154 static const int NumDimensions = XprTraits::NumDimensions - array_size<Dims>::value;
155 static const int Layout = XprTraits::Layout;
// eval specialization for TensorTupleReducerOp with Eigen::Dense storage.
// `type` is a const TensorTupleReducerOp followed by the EIGEN_DEVICE_REF
// macro (defined elsewhere; presumably a reference qualifier -- TODO confirm).
158template<
typename ReduceOp,
typename Dims,
typename XprType>
159struct eval<TensorTupleReducerOp<ReduceOp, Dims, XprType>,
Eigen::Dense>
161 typedef const TensorTupleReducerOp<ReduceOp, Dims, XprType>EIGEN_DEVICE_REF type;
// nested specialization for TensorTupleReducerOp: the nested type is the
// plain TensorTupleReducerOp<ReduceOp, Dims, XprType> type itself.
164template<
typename ReduceOp,
typename Dims,
typename XprType>
165struct nested<TensorTupleReducerOp<ReduceOp, Dims, XprType>, 1,
166 typename eval<TensorTupleReducerOp<ReduceOp, Dims, XprType> >::type>
168 typedef TensorTupleReducerOp<ReduceOp, Dims, XprType> type;
// Read-only expression node that stores an input expression together with a
// reduction functor, the dimensions to reduce over, and a "return dimension".
// Its coefficient type is Index.
173template<
typename ReduceOp,
typename Dims,
typename XprType>
174class TensorTupleReducerOp :
public TensorBase<TensorTupleReducerOp<ReduceOp, Dims, XprType>, ReadOnlyAccessors>
177 typedef typename Eigen::internal::traits<TensorTupleReducerOp>::Scalar Scalar;
178 typedef typename Eigen::NumTraits<Scalar>::Real RealScalar;
179 typedef typename Eigen::internal::nested<TensorTupleReducerOp>::type Nested;
180 typedef typename Eigen::internal::traits<TensorTupleReducerOp>::StorageKind StorageKind;
181 typedef typename Eigen::internal::traits<TensorTupleReducerOp>::Index Index;
182 typedef Index CoeffReturnType;
// Stores copies of the reducer, return dimension and reduce dimensions, and
// initializes m_xpr from expr.
184 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorTupleReducerOp(
const XprType& expr,
185 const ReduceOp& reduce_op,
186 const Index return_dim,
187 const Dims& reduce_dims)
188 : m_xpr(expr), m_reduce_op(reduce_op), m_return_dim(return_dim), m_reduce_dims(reduce_dims) {}
// Returns the stored input expression.
191 const typename internal::remove_all<typename XprType::Nested>::type&
192 expression()
const {
return m_xpr; }
// Returns the stored reduction functor.
195 const ReduceOp& reduce_op()
const {
return m_reduce_op; }
// Returns the stored set of dimensions to reduce over.
198 const Dims& reduce_dims()
const {
return m_reduce_dims; }
// Returns the stored return dimension (by value).
201 Index return_dim()
const {
return m_return_dim; }
// Stored state; everything except m_xpr is const after construction.
204 typename XprType::Nested m_xpr;
205 const ReduceOp m_reduce_op;
206 const Index m_return_dim;
207 const Dims m_reduce_dims;
// Evaluator for TensorTupleReducerOp. It reduces a tensor of (index, value)
// tuples with ReduceOp over Dims and returns, per output coefficient, either
// the index stored in the winning tuple or that index converted to a
// coordinate along m_return_dim.
// NOTE(review): several lines of the original (braces, `else`, `return`
// statements, some member declarations) are not visible in this listing.
211template<
typename ReduceOp,
typename Dims,
typename ArgType,
typename Device>
212struct TensorEvaluator<const TensorTupleReducerOp<ReduceOp, Dims, ArgType>, Device>
214 typedef TensorTupleReducerOp<ReduceOp, Dims, ArgType> XprType;
215 typedef typename XprType::Index Index;
216 typedef typename XprType::Scalar Scalar;
217 typedef typename XprType::CoeffReturnType CoeffReturnType;
// Tuple type produced by the index-tuple expression over ArgType.
218 typedef typename TensorIndexTupleOp<ArgType>::CoeffReturnType TupleType;
// Output dimensions are those of the tuple reduction; InputDimensions are
// those of the un-reduced index-tuple expression.
219 typedef typename TensorEvaluator<const TensorReductionOp<ReduceOp, Dims, const TensorIndexTupleOp<ArgType> >, Device>::Dimensions Dimensions;
220 typedef typename TensorEvaluator<const TensorIndexTupleOp<ArgType> , Device>::Dimensions InputDimensions;
221 static const int NumDims = internal::array_size<InputDimensions>::value;
// One stride per input dimension.
222 typedef array<Index, NumDims> StrideDims;
223 typedef StorageMemory<CoeffReturnType, Device> Storage;
224 typedef typename Storage::Type EvaluatorPointerType;
225 typedef StorageMemory<TupleType, Device> TupleStorageMem;
// Enumerators (the surrounding enum declaration and its other enumerators
// are not visible here). Packet access is disabled.
229 PacketAccess =
false,
231 PreferBlockAccess = TensorEvaluator<ArgType, Device>::PreferBlockAccess,
232 Layout = TensorEvaluator<const TensorReductionOp<ReduceOp, Dims, const TensorIndexTupleOp<ArgType> >, Device>::Layout,
// Block evaluation is declared as not implemented for this evaluator.
238 typedef internal::TensorBlockNotImplemented TensorBlock;
// Builds two evaluators from op.expression(): m_orig_impl (un-reduced index
// tuples, used for input dimensions) and m_impl (index tuples reduced over
// op.reduce_dims() with op.reduce_op()). Then precomputes the modulus and
// divisor used by coeff() to turn a flat index into a coordinate.
241 EIGEN_STRONG_INLINE TensorEvaluator(
const XprType& op,
const Device& device)
242 : m_orig_impl(op.expression(), device),
243 m_impl(op.expression().index_tuples().reduce(op.reduce_dims(), op.reduce_op()), device),
244 m_return_dim(op.return_dim())
246 gen_strides(m_orig_impl.dimensions(), m_strides);
// ColMajor: the modulus is the stride of the next dimension, or the total
// element count when m_return_dim is the last dimension.
// NOTE(review): for m_return_dim == -1 the expression below reads
// m_strides[0]; gen_strides appears to leave m_strides unset when
// m_return_dim < 0 (its early-exit body is not visible) -- confirm. coeff()
// does not use m_stride_mod in that case.
247 if (Layout ==
static_cast<int>(
ColMajor)) {
248 const Index total_size = internal::array_prod(m_orig_impl.dimensions());
249 m_stride_mod = (m_return_dim < NumDims - 1) ? m_strides[m_return_dim + 1] : total_size;
// Presumably the non-ColMajor branch (the `else` line is not visible): the
// modulus is the stride of the previous dimension, or the total element count
// when m_return_dim is not greater than 0.
251 const Index total_size = internal::array_prod(m_orig_impl.dimensions());
252 m_stride_mod = (m_return_dim > 0) ? m_strides[m_return_dim - 1] : total_size;
// The divisor is the stride of m_return_dim; it falls back to 1 when
// m_return_dim is outside [0, m_strides.size()), avoiding an out-of-range read.
255 m_stride_div = ((m_return_dim >= 0) &&
256 (m_return_dim < static_cast<Index>(m_strides.size())))
257 ? m_strides[m_return_dim] : 1;
// Returns the dimensions of the reduced expression.
260 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
const Dimensions& dimensions()
const {
261 return m_impl.dimensions();
// The pointer argument is unnamed and unused; the call is forwarded to the
// reduction evaluator with NULL. The return statement is not visible here.
264 EIGEN_STRONG_INLINE
bool evalSubExprsIfNeeded(EvaluatorPointerType ) {
265 m_impl.evalSubExprsIfNeeded(NULL);
// NOTE(review): body not visible in this listing.
268 EIGEN_STRONG_INLINE
void cleanup() {
// Reads the reduced tuple at `index`. With a negative m_return_dim the
// tuple's `first` member (the stored index) is returned as-is; otherwise it
// is reduced modulo m_stride_mod and divided by m_stride_div, which yields
// the coordinate along m_return_dim given the strides from gen_strides.
272 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE CoeffReturnType coeff(Index index)
const {
273 const TupleType v = m_impl.coeff(index);
274 return (m_return_dim < 0) ? v.first : (v.first % m_stride_mod) / m_stride_div;
// Always returns NULL.
277 EIGEN_DEVICE_FUNC EvaluatorPointerType data()
const {
return NULL; }
// SYCL handler binding hook; forwards to m_orig_impl (other statements of
// the body, if any, are not visible in this listing).
279 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE
void bind(cl::sycl::handler &cgh)
const {
281 m_orig_impl.bind(cgh);
// Sum of both sub-evaluators' per-coefficient cost plus a TensorOpCost whose
// third argument is 1.0, increased by one modulo and one division on Index
// when m_return_dim is non-negative.
285 EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE TensorOpCost
286 costPerCoeff(
bool vectorized)
const {
287 const double compute_cost = 1.0 +
288 (m_return_dim < 0 ? 0.0 : (TensorOpCost::ModCost<Index>() + TensorOpCost::DivCost<Index>()));
289 return m_orig_impl.costPerCoeff(vectorized) +
290 m_impl.costPerCoeff(vectorized) + TensorOpCost(0, 0, compute_cost);
// Fills `strides` from `dims` according to Layout.
// NOTE(review): the body of the `m_return_dim < 0` guard is not visible;
// presumably it returns early -- confirm.
294 EIGEN_DEVICE_FUNC
void gen_strides(
const InputDimensions& dims, StrideDims& strides) {
295 if (m_return_dim < 0) {
298 eigen_assert(m_return_dim < NumDims &&
299 "Asking to convert index to a dimension outside of the rank");
// ColMajor: each stride is the previous stride times the previous dimension.
// NOTE(review): the initialization of strides[0] is not visible here.
303 if (Layout ==
static_cast<int>(
ColMajor)) {
305 for (
int i = 1; i < NumDims; ++i) {
306 strides[i] = strides[i-1] * dims[i-1];
// Presumably the non-ColMajor branch: the last stride is 1 and each earlier
// stride is the next stride times the next dimension.
309 strides[NumDims-1] = 1;
310 for (
int i = NumDims - 2; i >= 0; --i) {
311 strides[i] = strides[i+1] * dims[i+1];
// Evaluator of the un-reduced index-tuple expression.
317 TensorEvaluator<const TensorIndexTupleOp<ArgType>, Device> m_orig_impl;
// Evaluator of the tuple reduction.
318 TensorEvaluator<const TensorReductionOp<ReduceOp, Dims, const TensorIndexTupleOp<ArgType> >, Device> m_impl;
319 const Index m_return_dim;
// NOTE(review): declarations of m_stride_mod and m_stride_div, which are
// assigned in the constructor, are not visible in this listing.
320 StrideDims m_strides;
The tensor base class.
Definition TensorForwardDeclarations.h:56
Tensor + Index Pair class.
Definition TensorArgMax.h:52
Namespace containing all symbols from the Eigen library.
EIGEN_DEFAULT_DENSE_INDEX_TYPE Index
The tensor evaluator class.
Definition TensorEvaluator.h:27