10 #ifndef EIGEN_CXX11_TENSOR_TENSOR_SHUFFLING_H
11 #define EIGEN_CXX11_TENSOR_TENSOR_SHUFFLING_H
23 template<
typename Shuffle,
typename XprType>
30 typedef typename XprType::Nested
Nested;
32 static const int NumDimensions = XprTraits::NumDimensions;
33 static const int Layout = XprTraits::Layout;
36 template<
typename Shuffle,
typename XprType>
42 template<
typename Shuffle,
typename XprType>
52 template<
typename Shuffle,
typename XprType>
77 Assign assign(*
this, other);
82 template<
typename OtherDerived>
87 Assign assign(*
this, other);
99 template<
typename Shuffle,
typename ArgType,
typename Device>
124 for (
int i = 0; i < NumDims; ++i) {
125 m_dimensions[i] = input_dims[shuffle[i]];
132 m_outputStrides[0] = 1;
133 for (
int i = 1; i < NumDims; ++i) {
134 inputStrides[i] = inputStrides[i - 1] * input_dims[i - 1];
135 m_outputStrides[i] = m_outputStrides[i - 1] * m_dimensions[i - 1];
138 inputStrides[NumDims - 1] = 1;
139 m_outputStrides[NumDims - 1] = 1;
140 for (
int i = NumDims - 2; i >= 0; --i) {
141 inputStrides[i] = inputStrides[i + 1] * input_dims[i + 1];
142 m_outputStrides[i] = m_outputStrides[i + 1] * m_dimensions[i + 1];
146 for (
int i = 0; i < NumDims; ++i) {
147 m_inputStrides[i] = inputStrides[shuffle[i]];
154 m_impl.evalSubExprsIfNeeded(NULL);
163 return m_impl.coeff(srcCoeff(index));
166 template<
int LoadMode>
173 for (
int i = 0; i < PacketSize; ++i) {
174 values[i] =
coeff(index+i);
181 const double compute_cost = NumDims * (2 * TensorOpCost::AddCost<Index>() +
182 2 * TensorOpCost::MulCost<Index>() +
183 TensorOpCost::DivCost<Index>());
184 return m_impl.costPerCoeff(vectorized) +
192 Index inputIndex = 0;
194 for (
int i = NumDims - 1; i > 0; --i) {
195 const Index idx = index / m_outputStrides[i];
196 inputIndex += idx * m_inputStrides[i];
197 index -= idx * m_outputStrides[i];
199 return inputIndex + index * m_inputStrides[0];
201 for (
int i = 0; i < NumDims - 1; ++i) {
202 const Index idx = index / m_outputStrides[i];
203 inputIndex += idx * m_inputStrides[i];
204 index -= idx * m_outputStrides[i];
206 return inputIndex + index * m_inputStrides[NumDims - 1];
218 template<
typename Shuffle,
typename ArgType,
typename Device>
220 :
public TensorEvaluator<const TensorShufflingOp<Shuffle, ArgType>, Device>
245 return this->
m_impl.coeffRef(this->srcCoeff(index));
254 internal::pstore<CoeffReturnType, PacketReturnType>(values,
x);
255 for (
int i = 0; i < PacketSize; ++i) {
256 this->
coeffRef(index+i) = values[i];
264 #endif // EIGEN_CXX11_TENSOR_TENSOR_SHUFFLING_H