13 #ifndef EIGEN_PRODUCTEVALUATORS_H
14 #define EIGEN_PRODUCTEVALUATORS_H
28 template<
typename Lhs,
typename Rhs,
int Options>
40 template<
typename Lhs,
typename Rhs,
typename Scalar1,
typename Scalar2,
typename Plain1>
42 const
CwiseNullaryOp<internal::scalar_constant_op<Scalar1>, Plain1>,
43 const
Product<Lhs, Rhs, DefaultProduct> > >
47 template<
typename Lhs,
typename Rhs,
typename Scalar1,
typename Scalar2,
typename Plain1>
49 const
CwiseNullaryOp<internal::scalar_constant_op<Scalar1>, Plain1>,
50 const
Product<Lhs, Rhs, DefaultProduct> > >
51 :
public evaluator<Product<EIGEN_SCALAR_BINARYOP_EXPR_RETURN_TYPE(Scalar1,Lhs,product), Rhs, DefaultProduct> >
59 :
Base(xpr.lhs().functor().m_other * xpr.rhs().lhs() * xpr.rhs().rhs())
64 template<
typename Lhs,
typename Rhs,
int DiagIndex>
66 :
public evaluator<Diagonal<const Product<Lhs, Rhs, LazyProduct>, DiagIndex> >
82 template<
typename Lhs,
typename Rhs,
88 template<
typename Lhs,
typename Rhs>
95 template<
typename Lhs,
typename Rhs,
int Options,
int ProductTag,
typename LhsShape,
typename RhsShape>
97 :
public evaluator<typename Product<Lhs, Rhs, Options>::PlainObject>
108 : m_result(xpr.rows(), xpr.cols())
110 ::new (
static_cast<Base*
>(
this))
Base(m_result);
135 template<
typename DstXprType,
typename Lhs,
typename Rhs,
int Options,
typename Scalar>
137 typename
enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
145 if((dst.rows()!=dstRows) || (dst.cols()!=dstCols))
146 dst.resize(dstRows, dstCols);
153 template<
typename DstXprType,
typename Lhs,
typename Rhs,
int Options,
typename Scalar>
155 typename
enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
168 template<
typename DstXprType,
typename Lhs,
typename Rhs,
int Options,
typename Scalar>
170 typename
enable_if<(Options==DefaultProduct || Options==AliasFreeProduct)>::type>
186 template<
typename DstXprType,
typename Lhs,
typename Rhs,
typename AssignFunc,
typename Scalar,
typename ScalarBis,
typename Plain>
204 template<
typename OtherXpr,
typename Lhs,
typename Rhs>
210 template<
typename OtherXpr,
typename Lhs,
typename Rhs>
216 template<
typename DstXprType,
typename OtherXpr,
typename ProductType,
typename Func1,
typename Func2>
219 template<
typename SrcXprType,
typename InitialFunc>
221 void run(DstXprType &dst,
const SrcXprType &src,
const InitialFunc& )
228 #define EIGEN_CATCH_ASSIGN_XPR_OP_PRODUCT(ASSIGN_OP,BINOP,ASSIGN_OP2) \
229 template< typename DstXprType, typename OtherXpr, typename Lhs, typename Rhs, typename DstScalar, typename SrcScalar, typename OtherScalar,typename ProdScalar> \
230 struct Assignment<DstXprType, CwiseBinaryOp<internal::BINOP<OtherScalar,ProdScalar>, const OtherXpr, \
231 const Product<Lhs,Rhs,DefaultProduct> >, internal::ASSIGN_OP<DstScalar,SrcScalar>, Dense2Dense> \
232 : assignment_from_xpr_op_product<DstXprType, OtherXpr, Product<Lhs,Rhs,DefaultProduct>, internal::ASSIGN_OP<DstScalar,OtherScalar>, internal::ASSIGN_OP2<DstScalar,ProdScalar> > \
245 template<
typename Lhs,
typename Rhs>
248 template<
typename Dst>
251 dst.coeffRef(0,0) = (lhs.transpose().cwiseProduct(rhs)).sum();
254 template<
typename Dst>
257 dst.coeffRef(0,0) += (lhs.transpose().cwiseProduct(rhs)).sum();
260 template<
typename Dst>
262 { dst.coeffRef(0,0) -= (lhs.transpose().cwiseProduct(rhs)).sum(); }
271 template<
typename Dst,
typename Lhs,
typename Rhs,
typename Func>
278 const Index cols = dst.cols();
279 for (
Index j=0; j<cols; ++j)
280 func(dst.col(j), rhsEval.coeff(
Index(0),j) * actual_lhs);
284 template<
typename Dst,
typename Lhs,
typename Rhs,
typename Func>
291 const Index rows = dst.rows();
292 for (
Index i=0; i<rows; ++i)
293 func(dst.row(i), lhsEval.coeff(i,
Index(0)) * actual_rhs);
296 template<
typename Lhs,
typename Rhs>
// Compile-time trait on an expression type T.
// It tests RowMajorBit in T::Flags (cast to int first) and inherits from the
// type that internal::conditional produces for that test -- presumably
// internal::true_type when the bit is set and internal::false_type otherwise.
// NOTE(review): assumes internal::conditional mirrors std::conditional; confirm.
299 template<
typename T>
struct is_row_major :
internal::conditional<(int(T::Flags)&RowMajorBit), internal::true_type, internal::false_type>::type {};
// Stateless functor: its call operator performs plain assignment, dst = src.
// dst is received by const reference, so the write goes through
// dst.const_cast_derived() -- presumably a mutable view of the same
// expression (TODO confirm against the expression base class).
303 struct set {
template<
typename Dst,
typename Src>
void operator()(
const Dst& dst,
const Src& src)
const { dst.const_cast_derived() = src; } };
// Stateless functor: its call operator accumulates src into dst (dst += src).
// dst is received by const reference, so the update goes through
// dst.const_cast_derived() -- presumably a mutable view of the same
// expression (TODO confirm against the expression base class).
304 struct add {
template<
typename Dst,
typename Src>
void operator()(
const Dst& dst,
const Src& src)
const { dst.const_cast_derived() += src; } };
// Stateless functor: its call operator subtracts src from dst (dst -= src).
// dst is received by const reference, so the update goes through
// dst.const_cast_derived() -- presumably a mutable view of the same
// expression (TODO confirm against the expression base class).
305 struct sub {
template<
typename Dst,
typename Src>
void operator()(
const Dst& dst,
const Src& src)
const { dst.const_cast_derived() -= src; } };
309 template<
typename Dst,
typename Src>
void operator()(
const Dst& dst,
const Src& src)
const {
310 dst.const_cast_derived() += m_scale * src;
314 template<
typename Dst>
320 template<
typename Dst>
326 template<
typename Dst>
332 template<
typename Dst>
342 template<
typename Lhs,
typename Rhs,
typename Derived>
347 template<
typename Dst>
351 template<
typename Dst>
355 template<
typename Dst>
359 template<
typename Dst>
361 { Derived::scaleAndAddTo(dst,lhs,rhs,
alpha); }
365 template<
typename Lhs,
typename Rhs>
375 template<
typename Dest>
387 template<
typename Lhs,
typename Rhs>
392 template<
typename Dst>
400 template<
typename Dst>
407 template<
typename Dst>
420 template<
typename Lhs,
typename Rhs>
430 template<
int Traversal,
int UnrollingIndex,
typename Lhs,
typename Rhs,
typename RetScalar>
433 template<
int StorageOrder,
int UnrollingIndex,
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
436 template<
typename Lhs,
typename Rhs,
int ProductTag>
451 m_innerDim(xpr.lhs().cols())
457 std::cerr <<
"LhsOuterStrideBytes= " << LhsOuterStrideBytes <<
"\n";
458 std::cerr <<
"RhsOuterStrideBytes= " << RhsOuterStrideBytes <<
"\n";
459 std::cerr <<
"LhsAlignment= " << LhsAlignment <<
"\n";
460 std::cerr <<
"RhsAlignment= " << RhsAlignment <<
"\n";
461 std::cerr <<
"CanVectorizeLhs= " << CanVectorizeLhs <<
"\n";
462 std::cerr <<
"CanVectorizeRhs= " << CanVectorizeRhs <<
"\n";
463 std::cerr <<
"CanVectorizeInner= " << CanVectorizeInner <<
"\n";
464 std::cerr <<
"EvalToRowMajor= " << EvalToRowMajor <<
"\n";
465 std::cerr <<
"Alignment= " << Alignment <<
"\n";
466 std::cerr <<
"Flags= " << Flags <<
"\n";
482 RowsAtCompileTime = LhsNestedCleaned::RowsAtCompileTime,
483 ColsAtCompileTime = RhsNestedCleaned::ColsAtCompileTime,
485 MaxRowsAtCompileTime = LhsNestedCleaned::MaxRowsAtCompileTime,
486 MaxColsAtCompileTime = RhsNestedCleaned::MaxColsAtCompileTime
494 LhsCoeffReadCost = LhsEtorType::CoeffReadCost,
495 RhsCoeffReadCost = RhsEtorType::CoeffReadCost,
503 LhsFlags = LhsEtorType::Flags,
504 RhsFlags = RhsEtorType::Flags,
518 CanVectorizeRhs = bool(RhsRowMajor) && (RhsFlags &
PacketAccessBit) && (ColsAtCompileTime!=1),
519 CanVectorizeLhs = (!LhsRowMajor) && (LhsFlags &
PacketAccessBit) && (RowsAtCompileTime!=1),
521 EvalToRowMajor = (MaxRowsAtCompileTime==1&&MaxColsAtCompileTime!=1) ? 1
522 : (MaxColsAtCompileTime==1&&MaxRowsAtCompileTime!=1) ? 0
523 : (
bool(RhsRowMajor) && !CanVectorizeLhs),
528 | (SameType && (CanVectorizeLhs || CanVectorizeRhs) ?
PacketAccessBit : 0)
534 Alignment = bool(CanVectorizeLhs) ? (LhsOuterStrideBytes<=0 || (
int(LhsOuterStrideBytes) %
EIGEN_PLAIN_ENUM_MAX(1,LhsAlignment))!=0 ? 0 : LhsAlignment)
535 : bool(CanVectorizeRhs) ? (RhsOuterStrideBytes<=0 || (
int(RhsOuterStrideBytes) %
EIGEN_PLAIN_ENUM_MAX(1,RhsAlignment))!=0 ? 0 : RhsAlignment)
543 CanVectorizeInner = SameType
552 return (m_lhs.row(
row).transpose().cwiseProduct( m_rhs.col(
col) )).sum();
561 const Index row = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? 0 : index;
562 const Index col = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? index : 0;
563 return (m_lhs.row(
row).transpose().cwiseProduct( m_rhs.col(
col) )).sum();
566 template<
int LoadMode,
typename PacketType>
577 template<
int LoadMode,
typename PacketType>
580 const Index row = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? 0 : index;
581 const Index col = (RowsAtCompileTime == 1 || MaxRowsAtCompileTime==1) ? index : 0;
582 return packet<LoadMode,PacketType>(
row,
col);
596 template<
typename Lhs,
typename Rhs>
598 :
product_evaluator<Product<Lhs, Rhs, LazyProduct>, CoeffBasedProductMode, DenseShape, DenseShape>
615 template<
int UnrollingIndex,
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
620 etor_product_packet_impl<RowMajor, UnrollingIndex-1, Lhs, Rhs, Packet, LoadMode>::run(
row,
col, lhs, rhs, innerDim, res);
621 res =
pmadd(pset1<Packet>(lhs.coeff(
row,
Index(UnrollingIndex-1))), rhs.template packet<LoadMode,Packet>(
Index(UnrollingIndex-1),
col), res);
625 template<
int UnrollingIndex,
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
630 etor_product_packet_impl<ColMajor, UnrollingIndex-1, Lhs, Rhs, Packet, LoadMode>::run(
row,
col, lhs, rhs, innerDim, res);
631 res =
pmadd(lhs.template packet<LoadMode,Packet>(
row,
Index(UnrollingIndex-1)), pset1<Packet>(rhs.coeff(
Index(UnrollingIndex-1),
col)), res);
635 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
640 res =
pmul(pset1<Packet>(lhs.coeff(
row,
Index(0))),rhs.template packet<LoadMode,Packet>(
Index(0),
col));
644 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
649 res =
pmul(lhs.template packet<LoadMode,Packet>(
row,
Index(0)), pset1<Packet>(rhs.coeff(
Index(0),
col)));
653 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
662 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
671 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
677 for(
Index i = 0; i < innerDim; ++i)
678 res =
pmadd(pset1<Packet>(lhs.coeff(
row, i)), rhs.template packet<LoadMode,Packet>(i,
col), res);
682 template<
typename Lhs,
typename Rhs,
typename Packet,
int LoadMode>
688 for(
Index i = 0; i < innerDim; ++i)
689 res =
pmadd(lhs.template packet<LoadMode,Packet>(
row, i), pset1<Packet>(rhs.coeff(i,
col)), res);
697 template<
int Mode,
bool LhsIsTriangular,
698 typename Lhs,
bool LhsIsVector,
699 typename Rhs,
bool RhsIsVector>
702 template<
typename Lhs,
typename Rhs,
int ProductTag>
708 template<
typename Dest>
712 ::run(dst, lhs.nestedExpression(), rhs,
alpha);
716 template<
typename Lhs,
typename Rhs,
int ProductTag>
722 template<
typename Dest>
733 template <
typename Lhs,
int LhsMode,
bool LhsIsVector,
734 typename Rhs,
int RhsMode,
bool RhsIsVector>
737 template<
typename Lhs,
typename Rhs,
int ProductTag>
743 template<
typename Dest>
750 template<
typename Lhs,
typename Rhs,
int ProductTag>
756 template<
typename Dest>
768 template<
typename MatrixType,
typename DiagonalType,
typename Derived,
int ProductOrder>
791 || (DiagonalType::SizeAtCompileTime==
Dynamic && MatrixType::RowsAtCompileTime==1 && ProductOrder==
OnTheLeft)
792 || (DiagonalType::SizeAtCompileTime==
Dynamic && MatrixType::ColsAtCompileTime==1 && ProductOrder==
OnTheRight)
811 template<
int LoadMode,
typename PacketType>
815 internal::pset1<PacketType>(
m_diagImpl.coeff(
id)));
818 template<
int LoadMode,
typename PacketType>
822 InnerSize = (MatrixType::Flags &
RowMajorBit) ? MatrixType::ColsAtCompileTime : MatrixType::RowsAtCompileTime,
826 m_diagImpl.template packet<DiagonalPacketLoadMode,PacketType>(
id));
834 template<
typename Lhs,
typename Rhs,
int ProductKind,
int ProductTag>
839 using Base::m_diagImpl;
840 using Base::m_matImpl;
852 :
Base(xpr.rhs(), xpr.lhs().diagonal())
858 return m_diagImpl.coeff(
row) * m_matImpl.coeff(
row,
col);
862 template<
int LoadMode,
typename PacketType>
867 return this->
template packet_impl<LoadMode,PacketType>(
row,
col,
row,
871 template<
int LoadMode,
typename PacketType>
874 return packet<LoadMode,PacketType>(
int(StorageOrder)==
ColMajor?idx:0,
int(StorageOrder)==
ColMajor?0:idx);
880 template<
typename Lhs,
typename Rhs,
int ProductKind,
int ProductTag>
885 using Base::m_diagImpl;
886 using Base::m_matImpl;
896 :
Base(xpr.lhs(), xpr.rhs().diagonal())
902 return m_matImpl.coeff(
row,
col) * m_diagImpl.coeff(
col);
906 template<
int LoadMode,
typename PacketType>
909 return this->
template packet_impl<LoadMode,PacketType>(
row,
col,
col,
913 template<
int LoadMode,
typename PacketType>
916 return packet<LoadMode,PacketType>(
int(StorageOrder)==
ColMajor?idx:0,
int(StorageOrder)==
ColMajor?0:idx);
930 template<
typename ExpressionType,
int S
ide,
bool Transposed,
typename ExpressionShape>
933 template<
typename ExpressionType,
int S
ide,
bool Transposed>
939 template<
typename Dest,
typename PermutationType>
940 static inline void run(Dest& dst,
const PermutationType& perm,
const ExpressionType& xpr)
953 while(r < perm.size())
956 while(r<perm.size() && mask[r]) r++;
963 for(
Index k=perm.indices().coeff(k0); k!=k0; k=perm.indices().coeff(k))
967 (dst,((Side==
OnTheLeft) ^ Transposed) ? k0 : kPrev));
976 for(
Index i = 0; i <
n; ++i)
979 (dst, ((Side==
OnTheLeft) ^ Transposed) ? perm.indices().coeff(i) : i)
984 (
mat, ((Side==
OnTheRight) ^ Transposed) ? perm.indices().coeff(i) : i);
990 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
993 template<
typename Dest>
1000 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1003 template<
typename Dest>
1010 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1013 template<
typename Dest>
1020 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1023 template<
typename Dest>
1041 template<
typename ExpressionType,
int S
ide,
bool Transposed,
typename ExpressionShape>
1047 template<
typename Dest,
typename TranspositionType>
1048 static inline void run(Dest& dst,
const TranspositionType& tr,
const ExpressionType& xpr)
1051 typedef typename TranspositionType::StorageIndex StorageIndex;
1058 for(
Index k=(Transposed?
size-1:0) ; Transposed?k>=0:k<
size ; Transposed?--k:++k)
1059 if(
Index(j=tr.coeff(k))!=k)
1061 if(Side==
OnTheLeft) dst.row(k).swap(dst.row(j));
1062 else if(Side==
OnTheRight) dst.col(k).swap(dst.col(j));
1067 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1070 template<
typename Dest>
1077 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1080 template<
typename Dest>
1088 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1091 template<
typename Dest>
1098 template<
typename Lhs,
typename Rhs,
int ProductTag,
typename MatrixShape>
1101 template<
typename Dest>
1112 #endif // EIGEN_PRODUCTEVALUATORS_H