12 #ifndef EIGEN_ASSIGN_EVALUATOR_H
13 #define EIGEN_ASSIGN_EVALUATOR_H
// Compile-time traits that select, for an assignment of SrcEvaluator into
// DstEvaluator through AssignFunc, the traversal strategy (Traversal) and the
// amount of loop unrolling (Unrolling).
// NOTE(review): this listing omits some original lines (braces, enum openers, and
// the definitions of DstIsRowMajor, SrcIsRowMajor and DstHasDirectAccess that the
// enumerators below refer to).
27 template <
typename DstEvaluator,
typename SrcEvaluator,
typename AssignFunc>
28 struct copy_using_evaluator_traits
30 typedef typename DstEvaluator::XprType Dst;
31 typedef typename Dst::Scalar DstScalar;
// Packet type chosen by find_best_packet from the destination scalar and its compile-time size.
33 typedef typename find_best_packet<DstScalar,Dst::SizeAtCompileTime>::type PacketType;
36 DstFlags = DstEvaluator::Flags,
37 SrcFlags = SrcEvaluator::Flags,
// Alignment reported by unpacket_traits for PacketType.
38 RequiredAlignment = unpacket_traits<PacketType>::alignment
43 DstAlignment = DstEvaluator::Alignment,
44 SrcAlignment = SrcEvaluator::Alignment,
// Combined through EIGEN_PLAIN_ENUM_MIN (presumably the smaller of the two alignments).
46 JointAlignment = EIGEN_PLAIN_ENUM_MIN(DstAlignment,SrcAlignment)
// Inner size: the full size for a vector; otherwise the column count when
// RowMajorBit is set in DstFlags, and the row count when it is not.
51 InnerSize = int(Dst::IsVectorAtCompileTime) ? int(Dst::SizeAtCompileTime)
52 : int(DstFlags)&
RowMajorBit ? int(Dst::ColsAtCompileTime)
53 : int(Dst::RowsAtCompileTime),
// Same selection as InnerSize, but using the Max* compile-time dimensions.
54 InnerMaxSize = int(Dst::IsVectorAtCompileTime) ? int(Dst::MaxSizeAtCompileTime)
55 : int(DstFlags)&
RowMajorBit ? int(Dst::MaxColsAtCompileTime)
56 : int(Dst::MaxRowsAtCompileTime),
// NOTE(review): despite its name this is read from Dst::SizeAtCompileTime, not
// from Dst::MaxSizeAtCompileTime -- confirm that is intended.
57 MaxSizeAtCompileTime = Dst::SizeAtCompileTime,
58 PacketSize = unpacket_traits<PacketType>::size
64 StorageOrdersAgree = (int(DstIsRowMajor) == int(SrcIsRowMajor)),
// Vectorization is only considered when storage orders agree and the functor
// advertises PacketAccess (a further conjunct sits on a line missing from this listing).
65 MightVectorize = StorageOrdersAgree
67 && (functor_traits<AssignFunc>::PacketAccess),
// Inner vectorization: fixed inner size that is a multiple of PacketSize, and
// both sides aligned at least as strictly as the packet requires.
68 MayInnerVectorize = MightVectorize && int(InnerSize)!=Dynamic && int(InnerSize)%int(PacketSize)==0
69 && int(JointAlignment)>=int(RequiredAlignment),
// Linear (single-index) access: storage orders agree and both flag sets carry LinearAccessBit.
70 MayLinearize = StorageOrdersAgree && (int(DstFlags) & int(SrcFlags) &
LinearAccessBit),
// Linear vectorization additionally needs direct access to the destination and
// either a sufficiently aligned destination or a Dynamic MaxSizeAtCompileTime.
71 MayLinearVectorize = MightVectorize && MayLinearize && DstHasDirectAccess
72 && ((
int(DstAlignment)>=
int(RequiredAlignment)) || MaxSizeAtCompileTime == Dynamic),
// Slice vectorization is only allowed when the inner max size is Dynamic or at
// least three packets long.
75 MaySliceVectorize = MightVectorize && DstHasDirectAccess
76 && (
int(InnerMaxSize)==Dynamic || int(InnerMaxSize)>=3*PacketSize)
// Pick the first applicable strategy, in this priority order:
// inner-vectorized, linear-vectorized, slice-vectorized, linear, default.
84 Traversal = int(MayInnerVectorize) ? int(InnerVectorizedTraversal)
85 : int(MayLinearVectorize) ? int(LinearVectorizedTraversal)
86 : int(MaySliceVectorize) ? int(SliceVectorizedTraversal)
87 : int(MayLinearize) ? int(LinearTraversal)
88 : int(DefaultTraversal),
// True when the chosen traversal is one of the three vectorized ones.
89 Vectorized = int(Traversal) == InnerVectorizedTraversal
90 || int(Traversal) == LinearVectorizedTraversal
91 || int(Traversal) == SliceVectorizedTraversal
// The unrolling budget is scaled by the packet size when the traversal is vectorized.
96 UnrollingLimit = EIGEN_UNROLLING_LIMIT * (Vectorized ? int(PacketSize) : 1),
// Complete unrolling: fixed total size, known read cost, and size * cost within the budget.
97 MayUnrollCompletely = int(Dst::SizeAtCompileTime) != Dynamic
98 && int(SrcEvaluator::CoeffReadCost) != Dynamic
99 && int(Dst::SizeAtCompileTime) * int(SrcEvaluator::CoeffReadCost) <= int(UnrollingLimit),
// Inner unrolling: the same test applied to the inner size only.
100 MayUnrollInner = int(InnerSize) != Dynamic
101 && int(SrcEvaluator::CoeffReadCost) != Dynamic
102 && int(InnerSize) * int(SrcEvaluator::CoeffReadCost) <= int(UnrollingLimit)
// Unrolling mode per traversal kind. Several branches of this conditional
// (presumably including the no-unrolling fallbacks) are on lines missing from
// this listing -- TODO confirm against the full file.
107 Unrolling = (int(Traversal) == int(InnerVectorizedTraversal) || int(Traversal) == int(DefaultTraversal))
109 int(MayUnrollCompletely) ? int(CompleteUnrolling)
110 : int(MayUnrollInner) ? int(InnerUnrolling)
113 : int(Traversal) == int(LinearVectorizedTraversal)
114 ? ( bool(MayUnrollCompletely) && (int(DstAlignment)>=int(RequiredAlignment)) ? int(CompleteUnrolling)
116 : int(Traversal) == int(LinearTraversal)
117 ? ( bool(MayUnrollCompletely) ? int(CompleteUnrolling)
// Diagnostic dump, compiled only when EIGEN_DEBUG_ASSIGN is defined: writes the
// two expression type names and the traits to std::cerr. The flags are emitted
// while the stream is in hexadecimal mode. EIGEN_DEBUG_VAR presumably prints a
// name/value pair -- its definition is not visible here.
122 #ifdef EIGEN_DEBUG_ASSIGN
125 std::cerr <<
"DstXpr: " <<
typeid(
typename DstEvaluator::XprType).name() << std::endl;
126 std::cerr <<
"SrcXpr: " <<
typeid(
typename SrcEvaluator::XprType).name() << std::endl;
127 std::cerr.setf(std::ios::hex, std::ios::basefield);
128 EIGEN_DEBUG_VAR(DstFlags)
129 EIGEN_DEBUG_VAR(SrcFlags)
130 std::cerr.unsetf(
std::ios::hex);
131 EIGEN_DEBUG_VAR(DstAlignment)
132 EIGEN_DEBUG_VAR(SrcAlignment)
133 EIGEN_DEBUG_VAR(RequiredAlignment)
134 EIGEN_DEBUG_VAR(JointAlignment)
135 EIGEN_DEBUG_VAR(InnerSize)
136 EIGEN_DEBUG_VAR(InnerMaxSize)
137 EIGEN_DEBUG_VAR(PacketSize)
138 EIGEN_DEBUG_VAR(StorageOrdersAgree)
139 EIGEN_DEBUG_VAR(MightVectorize)
140 EIGEN_DEBUG_VAR(MayLinearize)
141 EIGEN_DEBUG_VAR(MayInnerVectorize)
142 EIGEN_DEBUG_VAR(MayLinearVectorize)
143 EIGEN_DEBUG_VAR(MaySliceVectorize)
144 EIGEN_DEBUG_VAR(Traversal)
145 EIGEN_DEBUG_VAR(UnrollingLimit)
146 EIGEN_DEBUG_VAR(MayUnrollCompletely)
147 EIGEN_DEBUG_VAR(MayUnrollInner)
148 EIGEN_DEBUG_VAR(Unrolling)
// Compile-time unroller for the coefficient-by-coefficient traversal: assigns the
// coefficient at flat position Index, then instantiates itself with Index+1.
// The <Kernel, Stop, Stop> specialization ends the recursion.
162 template<
typename Kernel,
int Index,
int Stop>
163 struct copy_using_evaluator_DefaultTraversal_CompleteUnrolling
166 typedef typename Kernel::DstEvaluatorType DstEvaluatorType;
167 typedef typename DstEvaluatorType::XprType DstXprType;
// Split the flat Index into outer/inner positions using the destination's
// compile-time inner size.
170 outer = Index / DstXprType::InnerSizeAtCompileTime,
171 inner = Index % DstXprType::InnerSizeAtCompileTime
// Assign this coefficient, then hand over to the next index.
174 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
176 kernel.assignCoeffByOuterInner(outer, inner);
177 copy_using_evaluator_DefaultTraversal_CompleteUnrolling<Kernel, Index+1, Stop>::run(kernel);
// Terminating case (Index == Stop): nothing is left to assign, so run() is empty.
181 template<
typename Kernel,
int Stop>
182 struct copy_using_evaluator_DefaultTraversal_CompleteUnrolling<Kernel, Stop, Stop>
184 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel&) { }
// Compile-time unroller over the inner dimension only: for a run-time outer
// index, assigns the coefficient at inner position Index_ and recurses on Index_+1.
// The template parameter is spelled Index_ presumably because Index is used as a
// type in run()'s signature.
187 template<
typename Kernel,
int Index_,
int Stop>
188 struct copy_using_evaluator_DefaultTraversal_InnerUnrolling
190 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel, Index outer)
192 kernel.assignCoeffByOuterInner(outer, Index_);
193 copy_using_evaluator_DefaultTraversal_InnerUnrolling<Kernel, Index_+1, Stop>::run(kernel, outer);
// Terminating case (Index_ == Stop): the inner slice is complete, so run() is empty.
197 template<
typename Kernel,
int Stop>
198 struct copy_using_evaluator_DefaultTraversal_InnerUnrolling<Kernel, Stop, Stop>
200 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel&, Index) { }
// Compile-time unroller for linear (single-index) traversal: assigns the
// coefficient at linear position Index, then recurses on Index+1 until Stop.
207 template<
typename Kernel,
int Index,
int Stop>
208 struct copy_using_evaluator_LinearTraversal_CompleteUnrolling
210 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel& kernel)
212 kernel.assignCoeff(Index);
213 copy_using_evaluator_LinearTraversal_CompleteUnrolling<Kernel, Index+1, Stop>::run(kernel);
// Terminating case (Index == Stop): run() is empty.
217 template<
typename Kernel,
int Stop>
218 struct copy_using_evaluator_LinearTraversal_CompleteUnrolling<Kernel, Stop, Stop>
220 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel&) { }
// Compile-time unroller for packet-wise assignment over the whole expression:
// assigns one packet starting at flat position Index, then recurses with Index
// advanced by the packet size until Stop is reached.
227 template<
typename Kernel,
int Index,
int Stop>
228 struct copy_using_evaluator_innervec_CompleteUnrolling
231 typedef typename Kernel::DstEvaluatorType DstEvaluatorType;
232 typedef typename DstEvaluatorType::XprType DstXprType;
233 typedef typename Kernel::PacketType PacketType;
// Flat Index split into outer/inner positions; JointAlignment is forwarded from
// the kernel's assignment traits and used as the load mode below.
236 outer = Index / DstXprType::InnerSizeAtCompileTime,
237 inner = Index % DstXprType::InnerSizeAtCompileTime,
238 JointAlignment = Kernel::AssignmentTraits::JointAlignment
241 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
// Store mode is Aligned; load mode is JointAlignment.
243 kernel.template assignPacketByOuterInner<Aligned, JointAlignment, PacketType>(outer, inner);
// The step is the number of coefficients in one PacketType.
244 enum { NextIndex = Index + unpacket_traits<PacketType>::size };
245 copy_using_evaluator_innervec_CompleteUnrolling<Kernel, NextIndex, Stop>::run(kernel);
// Terminating case (Index == Stop): run() is empty.
249 template<
typename Kernel,
int Stop>
250 struct copy_using_evaluator_innervec_CompleteUnrolling<Kernel, Stop, Stop>
252 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel&) { }
// Compile-time unroller for packet-wise assignment along the inner dimension:
// for a run-time outer index, assigns one packet at inner position Index_ and
// recurses with Index_ advanced by the packet size.
255 template<
typename Kernel,
int Index_,
int Stop>
256 struct copy_using_evaluator_innervec_InnerUnrolling
258 typedef typename Kernel::PacketType PacketType;
259 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel, Index outer)
// NOTE(review): both store and load modes are Aligned here, whereas the
// complete-unrolling variant passes JointAlignment as the load mode -- confirm
// the difference is intended.
261 kernel.template assignPacketByOuterInner<Aligned, Aligned, PacketType>(outer, Index_);
262 enum { NextIndex = Index_ + unpacket_traits<PacketType>::size };
263 copy_using_evaluator_innervec_InnerUnrolling<Kernel, NextIndex, Stop>::run(kernel, outer);
// Terminating case (Index_ == Stop): run() is empty.
267 template<
typename Kernel,
int Stop>
268 struct copy_using_evaluator_innervec_InnerUnrolling<Kernel, Stop, Stop>
270 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &, Index) { }
// Primary template of the assignment loop; it is only declared here and is
// implemented through partial specializations on (Traversal, Unrolling).
// Both parameters default to the values computed by Kernel::AssignmentTraits.
279 template<
typename Kernel,
280 int Traversal = Kernel::AssignmentTraits::Traversal,
281 int Unrolling = Kernel::AssignmentTraits::Unrolling>
282 struct dense_assignment_loop;
// Default traversal without unrolling: a plain nested loop over outer and inner
// indices, assigning one coefficient per iteration.
288 template<
typename Kernel>
289 struct dense_assignment_loop<Kernel, DefaultTraversal, NoUnrolling>
291 EIGEN_DEVICE_FUNC
static void run(Kernel &kernel)
293 for(Index outer = 0; outer < kernel.outerSize(); ++outer) {
294 for(Index inner = 0; inner < kernel.innerSize(); ++inner) {
295 kernel.assignCoeffByOuterInner(outer, inner);
// Default traversal, completely unrolled: delegates to the compile-time unroller
// over the range [0, SizeAtCompileTime) of the destination expression.
301 template<
typename Kernel>
302 struct dense_assignment_loop<Kernel, DefaultTraversal, CompleteUnrolling>
304 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
306 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
307 copy_using_evaluator_DefaultTraversal_CompleteUnrolling<Kernel, 0, DstXprType::SizeAtCompileTime>::run(kernel);
// Default traversal with inner unrolling: a run-time loop over the outer index,
// each iteration expanding the inner dimension at compile time.
311 template<
typename Kernel>
312 struct dense_assignment_loop<Kernel, DefaultTraversal, InnerUnrolling>
// StorageIndex is not used by the code visible in this block.
314 typedef typename Kernel::StorageIndex StorageIndex;
315 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
317 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
// Read the outer size once, before the loop.
319 const Index outerSize = kernel.outerSize();
320 for(Index outer = 0; outer < outerSize; ++outer)
321 copy_using_evaluator_DefaultTraversal_InnerUnrolling<Kernel, 0, DstXprType::InnerSizeAtCompileTime>::run(kernel, outer);
// Scalar helper loop used around the packet loop of the linear vectorized
// traversal. This primary template's run() is empty; the actual loop lives in
// the <false> specialization, so the primary is what gets used when the template
// argument is true (nothing to fix up).
333 template <
bool IsAligned = false>
334 struct unaligned_dense_assignment_loop
337 template <
typename Kernel>
338 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel&, Index, Index) {}
// Specialization for IsAligned == false: assigns coefficients one at a time over
// the linear index range [start, end).
// NOTE(review): two alternative run() signatures are visible (one marked
// EIGEN_DONT_INLINE, one EIGEN_STRONG_INLINE). The preprocessor lines that
// presumably select between them, and the tail of each parameter list, are
// missing from this listing -- TODO confirm against the full file.
342 struct unaligned_dense_assignment_loop<false>
348 template <
typename Kernel>
349 static EIGEN_DONT_INLINE
void run(Kernel &kernel,
353 template <
typename Kernel>
354 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel,
359 for (Index index = start; index < end; ++index)
360 kernel.assignCoeff(index);
// Linear vectorized traversal without unrolling. The linear index range is
// processed in three parts: a scalar head [0, alignedStart), a packet loop over
// [alignedStart, alignedEnd), and a scalar tail [alignedEnd, size).
364 template<
typename Kernel>
365 struct dense_assignment_loop<Kernel, LinearVectorizedTraversal, NoUnrolling>
367 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
369 const Index size = kernel.size();
370 typedef typename Kernel::Scalar Scalar;
371 typedef typename Kernel::PacketType PacketType;
// dstIsAligned: the destination's static alignment already meets the requirement.
// dstAlignment: store mode used in the packet loop; the requested alignment when
// packet_traits<Scalar>::AlignedOnScalar is set, else the destination's static alignment.
// srcAlignment: load mode used in the packet loop.
373 requestedAlignment = Kernel::AssignmentTraits::RequiredAlignment,
374 packetSize = unpacket_traits<PacketType>::size,
375 dstIsAligned = int(Kernel::AssignmentTraits::DstAlignment)>=int(requestedAlignment),
376 dstAlignment = packet_traits<Scalar>::AlignedOnScalar ? int(requestedAlignment)
377 : int(Kernel::AssignmentTraits::DstAlignment),
378 srcAlignment = Kernel::AssignmentTraits::JointAlignment
// A statically aligned destination starts at 0; otherwise first_aligned is asked
// (presumably for the first index whose address satisfies requestedAlignment).
380 const Index alignedStart = dstIsAligned ? 0 : internal::first_aligned<requestedAlignment>(&kernel.dstEvaluator().coeffRef(0), size);
// Largest end such that [alignedStart, alignedEnd) holds a whole number of packets.
381 const Index alignedEnd = alignedStart + ((size-alignedStart)/packetSize)*packetSize;
// Scalar head; instantiates the empty primary template when dstIsAligned is non-zero.
383 unaligned_dense_assignment_loop<dstIsAligned!=0>::run(kernel, 0, alignedStart);
385 for(Index index = alignedStart; index < alignedEnd; index += packetSize)
386 kernel.template assignPacket<dstAlignment, srcAlignment, PacketType>(index);
// Scalar tail; the default template argument (false) selects the real loop.
388 unaligned_dense_assignment_loop<>::run(kernel, alignedEnd, size);
392 template<
typename Kernel>
393 struct dense_assignment_loop<Kernel, LinearVectorizedTraversal, CompleteUnrolling>
395 typedef typename Kernel::StorageIndex StorageIndex;
396 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
398 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
400 enum { size = DstXprType::SizeAtCompileTime,
401 packetSize = packet_traits<typename Kernel::Scalar>::size,
402 alignedSize = (size/packetSize)*packetSize };
404 copy_using_evaluator_innervec_CompleteUnrolling<Kernel, 0, alignedSize>::run(kernel);
405 copy_using_evaluator_DefaultTraversal_CompleteUnrolling<Kernel, alignedSize, size>::run(kernel);
// Inner vectorized traversal without unrolling: nested run-time loops where the
// inner index advances by one packet per iteration, with aligned store and load.
413 template<
typename Kernel>
414 struct dense_assignment_loop<Kernel, InnerVectorizedTraversal, NoUnrolling>
416 typedef typename Kernel::PacketType PacketType;
417 EIGEN_DEVICE_FUNC
static inline void run(Kernel &kernel)
419 const Index innerSize = kernel.innerSize();
420 const Index outerSize = kernel.outerSize();
421 const Index packetSize = unpacket_traits<PacketType>::size;
422 for(Index outer = 0; outer < outerSize; ++outer)
// No scalar remainder loop follows: the code relies on innerSize being covered
// by whole packets.
423 for(Index inner = 0; inner < innerSize; inner+=packetSize)
424 kernel.template assignPacketByOuterInner<Aligned, Aligned, PacketType>(outer, inner);
// Inner vectorized traversal, completely unrolled: delegates to the packet-wise
// compile-time unroller over [0, SizeAtCompileTime).
428 template<
typename Kernel>
429 struct dense_assignment_loop<Kernel, InnerVectorizedTraversal, CompleteUnrolling>
431 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
433 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
434 copy_using_evaluator_innervec_CompleteUnrolling<Kernel, 0, DstXprType::SizeAtCompileTime>::run(kernel);
// Inner vectorized traversal with inner unrolling: a run-time loop over the outer
// index, each iteration expanding the packet-wise inner loop at compile time.
438 template<
typename Kernel>
439 struct dense_assignment_loop<Kernel, InnerVectorizedTraversal, InnerUnrolling>
// StorageIndex is not used by the code visible in this block.
441 typedef typename Kernel::StorageIndex StorageIndex;
442 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
444 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
445 const Index outerSize = kernel.outerSize();
446 for(Index outer = 0; outer < outerSize; ++outer)
447 copy_using_evaluator_innervec_InnerUnrolling<Kernel, 0, DstXprType::InnerSizeAtCompileTime>::run(kernel, outer);
// Linear traversal without unrolling: a single run-time loop over the linear
// index, assigning one coefficient per iteration.
455 template<
typename Kernel>
456 struct dense_assignment_loop<Kernel, LinearTraversal, NoUnrolling>
458 EIGEN_DEVICE_FUNC
static inline void run(Kernel &kernel)
460 const Index size = kernel.size();
461 for(Index i = 0; i < size; ++i)
462 kernel.assignCoeff(i);
// Linear traversal, completely unrolled: delegates to the linear compile-time
// unroller over [0, SizeAtCompileTime).
466 template<
typename Kernel>
467 struct dense_assignment_loop<Kernel, LinearTraversal, CompleteUnrolling>
469 EIGEN_DEVICE_FUNC
static EIGEN_STRONG_INLINE
void run(Kernel &kernel)
471 typedef typename Kernel::DstEvaluatorType::XprType DstXprType;
472 copy_using_evaluator_LinearTraversal_CompleteUnrolling<Kernel, 0, DstXprType::SizeAtCompileTime>::run(kernel);
// Slice vectorized traversal without unrolling: each outer slice is processed as
// a scalar head, a packet loop and a scalar tail, and the position of the first
// packet is re-derived for every slice.
480 template<
typename Kernel>
481 struct dense_assignment_loop<Kernel, SliceVectorizedTraversal, NoUnrolling>
483 EIGEN_DEVICE_FUNC
static inline void run(Kernel &kernel)
485 typedef typename Kernel::Scalar Scalar;
486 typedef typename Kernel::PacketType PacketType;
// alignable: either packet_traits<Scalar>::AlignedOnScalar is set or the static
// destination alignment is at least sizeof(Scalar).
// dstIsAligned: the static destination alignment already meets the request.
// dstAlignment: store mode for the packet loop.
488 packetSize = unpacket_traits<PacketType>::size,
489 requestedAlignment = int(Kernel::AssignmentTraits::RequiredAlignment),
490 alignable = packet_traits<Scalar>::AlignedOnScalar || int(Kernel::AssignmentTraits::DstAlignment)>=
sizeof(Scalar),
491 dstIsAligned =
int(Kernel::AssignmentTraits::DstAlignment)>=int(requestedAlignment),
492 dstAlignment = alignable ? int(requestedAlignment)
493 : int(Kernel::AssignmentTraits::DstAlignment)
495 const Scalar *dst_ptr = &kernel.dstEvaluator().coeffRef(0,0);
// If the destination is not statically aligned and its address is not even a
// multiple of sizeof(Scalar), fall back to the plain coefficient-wise loop.
496 if((!
bool(dstIsAligned)) && (
size_t(dst_ptr) %
sizeof(Scalar))>0)
499 return dense_assignment_loop<Kernel,DefaultTraversal,NoUnrolling>::run(kernel);
// Used as a bit mask below, which assumes packetSize is a power of two.
501 const Index packetAlignedMask = packetSize - 1;
502 const Index innerSize = kernel.innerSize();
503 const Index outerSize = kernel.outerSize();
// Amount by which the first packet position moves from one outer slice to the
// next, derived from outerStride modulo packetSize; zero when not alignable.
504 const Index alignedStep = alignable ? (packetSize - kernel.outerStride() % packetSize) & packetAlignedMask : 0;
// First packet position in the first slice; 0 when not alignable or already aligned.
505 Index alignedStart = ((!alignable) ||
bool(dstIsAligned)) ? 0 : internal::first_aligned<requestedAlignment>(dst_ptr, innerSize);
507 for(Index outer = 0; outer < outerSize; ++outer)
// End of the packet region: alignedStart plus the largest multiple of packetSize that fits.
509 const Index alignedEnd = alignedStart + ((innerSize-alignedStart) & ~packetAlignedMask);
// Scalar head of this slice.
511 for(Index inner = 0; inner<alignedStart ; ++inner)
512 kernel.assignCoeffByOuterInner(outer, inner);
// Packet body of this slice; the source is always loaded as Unaligned.
515 for(Index inner = alignedStart; inner<alignedEnd; inner+=packetSize)
516 kernel.template assignPacketByOuterInner<dstAlignment, Unaligned, PacketType>(outer, inner);
// Scalar tail of this slice.
519 for(Index inner = alignedEnd; inner<innerSize ; ++inner)
520 kernel.assignCoeffByOuterInner(outer, inner);
// First packet position for the next slice, clamped to innerSize.
522 alignedStart = std::min<Index>((alignedStart+alignedStep)%packetSize, innerSize);
// Kernel object handed to dense_assignment_loop: it bundles the destination
// evaluator, the source evaluator, the assignment functor and the destination
// expression, and exposes the per-coefficient and per-packet assignment steps.
// All four are stored as references (see the members at the end), so the
// referenced objects must outlive the kernel.
537 template<
typename DstEvaluatorTypeT,
typename SrcEvaluatorTypeT,
typename Functor,
int Version = Specialized>
538 class generic_dense_assignment_kernel
541 typedef typename DstEvaluatorTypeT::XprType DstXprType;
542 typedef typename SrcEvaluatorTypeT::XprType SrcXprType;
545 typedef DstEvaluatorTypeT DstEvaluatorType;
546 typedef SrcEvaluatorTypeT SrcEvaluatorType;
547 typedef typename DstEvaluatorType::Scalar Scalar;
548 typedef typename DstEvaluatorType::StorageIndex StorageIndex;
// Traits that decide traversal and unrolling for this (dst, src, functor) triple.
549 typedef copy_using_evaluator_traits<DstEvaluatorTypeT, SrcEvaluatorTypeT, Functor> AssignmentTraits;
550 typedef typename AssignmentTraits::PacketType PacketType;
// Binds the four references; when EIGEN_DEBUG_ASSIGN is defined the traits are
// also dumped through AssignmentTraits::debug().
553 EIGEN_DEVICE_FUNC generic_dense_assignment_kernel(DstEvaluatorType &dst,
const SrcEvaluatorType &src,
const Functor &func, DstXprType& dstExpr)
554 : m_dst(dst), m_src(src), m_functor(func), m_dstExpr(dstExpr)
556 #ifdef EIGEN_DEBUG_ASSIGN
557 AssignmentTraits::debug();
// Size queries, all forwarded to the destination expression.
561 EIGEN_DEVICE_FUNC Index size()
const {
return m_dstExpr.size(); }
562 EIGEN_DEVICE_FUNC Index innerSize()
const {
return m_dstExpr.innerSize(); }
563 EIGEN_DEVICE_FUNC Index outerSize()
const {
return m_dstExpr.outerSize(); }
564 EIGEN_DEVICE_FUNC Index rows()
const {
return m_dstExpr.rows(); }
565 EIGEN_DEVICE_FUNC Index cols()
const {
return m_dstExpr.cols(); }
566 EIGEN_DEVICE_FUNC Index outerStride()
const {
return m_dstExpr.outerStride(); }
// Accessors for the bound destination expression and the two evaluators.
569 EIGEN_DEVICE_FUNC DstXprType& dstExpression()
const {
return m_dstExpr; }
571 EIGEN_DEVICE_FUNC DstEvaluatorType& dstEvaluator() {
return m_dst; }
572 EIGEN_DEVICE_FUNC
const SrcEvaluatorType& srcEvaluator()
const {
return m_src; }
// Assign one coefficient addressed by (row, col) through the functor.
575 EIGEN_DEVICE_FUNC
void assignCoeff(Index row, Index col)
577 m_functor.assignCoeff(m_dst.coeffRef(row,col), m_src.coeff(row,col));
// Assign one coefficient addressed by a linear index through the functor.
581 EIGEN_DEVICE_FUNC
void assignCoeff(Index index)
583 m_functor.assignCoeff(m_dst.coeffRef(index), m_src.coeff(index));
// Assign one coefficient addressed by (outer, inner); the pair is first mapped
// to (row, col).
587 EIGEN_DEVICE_FUNC
void assignCoeffByOuterInner(Index outer, Index inner)
589 Index row = rowIndexByOuterInner(outer, inner);
590 Index col = colIndexByOuterInner(outer, inner);
591 assignCoeff(row, col);
// Assign one packet starting at (row, col). StoreMode is passed to the functor's
// store, LoadMode to the source evaluator's packet load.
595 template<
int StoreMode,
int LoadMode,
typename PacketType>
596 EIGEN_DEVICE_FUNC
void assignPacket(Index row, Index col)
598 m_functor.template assignPacket<StoreMode>(&m_dst.coeffRef(row,col), m_src.template packet<LoadMode,PacketType>(row,col));
// Assign one packet starting at a linear index.
601 template<
int StoreMode,
int LoadMode,
typename PacketType>
602 EIGEN_DEVICE_FUNC
void assignPacket(Index index)
604 m_functor.template assignPacket<StoreMode>(&m_dst.coeffRef(index), m_src.template packet<LoadMode,PacketType>(index));
// Assign one packet addressed by (outer, inner), mapped to (row, col) first.
607 template<
int StoreMode,
int LoadMode,
typename PacketType>
608 EIGEN_DEVICE_FUNC
void assignPacketByOuterInner(Index outer, Index inner)
610 Index row = rowIndexByOuterInner(outer, inner);
611 Index col = colIndexByOuterInner(outer, inner);
612 assignPacket<StoreMode,LoadMode,PacketType>(row, col);
// Row index for an (outer, inner) pair: 0 for a single-row destination, inner
// for a single-column one, outer when RowMajorBit is set in the destination flags.
// The final branch is on a line missing from this listing -- TODO confirm.
615 EIGEN_DEVICE_FUNC
static Index rowIndexByOuterInner(Index outer, Index inner)
617 typedef typename DstEvaluatorType::ExpressionTraits Traits;
618 return int(Traits::RowsAtCompileTime) == 1 ? 0
619 : int(Traits::ColsAtCompileTime) == 1 ? inner
620 : int(DstEvaluatorType::Flags)&RowMajorBit ? outer
// Column index for an (outer, inner) pair: 0 for a single-column destination,
// inner for a single-row one, inner when RowMajorBit is set.
// The final branch is on a line missing from this listing -- TODO confirm.
624 EIGEN_DEVICE_FUNC
static Index colIndexByOuterInner(Index outer, Index inner)
626 typedef typename DstEvaluatorType::ExpressionTraits Traits;
627 return int(Traits::ColsAtCompileTime) == 1 ? 0
628 : int(Traits::RowsAtCompileTime) == 1 ? inner
629 : int(DstEvaluatorType::Flags)&RowMajorBit ? inner
// Non-owning references to the evaluators, the functor and the destination expression.
634 DstEvaluatorType& m_dst;
635 const SrcEvaluatorType& m_src;
636 const Functor &m_functor;
638 DstXprType& m_dstExpr;
// Runs a dense assignment of src into dst through func: builds one evaluator per
// side, wraps them in a generic_dense_assignment_kernel and runs the
// dense_assignment_loop selected by the kernel's traits.
// dst and src must already have identical dimensions (asserted; no resizing here).
645 template<
typename DstXprType,
typename SrcXprType,
typename Functor>
646 EIGEN_DEVICE_FUNC
void call_dense_assignment_loop(
const DstXprType& dst,
const SrcXprType& src,
const Functor &func)
648 eigen_assert(dst.rows() == src.rows() && dst.cols() == src.cols());
650 typedef evaluator<DstXprType> DstEvaluatorType;
651 typedef evaluator<SrcXprType> SrcEvaluatorType;
653 DstEvaluatorType dstEvaluator(dst);
654 SrcEvaluatorType srcEvaluator(src);
656 typedef generic_dense_assignment_kernel<DstEvaluatorType,SrcEvaluatorType,Functor> Kernel;
// dst arrives as a const reference although it is written to; const_cast_derived()
// presumably strips the const so the kernel receives a mutable DstXprType&.
657 Kernel kernel(dstEvaluator, srcEvaluator, func, dst.const_cast_derived());
659 dense_assignment_loop<Kernel>::run(kernel);
// Convenience overload: same as the three-argument version, using
// internal::assign_op on the destination scalar type as the functor.
662 template<
typename DstXprType,
typename SrcXprType>
663 EIGEN_DEVICE_FUNC
void call_dense_assignment_loop(
const DstXprType& dst,
const SrcXprType& src)
665 call_dense_assignment_loop(dst, src, internal::assign_op<typename DstXprType::Scalar>());
// Maps a (destination shape, source shape) pair to an assignment-kind tag type.
675 template<
typename DstShape,
typename SrcShape>
struct AssignmentKind;
// Tag types naming the two assignment kinds defined here.
678 struct Dense2Dense {};
679 struct EigenBase2EigenBase {};
// Any shape pair maps to EigenBase2EigenBase unless a specialization says otherwise.
681 template<
typename,
typename>
struct AssignmentKind {
typedef EigenBase2EigenBase Kind; };
// Dense-to-dense assignments get their own kind.
682 template<>
struct AssignmentKind<DenseShape,DenseShape> {
typedef Dense2Dense Kind; };
// Template parameter list whose declared entity is on a line missing from this
// listing; presumably the primary Assignment template, given the partial
// specializations that appear later in the file -- TODO confirm.
// Kind defaults to the AssignmentKind of the two expressions' evaluator shapes;
// Scalar defaults to the destination's scalar type.
685 template<
typename DstXprType,
typename SrcXprType,
typename Functor,
686 typename Kind =
typename AssignmentKind< typename evaluator_traits<DstXprType>::Shape ,
typename evaluator_traits<SrcXprType>::Shape >::Kind,
687 typename Scalar =
typename DstXprType::Scalar>
// Assigns src to dst with plain assignment semantics: forwards to the
// three-argument call_assignment with internal::assign_op as the functor.
696 template<
typename Dst,
typename Src>
697 EIGEN_DEVICE_FUNC
void call_assignment(Dst& dst,
const Src& src)
699 call_assignment(dst, src, internal::assign_op<typename Dst::Scalar>());
// Same as the overload taking Dst&, for a destination passed by const reference.
701 template<
typename Dst,
typename Src>
702 EIGEN_DEVICE_FUNC
void call_assignment(
const Dst& dst,
const Src& src)
704 call_assignment(dst, src, internal::assign_op<typename Dst::Scalar>());
// Overload enabled when evaluator_traits<Src>::AssumeAliasing == 1: the source is
// first evaluated into a temporary of its plain matrix type, and that temporary
// is then assigned to dst without further aliasing precautions.
708 template<
typename Dst,
typename Src,
typename Func>
709 EIGEN_DEVICE_FUNC
void call_assignment(Dst& dst,
const Src& src,
const Func& func,
typename enable_if<evaluator_traits<Src>::AssumeAliasing==1,
void*>::type = 0)
711 typename plain_matrix_type<Src>::type tmp(src);
712 call_assignment_no_alias(dst, tmp, func);
// Overload enabled when evaluator_traits<Src>::AssumeAliasing == 0: the source is
// assigned to dst directly, with no intermediate temporary.
715 template<
typename Dst,
typename Src,
typename Func>
716 EIGEN_DEVICE_FUNC
void call_assignment(Dst& dst,
const Src& src,
const Func& func,
typename enable_if<evaluator_traits<Src>::AssumeAliasing==0,
void*>::type = 0)
718 call_assignment_no_alias(dst, src, func);
// Overload for a NoAlias-wrapped destination passed by const reference: unwraps
// it with expression() and assigns directly, whatever the source's AssumeAliasing says.
724 template<
typename Dst,
template <
typename>
class StorageBase,
typename Src,
typename Func>
725 EIGEN_DEVICE_FUNC
void call_assignment(
const NoAlias<Dst,StorageBase>& dst,
const Src& src,
const Func& func)
727 call_assignment_no_alias(dst.expression(), src, func);
// Overload for a NoAlias-wrapped destination passed by non-const reference;
// behaves like the const-reference overload.
729 template<
typename Dst,
template <
typename>
class StorageBase,
typename Src,
typename Func>
730 EIGEN_DEVICE_FUNC
void call_assignment(NoAlias<Dst,StorageBase>& dst,
const Src& src,
const Func& func)
732 call_assignment_no_alias(dst.expression(), src, func);
// Assigns src to dst assuming they do not alias. Resizes dst to match src,
// transparently transposes dst for the row-vector/column-vector mismatch case,
// then dispatches to Assignment<...>::run.
736 template<
typename Dst,
typename Src,
typename Func>
737 EIGEN_DEVICE_FUNC
void call_assignment_no_alias(Dst& dst,
const Src& src,
const Func& func)
// A transpose is needed when one side is a compile-time row vector, the other a
// compile-time column vector, and dst is not 1x1. (The operator joining the two
// parenthesised tests is on a line missing from this listing.)
740 NeedToTranspose = ( (int(Dst::RowsAtCompileTime) == 1 && int(Src::ColsAtCompileTime) == 1)
743 (
int(Dst::ColsAtCompileTime) == 1 && int(Src::RowsAtCompileTime) == 1))
744 && int(Dst::SizeAtCompileTime) != 1
// Target dimensions of dst, swapped when a transpose is needed.
747 Index dstRows = NeedToTranspose ? src.cols() : src.rows();
748 Index dstCols = NeedToTranspose ? src.rows() : src.cols();
// Resize only when the current dimensions differ.
749 if((dst.rows()!=dstRows) || (dst.cols()!=dstCols))
750 dst.resize(dstRows, dstCols);
// Either a Transpose<Dst> view of dst or dst itself (held by reference).
752 typedef typename internal::conditional<NeedToTranspose, Transpose<Dst>, Dst>::type ActualDstTypeCleaned;
753 typedef typename internal::conditional<NeedToTranspose, Transpose<Dst>, Dst&>::type ActualDstType;
754 ActualDstType actualDst(dst);
// Compile-time checks: dst must be an lvalue and the effective sizes must match.
757 EIGEN_STATIC_ASSERT_LVALUE(Dst)
758 EIGEN_STATIC_ASSERT_SAME_MATRIX_SIZE(ActualDstTypeCleaned,Src)
765 Assignment<ActualDstTypeCleaned,Src,Func>::run(actualDst, src, func);
// Convenience overload using internal::assign_op on the destination scalar type.
767 template<typename Dst, typename Src>
768 EIGEN_DEVICE_FUNC
void call_assignment_no_alias(Dst& dst, const Src& src)
770 call_assignment_no_alias(dst, src, internal::assign_op<typename Dst::Scalar>());
// Like call_assignment_no_alias, but without the automatic transpose: dst is
// resized to src's exact dimensions and the assignment is dispatched as is.
773 template<
typename Dst,
typename Src,
typename Func>
774 EIGEN_DEVICE_FUNC
void call_assignment_no_alias_no_transpose(Dst& dst,
const Src& src,
const Func& func)
776 Index dstRows = src.rows();
777 Index dstCols = src.cols();
// Resize only when the current dimensions differ.
778 if((dst.rows()!=dstRows) || (dst.cols()!=dstCols))
779 dst.resize(dstRows, dstCols);
// Compile-time checks: dst must be an lvalue and the static sizes must match.
782 EIGEN_STATIC_ASSERT_LVALUE(Dst)
783 EIGEN_STATIC_ASSERT_SAME_MATRIX_SIZE(Dst,Src)
785 Assignment<Dst,Src,Func>::run(dst, src, func);
// Convenience overload using internal::assign_op on the destination scalar type.
787 template<typename Dst, typename Src>
788 EIGEN_DEVICE_FUNC
void call_assignment_no_alias_no_transpose(Dst& dst, const Src& src)
790 call_assignment_no_alias_no_transpose(dst, src, internal::assign_op<typename Dst::Scalar>());
// Forward declaration only; the definition is not part of this listing. It is
// called from the dense-to-dense Assignment::run unless EIGEN_NO_DEBUG is defined.
794 template<
typename Dst,
typename Src>
void check_for_aliasing(
const Dst &dst,
const Src &src);
// Dense-to-dense assignment for any functor: checks that the dimensions match,
// runs the aliasing check unless EIGEN_NO_DEBUG is defined, then runs the dense
// assignment loop.
797 template<
typename DstXprType,
typename SrcXprType,
typename Functor,
typename Scalar>
798 struct Assignment<DstXprType, SrcXprType, Functor, Dense2Dense, Scalar>
800 EIGEN_DEVICE_FUNC
static void run(DstXprType &dst,
const SrcXprType &src,
const Functor &func)
// No resizing happens here; the caller must have sized dst already.
802 eigen_assert(dst.rows() == src.rows() && dst.cols() == src.cols());
804 #ifndef EIGEN_NO_DEBUG
805 internal::check_for_aliasing(dst, src);
808 call_dense_assignment_loop(dst, src, func);
// Generic EigenBase-to-EigenBase assignment. run() only accepts
// internal::assign_op as the functor (the parameter is unnamed and unused in
// the visible code).
// NOTE(review): only the dimension assertion is visible; the statement that
// performs the assignment is on a line missing from this listing.
814 template<
typename DstXprType,
typename SrcXprType,
typename Functor,
typename Scalar>
815 struct Assignment<DstXprType, SrcXprType, Functor, EigenBase2EigenBase, Scalar>
817 EIGEN_DEVICE_FUNC
static void run(DstXprType &dst,
const SrcXprType &src,
const internal::assign_op<typename DstXprType::Scalar> &)
819 eigen_assert(dst.rows() == src.rows() && dst.cols() == src.cols());
828 #endif // EIGEN_ASSIGN_EVALUATOR_H
const unsigned int DirectAccessBit
Definition: Constants.h:141
Definition: StdDeque.h:58
const unsigned int RowMajorBit
Definition: Constants.h:53
Definition: Eigen_Colamd.h:54
const unsigned int ActualPacketAccessBit
Definition: Constants.h:91
const unsigned int LinearAccessBit
Definition: Constants.h:116