35#ifndef _BLAZE_MATH_EXPRESSIONS_DVECDVECMULTEXPR_H_
36#define _BLAZE_MATH_EXPRESSIONS_DVECDVECMULTEXPR_H_
97 :
public VecVecMultExpr< DenseVector< DVecDVecMultExpr<VT1,VT2,TF>, TF > >
119 static constexpr bool returnExpr = ( !IsTemporary_v<RN1> && !IsTemporary_v<RN2> );
134 ( RequiresEvaluation_v<VT1> || RequiresEvaluation_v<VT2> || !
returnExpr );
138 template<
typename VT >
139 static constexpr bool UseAssign_v =
useAssign;
151 template<
typename VT >
152 static constexpr bool UseSMPAssign_v =
153 ( ( !VT1::smpAssignable || !VT2::smpAssignable ) &&
useAssign );
297 return (*
left_) * (*right_);
306 inline auto load() const noexcept {
435 ( VT1::simdEnabled && VT2::simdEnabled && HasSIMDMult_v<ET1,ET2> );
438 static constexpr bool smpAssignable = ( VT1::smpAssignable && VT2::smpAssignable );
480 if( index >=
lhs_.size() ) {
483 return (*
this)[index];
496 return lhs_.load( index ) *
rhs_.load( index );
525 inline size_t size() const noexcept {
556 template<
typename T >
557 inline bool canAlias(
const T* alias )
const noexcept {
558 return ( IsExpression_v<VT1> && ( RequiresEvaluation_v<VT1> ?
lhs_.isAliased( alias ) :
lhs_.canAlias( alias ) ) ) ||
559 ( IsExpression_v<VT2> && ( RequiresEvaluation_v<VT2> ?
rhs_.isAliased( alias ) :
rhs_.canAlias( alias ) ) );
569 template<
typename T >
570 inline bool isAliased(
const T* alias )
const noexcept {
571 return (
lhs_.isAliased( alias ) ||
rhs_.isAliased( alias ) );
581 return lhs_.isAligned() &&
rhs_.isAligned();
591 return lhs_.canSMPAssign() ||
rhs_.canSMPAssign() ||
592 (
size() > SMP_DVECDVECMULT_THRESHOLD );
617 template<
typename VT >
625 if( !IsComputation_v<VT1> &&
isSame( *lhs, rhs.lhs_ ) ) {
626 multAssign( *lhs, rhs.rhs_ );
631 assign( *lhs, a * b );
651 template<
typename VT >
659 if( !IsComputation_v<VT1> &&
isSame( *lhs, rhs.lhs_ ) ) {
660 multAssign( *lhs, rhs.rhs_ );
662 else if( !IsComputation_v<VT2> &&
isSame( *lhs, rhs.rhs_ ) ) {
663 multAssign( *lhs, rhs.lhs_ );
665 else if( !RequiresEvaluation_v<VT2> ) {
666 assign ( *lhs, rhs.rhs_ );
667 multAssign( *lhs, rhs.lhs_ );
670 assign ( *lhs, rhs.lhs_ );
671 multAssign( *lhs, rhs.rhs_ );
691 template<
typename VT >
692 friend inline auto assign( SparseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
693 -> EnableIf_t< UseAssign_v<VT> >
723 template<
typename VT >
724 friend inline auto addAssign( DenseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
725 -> EnableIf_t< UseAssign_v<VT> >
736 addAssign( *lhs, tmp );
759 template<
typename VT >
760 friend inline auto subAssign( DenseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
761 -> EnableIf_t< UseAssign_v<VT> >
772 subAssign( *lhs, tmp );
796 template<
typename VT >
797 friend inline auto multAssign( DenseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
798 -> EnableIf_t< UseAssign_v<VT> && !IsCommutative_v<VT1,VT2> >
809 multAssign( *lhs, tmp );
829 template<
typename VT >
830 friend inline auto multAssign( DenseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
831 -> EnableIf_t< UseAssign_v<VT> && IsCommutative_v<VT1,VT2> >
837 if( !RequiresEvaluation_v<VT2> ) {
838 multAssign( *lhs, rhs.rhs_ );
839 multAssign( *lhs, rhs.lhs_ );
842 multAssign( *lhs, rhs.lhs_ );
843 multAssign( *lhs, rhs.rhs_ );
867 template<
typename VT >
868 friend inline auto divAssign( DenseVector<VT,TF>& lhs,
const DVecDVecMultExpr& rhs )
869 -> EnableIf_t< UseAssign_v<VT> >
880 divAssign( *lhs, tmp );
904 template<
typename VT >
906 -> EnableIf_t< UseSMPAssign_v<VT> && !IsCommutative_v<VT1,VT2> >
912 if( !IsComputation_v<VT1> &&
isSame( *lhs, rhs.lhs_ ) ) {
913 multAssign( *lhs, rhs.rhs_ );
939 template<
typename VT >
941 -> EnableIf_t< UseSMPAssign_v<VT> && IsCommutative_v<VT1,VT2> >
947 if( !IsComputation_v<VT1> &&
isSame( *lhs, rhs.lhs_ ) ) {
950 else if( !IsComputation_v<VT2> &&
isSame( *lhs, rhs.rhs_ ) ) {
953 else if( !RequiresEvaluation_v<VT2> ) {
979 template<
typename VT >
981 -> EnableIf_t< UseSMPAssign_v<VT> >
1011 template<
typename VT >
1013 -> EnableIf_t< UseSMPAssign_v<VT> >
1048 template<
typename VT >
1050 -> EnableIf_t< UseSMPAssign_v<VT> >
1085 template<
typename VT >
1087 -> EnableIf_t< UseSMPAssign_v<VT> && !IsCommutative_v<VT1,VT2> >
1118 template<
typename VT >
1120 -> EnableIf_t< UseSMPAssign_v<VT> && IsCommutative_v<VT1,VT2> >
1126 if( !RequiresEvaluation_v<VT2> ) {
1156 template<
typename VT >
1158 -> EnableIf_t< UseSMPAssign_v<VT> >
1224template<
typename VT1
1227inline decltype(
auto)
1232 if( (*lhs).size() != (*rhs).size() ) {
1237 return ReturnType( *lhs, *rhs );
1252template<
typename VT1,
typename VT2,
bool TF >
1253struct IsAligned< DVecDVecMultExpr<VT1,VT2,TF> >
1254 :
public BoolConstant< IsAligned_v<VT1> && IsAligned_v<VT2> >
1270template<
typename VT1,
typename VT2,
bool TF >
1271struct IsPadded< DVecDVecMultExpr<VT1,VT2,TF> >
1272 :
public BoolConstant< IsPadded_v<VT1> && IsPadded_v<VT2> >
Header file for auxiliary alias declarations.
typename T::CompositeType CompositeType_t
Alias declaration for nested CompositeType type definitions.
Definition: Aliases.h:110
typename T::ReturnType ReturnType_t
Alias declaration for nested ReturnType type definitions.
Definition: Aliases.h:470
typename T::ResultType ResultType_t
Alias declaration for nested ResultType type definitions.
Definition: Aliases.h:450
typename T::ElementType ElementType_t
Alias declaration for nested ElementType type definitions.
Definition: Aliases.h:190
typename T::ConstIterator ConstIterator_t
Alias declaration for nested ConstIterator type definitions.
Definition: Aliases.h:130
typename T::TransposeType TransposeType_t
Alias declaration for nested TransposeType type definitions.
Definition: Aliases.h:550
Header file for run time assertion macros.
Header file for the EnableIf class template.
Header file for the function trace functionality.
Header file for the HasSIMDMult type trait.
Macro for CUDA compatibility.
Header file for the If class template.
Header file for the IntegralConstant class template.
Header file for the IsAligned type trait.
Header file for the IsCommutative type trait.
Header file for the IsComputation type trait class.
Header file for the IsExpression type trait class.
Header file for the IsPadded type trait.
Header file for the IsTemporary type trait class.
Deactivation of problematic macros.
Header file for the multiplication trait.
Header file for all SIMD functionality.
Iterator over the elements of the dense vector.
Definition: DVecDVecMultExpr.h:186
BLAZE_DEVICE_CALLABLE ConstIterator & operator++()
Pre-increment operator.
Definition: DVecDVecMultExpr.h:252
BLAZE_DEVICE_CALLABLE bool operator<=(const ConstIterator &rhs) const
Less-or-equal-than comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:361
ElementType ValueType
Type of the underlying elements.
Definition: DVecDVecMultExpr.h:190
LeftIteratorType left_
Iterator to the current left-hand side element.
Definition: DVecDVecMultExpr.h:426
BLAZE_DEVICE_CALLABLE bool operator!=(const ConstIterator &rhs) const
Inequality comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:328
RightIteratorType right_
Iterator to the current right-hand side element.
Definition: DVecDVecMultExpr.h:427
friend BLAZE_DEVICE_CALLABLE const ConstIterator operator+(const ConstIterator &it, size_t inc)
Addition between a ConstIterator and an integral value.
Definition: DVecDVecMultExpr.h:395
BLAZE_DEVICE_CALLABLE ConstIterator(LeftIteratorType left, RightIteratorType right)
Constructor for the ConstIterator class.
Definition: DVecDVecMultExpr.h:215
ElementType * PointerType
Pointer return type.
Definition: DVecDVecMultExpr.h:191
PointerType pointer
Pointer return type.
Definition: DVecDVecMultExpr.h:198
BLAZE_DEVICE_CALLABLE ConstIterator & operator--()
Pre-decrement operator.
Definition: DVecDVecMultExpr.h:274
DifferenceType difference_type
Difference between two iterators.
Definition: DVecDVecMultExpr.h:200
BLAZE_DEVICE_CALLABLE ReturnType operator*() const
Direct access to the element at the current iterator position.
Definition: DVecDVecMultExpr.h:296
ElementType & ReferenceType
Reference return type.
Definition: DVecDVecMultExpr.h:192
BLAZE_DEVICE_CALLABLE ConstIterator & operator+=(size_t inc)
Addition assignment operator.
Definition: DVecDVecMultExpr.h:227
BLAZE_DEVICE_CALLABLE bool operator==(const ConstIterator &rhs) const
Equality comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:317
ptrdiff_t DifferenceType
Difference between two iterators.
Definition: DVecDVecMultExpr.h:193
BLAZE_DEVICE_CALLABLE const ConstIterator operator--(int)
Post-decrement operator.
Definition: DVecDVecMultExpr.h:286
friend BLAZE_DEVICE_CALLABLE const ConstIterator operator+(size_t inc, const ConstIterator &it)
Addition between an integral value and a ConstIterator.
Definition: DVecDVecMultExpr.h:407
BLAZE_DEVICE_CALLABLE ConstIterator & operator-=(size_t dec)
Subtraction assignment operator.
Definition: DVecDVecMultExpr.h:240
IteratorCategory iterator_category
The iterator category.
Definition: DVecDVecMultExpr.h:196
std::random_access_iterator_tag IteratorCategory
The iterator category.
Definition: DVecDVecMultExpr.h:189
BLAZE_DEVICE_CALLABLE DifferenceType operator-(const ConstIterator &rhs) const
Calculating the number of elements between two iterators.
Definition: DVecDVecMultExpr.h:383
BLAZE_DEVICE_CALLABLE bool operator>(const ConstIterator &rhs) const
Greater-than comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:350
ConstIterator_t< VT2 > RightIteratorType
ConstIterator type of the right-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:206
ValueType value_type
Type of the underlying elements.
Definition: DVecDVecMultExpr.h:197
ReferenceType reference
Reference return type.
Definition: DVecDVecMultExpr.h:199
ConstIterator_t< VT1 > LeftIteratorType
ConstIterator type of the left-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:203
BLAZE_DEVICE_CALLABLE bool operator>=(const ConstIterator &rhs) const
Greater-or-equal-than comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:372
BLAZE_DEVICE_CALLABLE const ConstIterator operator++(int)
Post-increment operator.
Definition: DVecDVecMultExpr.h:264
BLAZE_DEVICE_CALLABLE bool operator<(const ConstIterator &rhs) const
Less-than comparison between two ConstIterator objects.
Definition: DVecDVecMultExpr.h:339
auto load() const noexcept
Access to the SIMD elements of the vector.
Definition: DVecDVecMultExpr.h:306
friend BLAZE_DEVICE_CALLABLE const ConstIterator operator-(const ConstIterator &it, size_t dec)
Subtraction between a ConstIterator and an integral value.
Definition: DVecDVecMultExpr.h:419
Expression object for dense vector-dense vector multiplications.
Definition: DVecDVecMultExpr.h:99
ElementType_t< ResultType > ElementType
Resulting element type.
Definition: DVecDVecMultExpr.h:167
bool isAliased(const T *alias) const noexcept
Returns whether the expression is aliased with the given address alias.
Definition: DVecDVecMultExpr.h:570
CompositeType_t< VT1 > CT1
Composite type of the left-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:106
CompositeType_t< VT2 > CT2
Composite type of the right-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:107
ElementType_t< VT2 > ET2
Element type of the right-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:109
size_t size() const noexcept
Returns the current size/dimension of the vector.
Definition: DVecDVecMultExpr.h:525
BLAZE_ALWAYS_INLINE auto load(size_t index) const noexcept
Access to the SIMD elements of the vector.
Definition: DVecDVecMultExpr.h:493
ReturnType operator[](size_t index) const
Subscript operator for the direct access to the vector elements.
Definition: DVecDVecMultExpr.h:466
bool canAlias(const T *alias) const noexcept
Returns whether the expression can alias with the given address alias.
Definition: DVecDVecMultExpr.h:557
If_t< IsExpression_v< VT1 >, const VT1, const VT1 & > LeftOperand
Operand type of the left-hand side dense vector expression (held by value if it is an expression, by const reference otherwise).
Definition: DVecDVecMultExpr.h:176
LeftOperand leftOperand() const noexcept
Returns the left-hand side dense vector operand.
Definition: DVecDVecMultExpr.h:535
If_t< IsExpression_v< VT2 >, const VT2, const VT2 & > RightOperand
Operand type of the right-hand side dense vector expression (held by value if it is an expression, by const reference otherwise).
Definition: DVecDVecMultExpr.h:179
ConstIterator begin() const
Returns an iterator to the first element of the dense vector.
Definition: DVecDVecMultExpr.h:505
ElementType_t< VT1 > ET1
Element type of the left-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:108
static constexpr bool useAssign
Compilation switch for the serial evaluation strategy of the multiplication expression.
Definition: DVecDVecMultExpr.h:133
LeftOperand lhs_
Left-hand side dense vector of the multiplication expression.
Definition: DVecDVecMultExpr.h:598
DVecDVecMultExpr(const VT1 &lhs, const VT2 &rhs) noexcept
Constructor for the DVecDVecMultExpr class.
Definition: DVecDVecMultExpr.h:452
static constexpr size_t SIMDSIZE
The number of elements packed within a single SIMD element.
Definition: DVecDVecMultExpr.h:443
ReturnType_t< VT1 > RN1
Return type of the left-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:104
bool isAligned() const noexcept
Returns whether the operands of the expression are properly aligned in memory.
Definition: DVecDVecMultExpr.h:580
TransposeType_t< ResultType > TransposeType
Transpose type for expression template evaluations.
Definition: DVecDVecMultExpr.h:166
static constexpr bool simdEnabled
Compilation switch for the expression template evaluation strategy.
Definition: DVecDVecMultExpr.h:434
ResultType_t< VT1 > RT1
Result type of the left-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:102
bool canSMPAssign() const noexcept
Returns whether the expression can be used in SMP assignments.
Definition: DVecDVecMultExpr.h:590
static constexpr bool returnExpr
Compilation switch for the selection of the subscript operator return type.
Definition: DVecDVecMultExpr.h:119
decltype(std::declval< RN1 >() *std::declval< RN2 >()) ExprReturnType
Expression return type for the subscript operator.
Definition: DVecDVecMultExpr.h:122
ConstIterator end() const
Returns an iterator just past the last element of the dense vector.
Definition: DVecDVecMultExpr.h:515
MultTrait_t< RT1, RT2 > ResultType
Result type for expression template evaluations.
Definition: DVecDVecMultExpr.h:165
RightOperand rhs_
Right-hand side dense vector of the multiplication expression.
Definition: DVecDVecMultExpr.h:599
static constexpr bool smpAssignable
Compilation switch for the expression template assignment strategy.
Definition: DVecDVecMultExpr.h:438
RightOperand rightOperand() const noexcept
Returns the right-hand side dense vector operand.
Definition: DVecDVecMultExpr.h:545
ResultType_t< VT2 > RT2
Result type of the right-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:103
const If_t< returnExpr, ExprReturnType, ElementType > ReturnType
Return type for expression template evaluations.
Definition: DVecDVecMultExpr.h:170
If_t< useAssign, const ResultType, const DVecDVecMultExpr & > CompositeType
Data type for composite expression templates.
Definition: DVecDVecMultExpr.h:173
ReturnType_t< VT2 > RN2
Return type of the right-hand side dense vector expression.
Definition: DVecDVecMultExpr.h:105
ReturnType at(size_t index) const
Checked access to the vector elements.
Definition: DVecDVecMultExpr.h:479
Base class for N-dimensional dense vectors.
Definition: DenseVector.h:77
SIMD characteristics of data types.
Definition: SIMDTrait.h:297
Constraint on the data type.
Constraint on the data type.
Constraint on the data type.
Header file for the Computation base class.
Header file for the DenseVector base class.
Header file for the VecVecMultExpr base class.
decltype(auto) serial(const DenseMatrix< MT, SO > &dm)
Forces the serial evaluation of the given dense matrix expression dm.
Definition: DMatSerialExpr.h:812
#define BLAZE_CONSTRAINT_MUST_NOT_REQUIRE_EVALUATION(T)
Constraint on the data type.
Definition: RequiresEvaluation.h:81
#define BLAZE_CONSTRAINT_MUST_BE_VECTOR_WITH_TRANSPOSE_FLAG(T, TF)
Constraint on the data type.
Definition: TransposeFlag.h:63
#define BLAZE_CONSTRAINT_MUST_FORM_VALID_VECVECMULTEXPR(T1, T2)
Constraint on the data type.
Definition: VecVecMultExpr.h:104
#define BLAZE_CONSTRAINT_MUST_BE_DENSE_VECTOR_TYPE(T)
Constraint on the data type.
Definition: DenseVector.h:61
typename MultTrait< T1, T2 >::Type MultTrait_t
Auxiliary alias declaration for the MultTrait class template.
Definition: MultTrait.h:165
bool isSame(const Matrix< MT1, SO1 > &a, const Matrix< MT2, SO2 > &b) noexcept
Returns whether the two given matrices represent the same observable state.
Definition: Matrix.h:1424
#define BLAZE_INTERNAL_ASSERT(expr, msg)
Run time assertion macro for internal checks.
Definition: Assert.h:101
auto smpDivAssign(Vector< VT1, TF1 > &lhs, const Vector< VT2, TF2 > &rhs) -> EnableIf_t< IsDenseVector_v< VT1 > >
Default implementation of the SMP division assignment of a vector to a dense vector.
Definition: DenseVector.h:221
auto smpSubAssign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs) -> EnableIf_t< IsDenseMatrix_v< MT1 > >
Default implementation of the SMP subtraction assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:162
auto smpAssign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs) -> EnableIf_t< IsDenseMatrix_v< MT1 > >
Default implementation of the SMP assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:100
auto smpMultAssign(Vector< VT1, TF1 > &lhs, const Vector< VT2, TF2 > &rhs) -> EnableIf_t< IsDenseVector_v< VT1 > >
Default implementation of the SMP multiplication assignment of a vector to a dense vector.
Definition: DenseVector.h:192
auto smpAddAssign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs) -> EnableIf_t< IsDenseMatrix_v< MT1 > >
Default implementation of the SMP addition assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:131
#define BLAZE_ALWAYS_INLINE
Platform dependent setup of an enforced inline keyword.
Definition: Inline.h:85
#define BLAZE_DEVICE_CALLABLE
Conditional macro that sets host and device attributes when compiled with CUDA.
Definition: HostDevice.h:94
typename EnableIf< Condition, T >::Type EnableIf_t
Auxiliary type for the EnableIf class template.
Definition: EnableIf.h:138
typename If< Condition >::template Type< T1, T2 > If_t
Auxiliary alias template for the If class template.
Definition: If.h:108
IntegralConstant< bool, B > BoolConstant
Generic wrapper for a compile time constant boolean value.
Definition: IntegralConstant.h:110
#define BLAZE_THROW_OUT_OF_RANGE(MESSAGE)
Macro for the emission of a std::out_of_range exception.
Definition: Exception.h:331
#define BLAZE_THROW_INVALID_ARGUMENT(MESSAGE)
Macro for the emission of a std::invalid_argument exception.
Definition: Exception.h:235
#define BLAZE_FUNCTION_TRACE
Function trace macro.
Definition: FunctionTrace.h:94
Header file for the exception macros of the math module.
Constraint on the data type.
Header file for all forward declarations for expression class templates.
Header file for the serial shim.
Base class for all compute expression templates.
Definition: Computation.h:68
Base class for all vector/vector multiplication expression templates.
Definition: VecVecMultExpr.h:68
System settings for the inline keywords.
Header file for the thresholds for matrix/vector and matrix/matrix multiplications.
Header file for the RequiresEvaluation type trait.
Header file for basic type definitions.