35 #ifndef _BLAZE_MATH_EXPRESSIONS_DMATSMATMULTEXPR_H_
36 #define _BLAZE_MATH_EXPRESSIONS_DMATSMATMULTEXPR_H_
101 template<
typename MT1
133 template<
typename MT >
134 struct UseSMPAssign {
135 enum { value = ( evaluateLeft || evaluateRight ) };
145 template<
typename T1,
typename T2,
typename T3 >
146 struct UseOptimizedKernel {
147 enum { value = !IsResizable<typename T1::ElementType>::value };
157 template<
typename T1,
typename T2,
typename T3 >
158 struct UseDefaultKernel {
159 enum { value = !UseOptimizedKernel<T1,T2,T3>::value };
189 enum { vectorizable = 0 };
192 enum { smpAssignable = !evaluateLeft && MT1::smpAssignable &&
193 !evaluateRight && MT2::smpAssignable };
223 if(
lhs_.columns() != 0UL ) {
225 for(
size_t k=1UL; k<
lhs_.columns(); ++k ) {
253 return rhs_.columns();
283 template<
typename T >
285 return (
lhs_.isAliased( alias ) ||
rhs_.isAliased( alias ) );
295 template<
typename T >
297 return (
lhs_.isAliased( alias ) ||
rhs_.isAliased( alias ) );
307 return lhs_.isAligned();
340 template<
typename MT >
358 DMatSMatMultExpr::selectRowMajorAssignKernel( ~lhs, A, B );
377 template<
typename MT3
381 selectRowMajorAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
385 for(
size_t i=0UL; i<A.rows(); ++i ) {
386 for(
size_t j=0UL; j<C.columns(); ++j ) {
389 for(
size_t j=0UL; j<B.rows(); ++j ) {
390 ConstIterator element( B.begin(j) );
391 const ConstIterator end( B.end(j) );
392 for( ; element!=end; ++element ) {
394 C(i,element->index()) = A(i,j) * element->value();
396 C(i,element->index()) += A(i,j) * element->value();
418 template<
typename MT3
421 static inline typename EnableIf< UseOptimizedKernel<MT3,MT4,MT5> >::Type
422 selectRowMajorAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
426 BLAZE_INTERNAL_ASSERT( ( A.rows() - ( A.rows() % 4UL ) ) == ( A.rows() & size_t(-4) ),
"Invalid end calculation" );
427 const size_t last( A.rows() & size_t(-4) );
429 for(
size_t i=0UL; i<last; i+=4UL ) {
430 for(
size_t j=0UL; j<C.columns(); ++j ) {
436 for(
size_t j=0UL; j<B.rows(); ++j ) {
437 ConstIterator element( B.begin(j) );
438 const ConstIterator end( B.end(j) );
439 for( ; element!=end; ++element ) {
440 C(i ,element->index()) += A(i ,j) * element->value();
441 C(i+1UL,element->index()) += A(i+1UL,j) * element->value();
442 C(i+2UL,element->index()) += A(i+2UL,j) * element->value();
443 C(i+3UL,element->index()) += A(i+3UL,j) * element->value();
448 for(
size_t i=last; i<A.rows(); ++i ) {
449 for(
size_t j=0UL; j<C.columns(); ++j ) {
452 for(
size_t j=0UL; j<B.rows(); ++j ) {
453 ConstIterator element( B.begin(j) );
454 const ConstIterator end( B.end(j) );
455 for( ; element!=end; ++element ) {
456 C(i,element->index()) += A(i,j) * element->value();
477 template<
typename MT >
495 DMatSMatMultExpr::selectColumnMajorAssignKernel( ~lhs, A, B );
514 template<
typename MT3
517 static inline typename EnableIf< UseDefaultKernel<MT3,MT4,MT5> >::Type
518 selectColumnMajorAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
524 for(
size_t i=0UL; i<B.rows(); ++i ) {
525 for(
size_t jj=0UL; jj<A.rows(); jj+=8UL ) {
526 const size_t jend( ( jj+8UL > A.rows() )?( A.rows() ):( jj+8UL ) );
527 ConstIterator element( B.begin(i) );
528 const ConstIterator end( B.end(i) );
529 for( ; element!=end; ++element ) {
530 for(
size_t j=jj; j<jend; ++j ) {
532 C(j,element->index()) = A(j,i) * element->value();
534 C(j,element->index()) += A(j,i) * element->value();
557 template<
typename MT3
560 static inline typename EnableIf< UseOptimizedKernel<MT3,MT4,MT5> >::Type
561 selectColumnMajorAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
567 for(
size_t i=0UL; i<B.rows(); ++i ) {
568 for(
size_t jj=0UL; jj<A.rows(); jj+=8UL ) {
569 const size_t jend( ( jj+8UL > A.rows() )?( A.rows() ):( jj+8UL ) );
570 ConstIterator element( B.begin(i) );
571 const ConstIterator end( B.end(i) );
572 for( ; element!=end; ++element ) {
573 for(
size_t j=jj; j<jend; ++j ) {
574 C(j,element->index()) += A(j,i) * element->value();
596 template<
typename MT
602 typedef typename SelectType< SO, OppositeType, ResultType >::Type TmpType;
614 const TmpType tmp(
serial( rhs ) );
633 template<
typename MT >
651 DMatSMatMultExpr::selectRowMajorAddAssignKernel( ~lhs, A, B );
670 template<
typename MT3
673 static inline void selectRowMajorAddAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
677 const size_t last( A.rows() & size_t(-4) );
679 for(
size_t i=0UL; i<last; i+=4UL ) {
680 for(
size_t j=0UL; j<B.rows(); ++j ) {
681 ConstIterator element( B.begin(j) );
682 const ConstIterator end( B.end(j) );
683 for( ; element!=end; ++element ) {
684 C(i ,element->index()) += A(i ,j) * element->value();
685 C(i+1UL,element->index()) += A(i+1UL,j) * element->value();
686 C(i+2UL,element->index()) += A(i+2UL,j) * element->value();
687 C(i+3UL,element->index()) += A(i+3UL,j) * element->value();
692 for(
size_t i=last; i<A.rows(); ++i ) {
693 for(
size_t j=0UL; j<B.rows(); ++j ) {
694 ConstIterator element( B.begin(j) );
695 const ConstIterator end( B.end(j) );
696 for( ; element!=end; ++element ) {
697 C(i,element->index()) += A(i,j) * element->value();
718 template<
typename MT >
736 DMatSMatMultExpr::selectColumnMajorAddAssignKernel( ~lhs, A, B );
755 template<
typename MT3
758 static inline void selectColumnMajorAddAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
762 for(
size_t i=0UL; i<B.rows(); ++i ) {
763 for(
size_t jj=0UL; jj<A.rows(); jj+=8UL ) {
764 const size_t jend( ( jj+8UL > A.rows() )?( A.rows() ):( jj+8UL ) );
765 ConstIterator element( B.begin(i) );
766 const ConstIterator end( B.end(i) );
767 for( ; element!=end; ++element ) {
768 for(
size_t j=jj; j<jend; ++j ) {
769 C(j,element->index()) += A(j,i) * element->value();
795 template<
typename MT >
813 DMatSMatMultExpr::selectRowMajorSubAssignKernel( ~lhs, A, B );
832 template<
typename MT3
835 static inline void selectRowMajorSubAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
839 const size_t last( A.rows() & size_t(-4) );
841 for(
size_t i=0UL; i<last; i+=4UL ) {
842 for(
size_t j=0UL; j<B.rows(); ++j ) {
843 ConstIterator element( B.begin(j) );
844 const ConstIterator end( B.end(j) );
845 for( ; element!=end; ++element ) {
846 C(i ,element->index()) -= A(i ,j) * element->value();
847 C(i+1UL,element->index()) -= A(i+1UL,j) * element->value();
848 C(i+2UL,element->index()) -= A(i+2UL,j) * element->value();
849 C(i+3UL,element->index()) -= A(i+3UL,j) * element->value();
854 for(
size_t i=last; i<A.rows(); ++i ) {
855 for(
size_t j=0UL; j<B.rows(); ++j ) {
856 ConstIterator element( B.begin(j) );
857 const ConstIterator end( B.end(j) );
858 for( ; element!=end; ++element ) {
859 C(i,element->index()) -= A(i,j) * element->value();
880 template<
typename MT >
898 DMatSMatMultExpr::selectColumnMajorSubAssignKernel( ~lhs, A, B );
917 template<
typename MT3
920 static inline void selectColumnMajorSubAssignKernel( MT3& C,
const MT4& A,
const MT5& B )
924 for(
size_t i=0UL; i<B.rows(); ++i ) {
925 for(
size_t jj=0UL; jj<A.rows(); jj+=8UL ) {
926 const size_t jend( ( jj+8UL > A.rows() )?( A.rows() ):( jj+8UL ) );
927 ConstIterator element( B.begin(i) );
928 const ConstIterator end( B.end(i) );
929 for( ; element!=end; ++element ) {
930 for(
size_t j=jj; j<jend; ++j ) {
931 C(j,element->index()) -= A(j,i) * element->value();
967 template<
typename MT
969 friend inline typename EnableIf< UseSMPAssign<MT> >::Type
1007 template<
typename MT
1009 friend inline typename EnableIf< UseSMPAssign<MT> >::Type
1014 typedef typename SelectType< SO, OppositeType, ResultType >::Type TmpType;
1026 const TmpType tmp( rhs );
1047 template<
typename MT
1049 friend inline typename EnableIf< UseSMPAssign<MT> >::Type
1091 template<
typename MT
1093 friend inline typename EnableIf< UseSMPAssign<MT> >::Type
1177 template<
typename T1
1179 inline const DMatSMatMultExpr<T1,T2>
1185 throw std::invalid_argument(
"Matrix sizes do not match" );
1202 template<
typename MT1,
typename MT2,
typename VT >
// Result type selection: if MT1 is a row-major dense matrix, MT2 a row-major sparse
// matrix and VT a dense column vector, Type is the DMatDVecMultExprTrait of MT1 and the
// SMatDVecMultExprTrait<MT2,VT> result (i.e. the product is typed as MT1 * (MT2 * VT));
// otherwise Type is INVALID_TYPE.
1207 typedef typename SelectType< IsDenseMatrix<MT1>::value && IsRowMajorMatrix<MT1>::value &&
1208 IsSparseMatrix<MT2>::value && IsRowMajorMatrix<MT2>::value &&
1209 IsDenseVector<VT>::value && IsColumnVector<VT>::value
1210 ,
typename DMatDVecMultExprTrait< MT1, typename SMatDVecMultExprTrait<MT2,VT>::Type >::Type
1211 , INVALID_TYPE >::Type Type;
1220 template<
typename MT1,
typename MT2,
typename VT >
// Result type selection: if MT1 is a row-major dense matrix, MT2 a row-major sparse
// matrix and VT a sparse column vector, Type is the DMatSVecMultExprTrait of MT1 and the
// SMatSVecMultExprTrait<MT2,VT> result (i.e. the product is typed as MT1 * (MT2 * VT));
// otherwise Type is INVALID_TYPE.
1225 typedef typename SelectType< IsDenseMatrix<MT1>::value && IsRowMajorMatrix<MT1>::value &&
1226 IsSparseMatrix<MT2>::value && IsRowMajorMatrix<MT2>::value &&
1227 IsSparseVector<VT>::value && IsColumnVector<VT>::value
1228 ,
typename DMatSVecMultExprTrait< MT1, typename SMatSVecMultExprTrait<MT2,VT>::Type >::Type
1229 , INVALID_TYPE >::Type Type;
1238 template<
typename VT,
typename MT1,
typename MT2 >
// Result type selection: if VT is a dense row vector, MT1 a row-major dense matrix and
// MT2 a row-major sparse matrix, Type is the TDVecSMatMultExprTrait of the
// TDVecDMatMultExprTrait<VT,MT1> result and MT2 (i.e. the product is typed as
// (VT * MT1) * MT2); otherwise Type is INVALID_TYPE.
1243 typedef typename SelectType< IsDenseVector<VT>::value && IsRowVector<VT>::value &&
1244 IsDenseMatrix<MT1>::value && IsRowMajorMatrix<MT1>::value &&
1245 IsSparseMatrix<MT2>::value && IsRowMajorMatrix<MT2>::value
1246 ,
typename TDVecSMatMultExprTrait< typename TDVecDMatMultExprTrait<VT,MT1>::Type, MT2 >::Type
1247 , INVALID_TYPE >::Type Type;
1256 template<
typename VT,
typename MT1,
typename MT2 >
// Result type selection: if VT is a sparse row vector, MT1 a row-major dense matrix and
// MT2 a row-major sparse matrix, Type is the TDVecSMatMultExprTrait of the
// TSVecDMatMultExprTrait<VT,MT1> result and MT2 (i.e. the product is typed as
// (VT * MT1) * MT2); otherwise Type is INVALID_TYPE.
//
// The inner VT * MT1 product is resolved through TSVecDMatMultExprTrait because this
// branch is guarded by IsSparseVector<VT>. The dense-vector trait TDVecDMatMultExprTrait
// does not describe a sparse VT and would presumably degrade the whole selection to
// INVALID_TYPE - NOTE(review): confirm against the TDVecDMatMultExprTrait base template.
1261 typedef typename SelectType< IsSparseVector<VT>::value && IsRowVector<VT>::value &&
1262 IsDenseMatrix<MT1>::value && IsRowMajorMatrix<MT1>::value &&
1263 IsSparseMatrix<MT2>::value && IsRowMajorMatrix<MT2>::value
1264 ,
typename TDVecSMatMultExprTrait< typename TSVecDMatMultExprTrait<VT,MT1>::Type, MT2 >::Type
1265 , INVALID_TYPE >::Type Type;
1274 template<
typename MT1,
typename MT2,
bool AF >
// Type is the MultExprTrait result for the two SubmatrixExprTrait types built from
// const MT1 and const MT2, both instantiated with the same AF flag.
1279 typedef typename MultExprTrait< typename SubmatrixExprTrait<const MT1,AF>::Type
1280 ,
typename SubmatrixExprTrait<const MT2,AF>::Type >::Type Type;
1289 template<
typename MT1,
typename MT2 >
// Type is the MultExprTrait result for the RowExprTrait type of const MT1 and MT2
// (only the left-hand operand is reduced to its row type).
1294 typedef typename MultExprTrait< typename RowExprTrait<const MT1>::Type, MT2 >::Type Type;
1303 template<
typename MT1,
typename MT2 >
// Type is the MultExprTrait result for MT1 and the ColumnExprTrait type of const MT2
// (only the right-hand operand is reduced to its column type).
1308 typedef typename MultExprTrait< MT1, typename ColumnExprTrait<const MT2>::Type >::Type Type;
ResultType::TransposeType TransposeType
Transpose type for expression template evaluations.
Definition: DMatSMatMultExpr.h:169
Compile time check whether the given type is a computational expression template. This type trait clas...
Definition: IsComputation.h:89
RightOperand rhs_
Right-hand side sparse matrix of the multiplication expression.
Definition: DMatSMatMultExpr.h:324
Header file for the SMatDVecMultExprTrait class template.
void reset(DynamicMatrix< Type, SO > &m)
Resetting the given dense matrix.
Definition: DynamicMatrix.h:4599
const DMatDMatMultExpr< T1, T2 > operator*(const DenseMatrix< T1, false > &lhs, const DenseMatrix< T2, false > &rhs)
Multiplication operator for the multiplication of two row-major dense matrices ($A=B*C$).
Definition: DMatDMatMultExpr.h:4329
const ResultType CompositeType
Data type for composite expression templates.
Definition: DMatSMatMultExpr.h:172
ReturnType operator()(size_t i, size_t j) const
2D-access to the matrix elements.
Definition: DMatSMatMultExpr.h:217
const ElementType ReturnType
Return type for expression template evaluations.
Definition: DMatSMatMultExpr.h:171
SelectType< evaluateRight, const RT2, CT2 >::Type RT
Type for the assignment of the right-hand side sparse matrix operand.
Definition: DMatSMatMultExpr.h:184
void smpSubAssign(DenseMatrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the SMP subtraction assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:152
Header file for the IsSparseMatrix type trait.
bool isDefault(const DynamicMatrix< Type, SO > &m)
Returns whether the given dense matrix is in default state.
Definition: DynamicMatrix.h:4642
Efficient implementation of a compressed matrix. The CompressedMatrix class template is the represent...
Definition: CompressedMatrix.h:199
#define BLAZE_CONSTRAINT_MUST_BE_DENSE_MATRIX_TYPE(T)
Constraint on the data type. In case the given data type T is not a dense, N-dimensional matrix type...
Definition: DenseMatrix.h:79
Header file for the ColumnExprTrait class template.
const This & CompositeType
Data type for composite expression templates.
Definition: CompressedMatrix.h:2408
Header file for the IsRowVector type trait.
Type ElementType
Type of the sparse matrix elements.
Definition: CompressedMatrix.h:251
size_t columns() const
Returns the current number of columns of the matrix.
Definition: DMatSMatMultExpr.h:252
bool isAligned() const
Returns whether the operands of the expression are properly aligned in memory.
Definition: DMatSMatMultExpr.h:306
MT2::ResultType RT2
Result type of the right-hand side sparse matrix expression.
Definition: DMatSMatMultExpr.h:110
Header file for the TDVecSMatMultExprTrait class template.
MultTrait< RT1, RT2 >::Type ResultType
Result type for expression template evaluations.
Definition: DMatSMatMultExpr.h:167
const DMatSerialExpr< MT, SO > serial(const DenseMatrix< MT, SO > &dm)
Forces the serial evaluation of the given dense matrix expression dm.
Definition: DMatSerialExpr.h:690
Header file for the Computation base class.
Header file for the MatMatMultExpr base class.
Base class for dense matrices. The DenseMatrix class is a base class for all dense matrix classes...
Definition: DenseMatrix.h:70
Base class for sparse matrices. The SparseMatrix class is a base class for all sparse matrix classes...
Definition: Forward.h:107
Constraint on the data type.
Constraint on the data type.
Constraint on the data type.
Header file for the MultExprTrait class template.
void smpAddAssign(DenseMatrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the SMP addition assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:122
Compile time check to query the requirement to evaluate an expression. Via this type trait it is possi...
Definition: RequiresEvaluation.h:90
SelectType< IsExpression< MT2 >::value, const MT2, const MT2 & >::Type RightOperand
Composite type of the right-hand side sparse matrix expression.
Definition: DMatSMatMultExpr.h:178
LeftOperand lhs_
Left-hand side dense matrix of the multiplication expression.
Definition: DMatSMatMultExpr.h:323
size_t rows() const
Returns the current number of rows of the matrix.
Definition: DMatSMatMultExpr.h:242
Compile time type selection. The SelectType class template selects one of the two given types T1 and T...
Definition: SelectType.h:59
Header file for the multiplication trait.
MT1::ResultType RT1
Result type of the left-hand side dense matrix expression.
Definition: DMatSMatMultExpr.h:109
#define BLAZE_CONSTRAINT_MUST_BE_COLUMN_MAJOR_MATRIX_TYPE(T)
Constraint on the data type. In case the given data type T is not a column-major dense or sparse matri...
Definition: StorageOrder.h:161
const Element * ConstIterator
Iterator over constant elements.
Definition: CompressedMatrix.h:2412
LeftOperand leftOperand() const
Returns the left-hand side dense matrix operand.
Definition: DMatSMatMultExpr.h:262
Header file for the DenseMatrix base class.
ResultType::OppositeType OppositeType
Result type with opposite storage order for expression template evaluations.
Definition: DMatSMatMultExpr.h:168
void assign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the assignment of a matrix to a matrix.
Definition: Matrix.h:271
Header file for the DMatDVecMultExprTrait class template.
RT2::ElementType ET2
Element type of the right-hand side sparse matrix expression.
Definition: DMatSMatMultExpr.h:112
Header file for the SMatSVecMultExprTrait class template.
#define BLAZE_CONSTRAINT_MUST_BE_REFERENCE_TYPE(T)
Constraint on the data type. In case the given data type T is not a reference type, a compilation error is created.
Definition: Reference.h:78
bool canSMPAssign() const
Returns whether the expression can be used in SMP assignments.
Definition: DMatSMatMultExpr.h:316
Constraints on the storage order of matrix types.
SelectType< evaluateLeft, const RT1, CT1 >::Type LT
Type for the assignment of the left-hand side dense matrix operand.
Definition: DMatSMatMultExpr.h:181
Type ElementType
Type of the sparse matrix elements.
Definition: CompressedMatrix.h:2406
Header file for the SelectType class template.
Header file for the RowExprTrait class template.
Header file for all forward declarations for expression class templates.
Header file for the IsDenseMatrix type trait.
Header file for the EnableIf class template.
Header file for the serial shim.
ResultType::ElementType ElementType
Resulting element type.
Definition: DMatSMatMultExpr.h:170
void smpAssign(DenseMatrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the SMP assignment of a matrix to a dense matrix.
Definition: DenseMatrix.h:92
MT1::CompositeType CT1
Composite type of the left-hand side dense matrix expression.
Definition: DMatSMatMultExpr.h:113
RT1::ElementType ET1
Element type of the left-hand side dense matrix expression.
Definition: DMatSMatMultExpr.h:111
Base class for all matrix/matrix multiplication expression templates. The MatMatMultExpr class serves ...
Definition: MatMatMultExpr.h:65
Header file for the IsSparseVector type trait.
Header file for the SubmatrixExprTrait class template.
#define BLAZE_CONSTRAINT_MUST_BE_ROW_MAJOR_MATRIX_TYPE(T)
Constraint on the data type. In case the given data type T is not a row-major dense or sparse matrix t...
Definition: StorageOrder.h:81
bool canAlias(const T *alias) const
Returns whether the expression can alias with the given address alias.
Definition: DMatSMatMultExpr.h:284
Header file for run time assertion macros.
bool isAliased(const T *alias) const
Returns whether the expression is aliased with the given address alias.
Definition: DMatSMatMultExpr.h:296
Utility type for generic codes.
Base template for the MultTrait class.
Definition: MultTrait.h:141
Expression object for dense matrix-sparse matrix multiplications. The DMatSMatMultExpr class represent...
Definition: DMatSMatMultExpr.h:103
void addAssign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the addition assignment of a matrix to a matrix.
Definition: Matrix.h:301
Substitution Failure Is Not An Error (SFINAE) class. The EnableIf class template is an auxiliary tool ...
Definition: EnableIf.h:184
Header file for the reset shim.
void subAssign(Matrix< MT1, SO1 > &lhs, const Matrix< MT2, SO2 > &rhs)
Default implementation of the subtraction assignment of a matrix to a matrix.
Definition: Matrix.h:331
Header file for the isDefault shim.
#define BLAZE_CONSTRAINT_MATRICES_MUST_HAVE_SAME_STORAGE_ORDER(T1, T2)
Constraint on the data type. In case either of the two given data types T1 or T2 is not a matrix type ...
Definition: StorageOrder.h:283
MT2::CompositeType CT2
Composite type of the right-hand side sparse matrix expression.
Definition: DMatSMatMultExpr.h:114
Header file for the IsDenseVector type trait.
SelectType< IsExpression< MT1 >::value, const MT1, const MT1 & >::Type LeftOperand
Composite type of the left-hand side dense matrix expression.
Definition: DMatSMatMultExpr.h:175
Header file for the IsRowMajorMatrix type trait.
Header file for the IsComputation type trait class.
const size_t SMP_DMATSMATMULT_THRESHOLD
SMP row-major dense matrix/row-major sparse matrix multiplication threshold. This threshold specifies ...
Definition: Thresholds.h:926
Base class for all compute expression templates. The Computation class serves as a tag for all computa...
Definition: Computation.h:59
Header file for the TDVecDMatMultExprTrait class template.
#define BLAZE_FUNCTION_TRACE
Function trace macro. This macro can be used to reliably trace function calls. In case function tracin...
Definition: FunctionTrace.h:157
This ResultType
Result type for expression template evaluations.
Definition: CompressedMatrix.h:2403
DMatSMatMultExpr(const MT1 &lhs, const MT2 &rhs)
Constructor for the DMatSMatMultExpr class.
Definition: DMatSMatMultExpr.h:202
Header file for basic type definitions.
Header file for the TSVecDMatMultExprTrait class template.
DMatSMatMultExpr< MT1, MT2 > This
Type of this DMatSMatMultExpr instance.
Definition: DMatSMatMultExpr.h:166
Header file for the DMatSVecMultExprTrait class template.
Header file for the IsColumnVector type trait.
Header file for the IsResizable type trait.
Header file for the thresholds for matrix/vector and matrix/matrix multiplications.
#define BLAZE_INTERNAL_ASSERT(expr, msg)
Run time assertion macro for internal checks. In case of an invalid run time expression, the program execution is terminated. The BLAZE_INTERNAL_ASSERT macro can be disabled by setting the BLAZE_USER_ASSERTION flag to zero or by defining NDEBUG during the compilation.
Definition: Assert.h:101
#define BLAZE_CONSTRAINT_MUST_BE_SPARSE_MATRIX_TYPE(T)
Constraint on the data type. In case the given data type T is not a sparse, N-dimensional matrix type...
Definition: SparseMatrix.h:79
Header file for the IsExpression type trait class.
Header file for the FunctionTrace class.
RightOperand rightOperand() const
Returns the right-hand side sparse matrix operand.
Definition: DMatSMatMultExpr.h:272