alexandrehoffmann
diff --git a/‎demo/demo_Matrix.cpp‎
Lines changed: 11 additions & 12 deletions b/‎demo/demo_Matrix.cpp‎
Lines changed: 11 additions & 12 deletions
diff --git a/‎demo/demo_Vector.cpp‎
Lines changed: 5 additions & 5 deletions b/‎demo/demo_Vector.cpp‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎include/FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct.hpp‎
Lines changed: 44 additions & 0 deletions b/‎include/FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct.hpp‎
Lines changed: 44 additions & 0 deletions
diff --git a/‎include/FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct_impl.hpp‎
Lines changed: 124 additions & 0 deletions b/‎include/FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct_impl.hpp‎
Lines changed: 124 additions & 0 deletions
diff --git a/‎include/FSLinalg/BasicLinalg/GeneralMatrixVectorProduct.hpp‎
Lines changed: 0 additions & 94 deletions b/‎include/FSLinalg/BasicLinalg/GeneralMatrixVectorProduct.hpp‎
Lines changed: 0 additions & 94 deletions
diff --git a/‎include/FSLinalg/BasicLinalg/InnerProduct.hpp‎
Lines changed: 20 additions & 0 deletions b/‎include/FSLinalg/BasicLinalg/InnerProduct.hpp‎
Lines changed: 20 additions & 0 deletions
@@ -1,32 +1,31 @@
-#include <FSLinalg/Vector.hpp>
 #include <FSLinalg/Matrix.hpp>
 
 int main()
 {
-	FSLinalg::UnitVector<4> e0(0);
-	FSLinalg::RealVector<3> a({2, 3, 0});
+	FSLinalg::UnitRowVector<4> e0(0);        // demo operand: size-4 unit vector built from index 0 (presumably e_0 - confirm)
+	FSLinalg::RealRowVector<3> a({2, 3, 0}); // demo operand: three real entries 2, 3, 0
 
 	const auto expr1 = 0.5*FSLinalg::outer(e0, a)*a;
 
-	fmt::print("expr = {}\n", FSLinalg::RealVector<4>(expr1));
-	fmt::print("expr.createTemporaryMatrix = {}\n", expr1.createTemporaryMatrix);
-	fmt::print("expr.createTemporaryVector = {}\n", expr1.createTemporaryVector);
+	fmt::print("expr = {}\n", FSLinalg::RealRowVector<4>(expr1)); // materialise expr1 as a RealRowVector<4> for printing
+	fmt::print("expr.createTemporaryLhs = {}\n", expr1.createTemporaryLhs); // label spells the member that is actually printed
+	fmt::print("expr.createTemporaryRhs = {}\n", expr1.createTemporaryRhs); // same for the right-hand operand flag
 
 	const auto expr2 = 0.5*FSLinalg::transpose(FSLinalg::outer(e0, a))*e0;
 
-	fmt::print("expr = {}\n", FSLinalg::RealVector<3>(expr2));
-	fmt::print("expr.createTemporaryMatrix = {}\n", expr2.createTemporaryMatrix);
-	fmt::print("expr.createTemporaryVector = {}\n", expr2.createTemporaryVector);
+	fmt::print("expr = {}\n", FSLinalg::RealRowVector<3>(expr2)); // materialise expr2 as a RealRowVector<3> for printing
+	fmt::print("expr.createTemporaryLhs = {}\n", expr2.createTemporaryLhs);
+	fmt::print("expr.createTemporaryRhs = {}\n", expr2.createTemporaryRhs);
 
 	FSLinalg::RealMatrix<4, 3> A(FSLinalg::outer(e0, a));
 
 	fmt::print("{}\n", A);
 
 	const auto expr3 = 0.5*FSLinalg::transpose(A)*e0;
 
-	fmt::print("expr = {}\n", FSLinalg::RealVector<3>(expr3));
-	fmt::print("expr.createTemporaryMatrix = {}\n", expr3.createTemporaryMatrix);
-	fmt::print("expr.createTemporaryVector = {}\n", expr3.createTemporaryVector);
+	fmt::print("expr = {}\n", FSLinalg::RealRowVector<3>(expr3)); // materialise expr3 as a RealRowVector<3> for printing
+	fmt::print("expr.createTemporaryLhs = {}\n", expr3.createTemporaryLhs);
+	fmt::print("expr.createTemporaryRhs = {}\n", expr3.createTemporaryRhs);
 
 	return EXIT_SUCCESS;
 }
@@ -1,18 +1,18 @@
-#include <FSLinalg/Vector.hpp>
+#include <FSLinalg/Matrix.hpp>
 
 int main()
 {
-	FSLinalg::UnitVector<3> e0(0);
-	FSLinalg::RealVector<3> one(1);
-	FSLinalg::RealVector<3> a({2, 3, 0});
+	FSLinalg::UnitRowVector<3> e0(0);
+	FSLinalg::RealRowVector<3> one(1);
+	FSLinalg::RealRowVector<3> a({2, 3, 0});
 
 	const auto expr = a + 3.*e0 - one/2.;
 
 	fmt::print("{} + 3*{} - {}/2 = {}\n", a, e0, one, expr);
 	fmt::print("expr is aliased to a = {}\n", expr.isAliasedTo(a));
 
 	const auto expr2 = -2.*FSLinalg::cross(a, one);
-	FSLinalg::RealVector<3> c = expr2;
+	FSLinalg::RealRowVector<3> c = expr2;
 
 	fmt::print("cross({}, {}) = {}\n", a, one, c);
 	fmt::print("expr2 is aliased to a = {}\n", expr2.isAliasedTo(a));
 
@@ -0,0 +1,44 @@
+#ifndef FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_HPP
+#define FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_HPP
+
+#include <FSLinalg/Scalar.hpp>
+#include <FSLinalg/Matrix.hpp>
+
+namespace FSLinalg
+{
+namespace BasicLinalg
+{
+
+template<bool transposeA, bool conjugateA, unsigned int nRowsA, unsigned int nColsA, bool transposeB, bool conjugateB, unsigned int nRowsB, unsigned int nColsB, bool incrDst>
+struct GeneralMatrixMatrixProduct // static kernels for Y (+)= alpha * op(A) * op(B) on operands whose sizes are template parameters
+{
+	using Size = unsigned int;
+	// Shapes of op(A) and op(B) (rows and columns swap when the operand is transposed) and of the destination Y.
+	static constexpr Size nRowsOpA = transposeA ? nColsA : nRowsA;
+	static constexpr Size nColsOpA = transposeA ? nRowsA : nColsA;
+	static constexpr Size nRowsOpB = transposeB ? nColsB : nRowsB;
+	static constexpr Size nColsOpB = transposeB ? nRowsB : nColsB;
+	static constexpr Size nRowsY   = nRowsOpA;
+	static constexpr Size nColsY   = nColsOpB;
+	// The inner dimensions of the product have to agree.
+	static_assert(nRowsOpB == nColsOpA, "Matrices sizes must match");
+	// Matrix * Matrix overload; all four overloads are defined in GeneralMatrixMatrixProduct_impl.hpp.
+	template<Scalar_concept ScalarAlpha, Scalar_concept ScalarA, Scalar_concept ScalarB, Scalar_concept ScalarY>
+	static void run(const ScalarAlpha& alpha, const Matrix<ScalarA,nRowsA,nColsA>& A, const Matrix<ScalarB,nRowsB,nColsB>& B, Matrix<ScalarY,nRowsY,nColsY>& Y);
+	// Matrix * UnitMatrix overload.
+	template<Scalar_concept ScalarAlpha, Scalar_concept ScalarA, Scalar_concept ScalarY>
+	static void run(const ScalarAlpha& alpha, const Matrix<ScalarA,nRowsA,nColsA>& A, const UnitMatrix<nRowsB,nColsB>& B, Matrix<ScalarY,nRowsY,nColsY>& Y);
+	// UnitMatrix * Matrix overload.
+	template<Scalar_concept ScalarAlpha, Scalar_concept ScalarB, Scalar_concept ScalarY>
+	static void run(const ScalarAlpha& alpha, const UnitMatrix<nRowsA,nColsA>& A, const Matrix<ScalarB,nRowsB,nColsB>& B, Matrix<ScalarY,nRowsY,nColsY>& Y);
+	// UnitMatrix * UnitMatrix overload.
+	template<Scalar_concept ScalarAlpha, Scalar_concept ScalarY>
+	static void run(const ScalarAlpha& alpha, const UnitMatrix<nRowsA,nColsA>& A, const UnitMatrix<nRowsB,nColsB>& B, Matrix<ScalarY,nRowsY,nColsY>& Y);
+};
+	
+} // namespace BasicLinalg
+} // namespace FSLinalg
+
+#include <FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct_impl.hpp>
+
+#endif // FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_HPP
@@ -0,0 +1,124 @@
+#ifndef FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_IMPL_HPP
+#define FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_IMPL_HPP
+
+#include <FSLinalg/BasicLinalg/GeneralMatrixMatrixProduct.hpp>
+#include <FSLinalg/BasicLinalg/TripleProduct.hpp>
+#include <FSLinalg/BasicLinalg/Product.hpp>
+
+namespace FSLinalg
+{
+namespace BasicLinalg
+{
+
+template<bool transposeA, bool conjugateA, unsigned int nRowsA, unsigned int nColsA, bool transposeB, bool conjugateB, unsigned int nRowsB, unsigned int nColsB, bool incrDst>
+template<Scalar_concept ScalarAlpha, Scalar_concept ScalarA, Scalar_concept ScalarB, Scalar_concept ScalarY>
+void GeneralMatrixMatrixProduct<transposeA,conjugateA,nRowsA,nColsA,transposeB,conjugateB,nRowsB,nColsB,incrDst>::run(
+	const ScalarAlpha&                   alpha,
+	const Matrix<ScalarA,nRowsA,nColsA>& A,
+	const Matrix<ScalarB,nRowsB,nColsB>& B,
+	      Matrix<ScalarY,nRowsY,nColsY>& Y)
+{	// Matrix * Matrix kernel: Y (+)= alpha * op(A) * op(B); Y is zeroed first unless incrDst is set.
+	constexpr Size rowStepA   = transposeA ?      1 : nColsA;
+	constexpr Size innerStepA = transposeA ? nColsA :      1;
+	constexpr Size innerStepB = transposeB ?      1 : nColsB;
+	constexpr Size colStepB   = transposeB ? nColsB :      1;
+	// The steps address op(A)(row,inner) and op(B)(inner,col) through the operands' linear operator[] (nCols entries per stored row).
+	constexpr TripleProduct<false, conjugateA, conjugateB> scaledProduct;
+	// Overwrite mode: clear the destination before accumulating into it.
+	if constexpr (!incrDst)
+	{
+		for (Size entry=0; entry<nRowsY*nColsY; ++entry) { Y[entry] = 0; }
+	}
+	// row / inner / col nesting; scaledProduct presumably applies the conjugations selected by conjugateA / conjugateB (see TripleProduct.hpp).
+	for (Size row=0; row<nRowsY; ++row)
+	{
+		for (Size inner=0; inner<nColsOpA; ++inner)
+		{
+			for (Size col=0; col<nColsY; ++col)
+			{
+				Y(row,col) += scaledProduct(alpha, A[row*rowStepA + inner*innerStepA], B[inner*innerStepB + col*colStepB]);
+			}
+		}
+	}
+}
+
+template<bool transposeA, bool conjugateA, unsigned int nRowsA, unsigned int nColsA, bool transposeB, bool conjugateB, unsigned int nRowsB, unsigned int nColsB, bool incrDst>
+template<Scalar_concept ScalarAlpha, Scalar_concept ScalarA, Scalar_concept ScalarY>
+void GeneralMatrixMatrixProduct<transposeA,conjugateA,nRowsA,nColsA,transposeB,conjugateB,nRowsB,nColsB,incrDst>::run(
+	const ScalarAlpha&                   alpha,
+	const Matrix<ScalarA,nRowsA,nColsA>& A,
+	const UnitMatrix<nRowsB,nColsB>&     B,
+	      Matrix<ScalarY,nRowsY,nColsY>& Y)
+{	// Matrix * UnitMatrix kernel: only one column of Y receives contributions; Y is zeroed first unless incrDst is set.
+	constexpr Size rowStepA   = transposeA ?      1 : nColsA;
+	constexpr Size innerStepA = transposeA ? nColsA :      1;
+	// Two-factor functor: no entry of B is read, only its index pair.
+	constexpr Product<false, conjugateA> scaledEntry;
+	// Overwrite mode: clear the destination before accumulating into it.
+	if constexpr (!incrDst)
+	{
+		for (Size entry=0; entry<nRowsY*nColsY; ++entry) { Y[entry] = 0; }
+	}
+	// (inner, col) is the index pair reported by B.getId() (presumably B's single nonzero entry), swapped when B is transposed.
+	const auto& unitId = B.getId();
+	const Size inner = transposeB ? unitId.j : unitId.i;
+	const Size col   = transposeB ? unitId.i : unitId.j;
+	for (Size row=0; row<nRowsY; ++row)
+	{
+		Y(row,col) += scaledEntry(alpha, A[row*rowStepA + inner*innerStepA]);
+	}
+}
+
+template<bool transposeA, bool conjugateA, unsigned int nRowsA, unsigned int nColsA, bool transposeB, bool conjugateB, unsigned int nRowsB, unsigned int nColsB, bool incrDst>
+template<Scalar_concept ScalarAlpha, Scalar_concept ScalarB, Scalar_concept ScalarY>
+void GeneralMatrixMatrixProduct<transposeA,conjugateA,nRowsA,nColsA,transposeB,conjugateB,nRowsB,nColsB,incrDst>::run(
+	const ScalarAlpha&                   alpha,
+	const UnitMatrix<nRowsA,nColsA>&     A,
+	const Matrix<ScalarB,nRowsB,nColsB>& B,
+	      Matrix<ScalarY,nRowsY,nColsY>& Y)
+{	// UnitMatrix * Matrix kernel: only one row of Y receives contributions; Y is zeroed first unless incrDst is set.
+	constexpr Size innerStepB = transposeB ?      1 : nColsB;
+	constexpr Size colStepB   = transposeB ? nColsB :      1;
+	// Two-factor functor: no entry of A is read, only its index pair.
+	constexpr Product<false, conjugateB> scaledEntry;
+	// Overwrite mode: clear the destination before accumulating into it.
+	if constexpr (!incrDst)
+	{
+		for (Size entry=0; entry<nRowsY*nColsY; ++entry) { Y[entry] = 0; }
+	}
+	// (row, inner) is the index pair reported by A.getId() (presumably A's single nonzero entry), swapped when A is transposed.
+	const auto& unitId = A.getId();
+	const Size row   = transposeA ? unitId.j : unitId.i;
+	const Size inner = transposeA ? unitId.i : unitId.j;
+	// Add the scaled row `inner` of op(B) to row `row` of Y.
+	for (Size col=0; col<nColsY; ++col)
+	{
+		Y(row,col) += scaledEntry(alpha, B[inner*innerStepB + col*colStepB]);
+	}
+}
+
+template<bool transposeA, bool conjugateA, unsigned int nRowsA, unsigned int nColsA, bool transposeB, bool conjugateB, unsigned int nRowsB, unsigned int nColsB, bool incrDst>
+template<Scalar_concept ScalarAlpha, Scalar_concept ScalarY>
+void GeneralMatrixMatrixProduct<transposeA,conjugateA,nRowsA,nColsA,transposeB,conjugateB,nRowsB,nColsB,incrDst>::run(
+	const ScalarAlpha&                   alpha,
+	const UnitMatrix<nRowsA,nColsA>&     A,
+	const UnitMatrix<nRowsB,nColsB>&     B,
+	      Matrix<ScalarY,nRowsY,nColsY>& Y)
+{	// UnitMatrix * UnitMatrix kernel: at most one entry of Y receives alpha; Y is zeroed first unless incrDst is set.
+	if constexpr (not incrDst)
+	{
+		for (Size i=0; i!=nRowsY*nColsY; ++i) { Y[i] = 0; }
+	}
+	// Index pairs reported by getId() (presumably each unit matrix's single nonzero entry), swapped for transposed operands: op(A) -> (i,k1), op(B) -> (k2,j).
+	const Size i  = (not transposeA) ? A.getId().i : A.getId().j;
+	const Size j  = (not transposeB) ? B.getId().j : B.getId().i;
+	const Size k1 = (not transposeA) ? A.getId().j : A.getId().i;
+	const Size k2 = (not transposeB) ? B.getId().i : B.getId().j;
+	// Branch instead of multiplying alpha by a bool: std::complex<T> * bool does not compile, and inf/NaN * false would add NaN to Y.
+	if (k1 == k2) { Y(i,j) += alpha; }
+}
+
+} // namespace BasicLinalg
+} // namespace FSLinalg
+
+#endif // FSLINALG_BASIC_LINALG_GENERAL_MATRIX_MATRIX_PRODUCT_IMPL_HPP
@@ -0,0 +1,20 @@
+#ifndef FSLINALG_INNER_PRODUCT_HPP
+#define FSLINALG_INNER_PRODUCT_HPP
+
+#include <FSLinalg/Vector/VectorBase.hpp>
+#include <FSLinalg/Matrix/MatrixBase.hpp>
+
+namespace FSLinalg
+{
+
+template<class Lhs, class Rhs> // Type of the expression conj(l) * r, with l of type Lhs::Scalar and r of type Rhs::Scalar.
+using InnerProductScalar = decltype(conj(std::declval<typename Lhs::Scalar>()) * std::declval<typename Rhs::Scalar>());
+/// Declaration only (InnerProduct_impl.hpp is included at the end of this header). Returns an InnerProductScalar<Lhs,Rhs>; presumably sum(conj(lhs) * rhs) - confirm against the definition.
+template<class Lhs, class Rhs> InnerProductScalar<Lhs,Rhs> inner(const MatrixBase<Lhs>& base_lhs, const MatrixBase<Rhs>& base_rhs);
+
+	
+} // namespace FSLinalg
+
+#include <FSLinalg/BasicLinalg/InnerProduct_impl.hpp>
+
+#endif // FSLINALG_INNER_PRODUCT_HPP