add rowSums() and colSums() functions to Eidos

bhaller · bhaller · commit a8be5c993baf · 2025-10-08T12:54:38.000-04:00
diff --git a/EidosScribe/EidosHelpFunctions.rtf b/EidosScribe/EidosHelpFunctions.rtf
@@ -4544,9 +4544,15 @@ The above explanation may not be entirely clear, so let\'92s look at an example.
 \f3\fs20 , 2\'966, in the second column.  Although visualization becomes more difficult, these same patterns extend to higher dimensions and arbitrary margins of 
 \f1\fs18 x
 \f3\fs20 .\
+\pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
+\cf2 \kerning1\expnd0\expndtw0 For efficiently obtaining the sums of the rows or columns of a matrix, see 
+\f1\fs18 rowSums()
+\f3\fs20  and 
+\f1\fs18 colSums()
+\f3\fs20 .\
 \pard\pardeftab720\li720\fi-446\ri720\sb180\sa60\partightenfactor0
 
-\f1\fs18 \cf0 \kerning1\expnd0\expndtw0 (*)array(*\'a0data, integer\'a0dim)
+\f1\fs18 \cf0 (*)array(*\'a0data, integer\'a0dim)
 \f2 \
 \pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
 
@@ -4621,7 +4627,48 @@ To combine vectors or matrices by row instead, see
 \f3\fs20 .\
 \pard\pardeftab720\li720\fi-446\ri720\sb180\sa60\partightenfactor0
 
-\f1\fs18 \cf2 \kerning1\expnd0\expndtw0 (numeric$)det(numeric\'a0x)\
+\f1\fs18 \cf2 \kerning1\expnd0\expndtw0 (numeric)colSums(lif\'a0x)\
+\pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
+
+\f0\b\fs20 \cf2 Returns the sums of the columns
+\f3\b0  of 
+\f1\fs18 x
+\f3\fs20 , which must be a matrix.  The result is a vector of elements, each providing the sum of the corresponding column of 
+\f1\fs18 x
+\f3\fs20 .  If 
+\f1\fs18 x
+\f3\fs20  is of type 
+\f1\fs18 logical
+\f3\fs20  or 
+\f1\fs18 integer
+\f3\fs20  the result will be of type 
+\f1\fs18 integer
+\f3\fs20 ; unlike the 
+\f1\fs18 sum()
+\f3\fs20  function, 
+\f1\fs18 colSums()
+\f3\fs20  does not promote the return type to 
+\f1\fs18 float
+\f3\fs20  if 
+\f1\fs18 integer
+\f3\fs20  overflow occurs, but instead throws an error.  If 
+\f1\fs18 x
+\f3\fs20  is of type 
+\f1\fs18 float
+\f3\fs20  the result will be of type 
+\f1\fs18 float
+\f3\fs20 .  Except for the change in the treatment of 
+\f1\fs18 integer
+\f3\fs20  overflow noted above, this is equivalent to using 
+\f1\fs18 apply()
+\f3\fs20  with 
+\f1\fs18 sum()
+\f3\fs20  to sum the columns of 
+\f1\fs18 x
+\f3\fs20 , but is much faster.\
+\pard\pardeftab720\li720\fi-446\ri720\sb180\sa60\partightenfactor0
+
+\f1\fs18 \cf2 (numeric$)det(numeric\'a0x)\
 \pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
 
 \f0\b\fs20 \cf2 Returns the determinant
@@ -5029,7 +5076,48 @@ To combine vectors or matrices by column instead, see
 \f3\fs20 .\
 \pard\pardeftab720\li720\fi-446\ri720\sb180\sa60\partightenfactor0
 
-\f1\fs18 \cf0 \kerning1\expnd0\expndtw0 (*)t(*\'a0x)
+\f1\fs18 \cf2 \kerning1\expnd0\expndtw0 (numeric)rowSums(lif\'a0x)\
+\pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
+
+\f0\b\fs20 \cf2 Returns the sums of the rows
+\f3\b0  of 
+\f1\fs18 x
+\f3\fs20 , which must be a matrix.  The result is a vector of elements, each providing the sum of the corresponding row of 
+\f1\fs18 x
+\f3\fs20 .  If 
+\f1\fs18 x
+\f3\fs20  is of type 
+\f1\fs18 logical
+\f3\fs20  or 
+\f1\fs18 integer
+\f3\fs20  the result will be of type 
+\f1\fs18 integer
+\f3\fs20 ; unlike the 
+\f1\fs18 sum()
+\f3\fs20  function, 
+\f1\fs18 rowSums()
+\f3\fs20  does not promote the return type to 
+\f1\fs18 float
+\f3\fs20  if 
+\f1\fs18 integer
+\f3\fs20  overflow occurs, but instead throws an error.  If 
+\f1\fs18 x
+\f3\fs20  is of type 
+\f1\fs18 float
+\f3\fs20  the result will be of type 
+\f1\fs18 float
+\f3\fs20 .  Except for the change in the treatment of 
+\f1\fs18 integer
+\f3\fs20  overflow noted above, this is equivalent to using 
+\f1\fs18 apply()
+\f3\fs20  with 
+\f1\fs18 sum()
+\f3\fs20  to sum the rows of 
+\f1\fs18 x
+\f3\fs20 , but is much faster.\
+\pard\pardeftab720\li720\fi-446\ri720\sb180\sa60\partightenfactor0
+
+\f1\fs18 \cf0 (*)t(*\'a0x)
 \f2 \
 \pard\pardeftab720\li547\ri720\sb60\sa60\partightenfactor0
 
diff --git a/QtSLiM/help/EidosHelpFunctions.html b/QtSLiM/help/EidosHelpFunctions.html
diff --git a/VERSIONS b/VERSIONS
@@ -14,6 +14,7 @@ development head (in the master branch):
 	add rects() call to Plot, for plotting a set of rectangles
 	extend text() to support drawing text and an angle, with new [float angle = 0.0] parameter
 	add mtext() call to Plot, for drawing text in the margins outside the plot area
+	add rowSums() and colSums() functions to Eidos, for use with matrices as a faster alternative to apply()
 
 
 version 5.1 (Eidos version 4.1):
diff --git a/eidos/eidos_functions.cpp b/eidos/eidos_functions.cpp
@@ -297,6 +297,8 @@ const std::vector<EidosFunctionSignature_CSP> &EidosInterpreter::BuiltInFunction
 		signatures->emplace_back((EidosFunctionSignature *)(new EidosFunctionSignature("det",				Eidos_ExecuteFunction_det,			kEidosValueMaskNumeric | kEidosValueMaskSingleton))->AddNumeric("x"));
 		signatures->emplace_back((EidosFunctionSignature *)(new EidosFunctionSignature("inverse",			Eidos_ExecuteFunction_inverse,		kEidosValueMaskFloat))->AddNumeric("x"));
 		signatures->emplace_back((EidosFunctionSignature *)(new EidosFunctionSignature("asVector",			Eidos_ExecuteFunction_asVector,		kEidosValueMaskAny))->AddAny("x"));
+		signatures->emplace_back((EidosFunctionSignature *)(new EidosFunctionSignature("rowSums",			Eidos_ExecuteFunction_rowSums,		kEidosValueMaskNumeric))->AddLogicalEquiv("x"));
+		signatures->emplace_back((EidosFunctionSignature *)(new EidosFunctionSignature("colSums",			Eidos_ExecuteFunction_colSums,		kEidosValueMaskNumeric))->AddLogicalEquiv("x"));
 
 		
 		// ************************************************************************************
diff --git a/eidos/eidos_functions.h b/eidos/eidos_functions.h
@@ -234,6 +234,8 @@ EidosValue_SP Eidos_ExecuteFunction_tr(const std::vector<EidosValue_SP> &p_argum
 EidosValue_SP Eidos_ExecuteFunction_det(const std::vector<EidosValue_SP> &p_arguments, EidosInterpreter &p_interpreter);
 EidosValue_SP Eidos_ExecuteFunction_inverse(const std::vector<EidosValue_SP> &p_arguments, EidosInterpreter &p_interpreter);
 EidosValue_SP Eidos_ExecuteFunction_asVector(const std::vector<EidosValue_SP> &p_arguments, EidosInterpreter &p_interpreter);
+EidosValue_SP Eidos_ExecuteFunction_rowSums(const std::vector<EidosValue_SP> &p_arguments, EidosInterpreter &p_interpreter);
+EidosValue_SP Eidos_ExecuteFunction_colSums(const std::vector<EidosValue_SP> &p_arguments, EidosInterpreter &p_interpreter);
 
 
 #pragma mark -
diff --git a/eidos/eidos_functions_matrices.cpp b/eidos/eidos_functions_matrices.cpp
@@ -1537,6 +1537,178 @@ EidosValue_SP Eidos_ExecuteFunction_asVector(const std::vector<EidosValue_SP> &p
 	return result_SP;
 }
 
+//	(numeric)rowSums(lif x): returns a vector with one sum per row of the matrix x; integer sums for logical or integer x, float sums for float x
+EidosValue_SP Eidos_ExecuteFunction_rowSums(const std::vector<EidosValue_SP> &p_arguments, __attribute__((unused)) EidosInterpreter &p_interpreter)
+{
+	EidosValue_SP result_SP(nullptr);
+	
+	EidosValue *x_value = p_arguments[0].get();
+	EidosValueType x_type = x_value->Type();
+	
+	if (x_value->DimensionCount() != 2)	// only values with exactly two dimensions are accepted as matrices
+		EIDOS_TERMINATION << "ERROR (Eidos_ExecuteFunction_rowSums): in function rowSums() x is not a matrix." << EidosTerminate(nullptr);
+	
+	const int64_t *dim_values = x_value->Dimensions();
+	size_t x_rowcount = (size_t)dim_values[0];	// first dimension is used as the row count
+	size_t x_colcount = (size_t)dim_values[1];	// second dimension is used as the column count
+	
+	if (x_type == EidosValueType::kValueInt)
+	{
+		const int64_t *int_data = x_value->IntData();
+		
+		EidosValue_Int *int_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Int())->resize_no_initialize(x_rowcount);
+		result_SP = EidosValue_SP(int_result);
+		
+		for (size_t value_index = 0; value_index < x_rowcount; ++value_index)	// value_index is the row being summed
+		{
+			int64_t sum = 0;
+			const int64_t *series_ptr = int_data + value_index;	// start at the element of this row in the first column
+			
+			for (size_t col_index = 0; col_index < x_colcount; ++col_index)
+			{
+				// equivalent to sum += *series_ptr, except that integer overflow is detected and reported as an error
+				int64_t old_sum = sum;
+				int64_t temp = *series_ptr;
+				bool overflow = Eidos_add_overflow(old_sum, temp, &sum);
+				
+				if (overflow)
+					EIDOS_TERMINATION << "ERROR (Eidos_ExecuteFunction_rowSums): integer overflow in rowSums(); you might wish to convert to float before calling rowSums()." << EidosTerminate(nullptr);
+				
+				series_ptr += x_rowcount;	// step to the same row in the next column; the data is indexed as column-major here
+			}
+			
+			int_result->set_int_no_check(sum, value_index);	// the total for this row goes to the matching result index
+		}
+	}
+	else if (x_type == EidosValueType::kValueFloat)
+	{
+		const double *float_data = x_value->FloatData();
+		
+		EidosValue_Float *float_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Float())->resize_no_initialize(x_rowcount);
+		result_SP = EidosValue_SP(float_result);
+		
+		for (size_t value_index = 0; value_index < x_rowcount; ++value_index)	// value_index is the row being summed
+		{
+			double sum = 0;
+			const double *series_ptr = float_data + value_index;	// start at the element of this row in the first column
+			
+			for (size_t col_index = 0; col_index < x_colcount; ++col_index)
+			{
+				sum += *series_ptr;	// plain double accumulation, added in column order
+				series_ptr += x_rowcount;	// step to the same row in the next column
+			}
+			
+			float_result->set_float_no_check(sum, value_index);
+		}
+	}
+	else if (x_type == EidosValueType::kValueLogical)	// logical input is totalled into an integer result
+	{
+		const eidos_logical_t *logical_data = x_value->LogicalData();
+		
+		EidosValue_Int *int_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Int())->resize_no_initialize(x_rowcount);
+		result_SP = EidosValue_SP(int_result);
+		
+		for (size_t value_index = 0; value_index < x_rowcount; ++value_index)	// value_index is the row being summed
+		{
+			int64_t sum = 0;
+			const eidos_logical_t *series_ptr = logical_data + value_index;	// start at the element of this row in the first column
+			
+			for (size_t col_index = 0; col_index < x_colcount; ++col_index)
+			{
+				sum += *series_ptr;	// no overflow check is made in this branch, unlike the integer branch
+				series_ptr += x_rowcount;	// step to the same row in the next column
+			}
+			
+			int_result->set_int_no_check(sum, value_index);
+		}
+	}
+	
+	return result_SP;	// remains nullptr if x_type matched none of the three branches above
+}
+
+//	(numeric)colSums(lif x): returns a vector with one sum per column of the matrix x; integer sums for logical or integer x, float sums for float x
+EidosValue_SP Eidos_ExecuteFunction_colSums(const std::vector<EidosValue_SP> &p_arguments, __attribute__((unused)) EidosInterpreter &p_interpreter)
+{
+	EidosValue_SP result_SP(nullptr);
+	
+	EidosValue *x_value = p_arguments[0].get();
+	EidosValueType x_type = x_value->Type();
+	
+	if (x_value->DimensionCount() != 2)	// only values with exactly two dimensions are accepted as matrices
+		EIDOS_TERMINATION << "ERROR (Eidos_ExecuteFunction_colSums): in function colSums() x is not a matrix." << EidosTerminate(nullptr);
+	
+	const int64_t *dim_values = x_value->Dimensions();
+	size_t x_rowcount = (size_t)dim_values[0];	// first dimension is used as the row count
+	size_t x_colcount = (size_t)dim_values[1];	// second dimension is used as the column count
+	
+	if (x_type == EidosValueType::kValueInt)
+	{
+		const int64_t *int_data = x_value->IntData();
+		
+		EidosValue_Int *int_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Int())->resize_no_initialize(x_colcount);
+		result_SP = EidosValue_SP(int_result);
+		
+		for (size_t value_index = 0; value_index < x_colcount; ++value_index)	// value_index is the column being summed
+		{
+			int64_t sum = 0;
+			const int64_t *series_ptr = int_data + value_index * x_rowcount;	// first element of this column; its x_rowcount elements are read contiguously
+			
+			for (size_t row_index = 0; row_index < x_rowcount; ++row_index)
+			{
+				// equivalent to sum += *series_ptr, except that integer overflow is detected and reported as an error
+				int64_t old_sum = sum;
+				int64_t temp = *series_ptr;
+				bool overflow = Eidos_add_overflow(old_sum, temp, &sum);
+				
+				if (overflow)
+					EIDOS_TERMINATION << "ERROR (Eidos_ExecuteFunction_colSums): integer overflow in colSums(); you might wish to convert to float before calling colSums()." << EidosTerminate(nullptr);
+				
+				series_ptr++;	// next row within the same column
+			}
+			
+			int_result->set_int_no_check(sum, value_index);	// the total for this column goes to the matching result index
+		}
+	}
+	else if (x_type == EidosValueType::kValueFloat)
+	{
+		const double *float_data = x_value->FloatData();
+		
+		EidosValue_Float *float_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Float())->resize_no_initialize(x_colcount);
+		result_SP = EidosValue_SP(float_result);
+		
+		for (size_t value_index = 0; value_index < x_colcount; ++value_index)	// value_index is the column being summed
+		{
+			double sum = 0;
+			const double *series_ptr = float_data + value_index * x_rowcount;	// first element of this column
+			
+			for (size_t row_index = 0; row_index < x_rowcount; ++row_index)
+				sum += *(series_ptr++);	// plain double accumulation, added in row order
+			
+			float_result->set_float_no_check(sum, value_index);
+		}
+	}
+	else if (x_type == EidosValueType::kValueLogical)	// logical input is totalled into an integer result
+	{
+		const eidos_logical_t *logical_data = x_value->LogicalData();
+		
+		EidosValue_Int *int_result = (new (gEidosValuePool->AllocateChunk()) EidosValue_Int())->resize_no_initialize(x_colcount);
+		result_SP = EidosValue_SP(int_result);
+		
+		for (size_t value_index = 0; value_index < x_colcount; ++value_index)	// value_index is the column being summed
+		{
+			int64_t sum = 0;
+			const eidos_logical_t *series_ptr = logical_data + value_index * x_rowcount;	// first element of this column
+			
+			for (size_t row_index = 0; row_index < x_rowcount; ++row_index)
+				sum += *(series_ptr++);	// no overflow check is made in this branch, unlike the integer branch
+			
+			int_result->set_int_no_check(sum, value_index);
+		}
+	}
+	
+	return result_SP;	// remains nullptr if x_type matched none of the three branches above
+}
+
 
 
 
diff --git a/eidos/eidos_test_functions_other.cpp b/eidos/eidos_test_functions_other.cpp
@@ -370,6 +370,22 @@ void _RunFunctionMatrixArrayTests(void)
 	EidosAssertScriptSuccess_L("x = 1.0:12; y = matrix(x, nrow=3); identical(asVector(y), x);", true);
 	EidosAssertScriptSuccess_L("x = (rbinom(12, 1, 0.5) == 1); y = matrix(x, nrow=3); identical(asVector(y), x);", true);
 	EidosAssertScriptSuccess_L("x = c('a','b','c','d','e','f','g','h','i','j','k','l'); y = matrix(x, nrow=3); identical(asVector(y), x);", true);
+	
+	// rowSums()
+	EidosAssertScriptSuccess_L("x = c(T,T,F,F,T,F,F,T,T,F,F,T); y = matrix(x, nrow=3); identical(rowSums(y), c(1, 3, 2));", true);
+	EidosAssertScriptSuccess_L("x = 1:12; y = matrix(x, nrow=3); identical(rowSums(y), c(22, 26, 30));", true);
+	EidosAssertScriptSuccess_L("x = 1.0:12; y = matrix(x, nrow=3); identical(rowSums(y), c(22.0, 26, 30));", true);
+	EidosAssertScriptSuccess_L("x = (rbinom(100, 1, 0.4) == 1); y = matrix(x, nrow=10); identical(rowSums(y), apply(y, 0, 'sum(applyValue);'));", true);
+	EidosAssertScriptSuccess_L("x = rdunif(100, -1000, 1000); y = matrix(x, nrow=10); identical(rowSums(y), apply(y, 0, 'sum(applyValue);'));", true);
+	EidosAssertScriptSuccess_L("x = runif(100); y = matrix(x, nrow=10); identical(rowSums(y), apply(y, 0, 'sum(applyValue);'));", true);
+	
+	// colSums()
+	EidosAssertScriptSuccess_L("x = c(T,T,F,F,T,F,F,T,T,F,F,T); y = matrix(x, nrow=3); identical(colSums(y), c(2, 1, 2, 1));", true);
+	EidosAssertScriptSuccess_L("x = 1:12; y = matrix(x, nrow=3); identical(colSums(y), c(6, 15, 24, 33));", true);
+	EidosAssertScriptSuccess_L("x = 1.0:12; y = matrix(x, nrow=3); identical(colSums(y), c(6.0, 15, 24, 33));", true);
+	EidosAssertScriptSuccess_L("x = (rbinom(100, 1, 0.4) == 1); y = matrix(x, nrow=10); identical(colSums(y), apply(y, 1, 'sum(applyValue);'));", true);
+	EidosAssertScriptSuccess_L("x = rdunif(100, -1000, 1000); y = matrix(x, nrow=10); identical(colSums(y), apply(y, 1, 'sum(applyValue);'));", true);
+	EidosAssertScriptSuccess_L("x = runif(100); y = matrix(x, nrow=10); identical(colSums(y), apply(y, 1, 'sum(applyValue);'));", true);
 }
 
 #pragma mark filesystem access