// This file is part of Eigen, a lightweight C++ template library // for linear algebra. // // Copyright (C) 2008 Benoit Jacob // Copyright (C) 2015 Gael Guennebaud // // This Source Code Form is subject to the terms of the Mozilla // Public License v. 2.0. If a copy of the MPL was not distributed // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. #define TEST_ENABLE_TEMPORARY_TRACKING #define EIGEN_CACHEFRIENDLY_PRODUCT_THRESHOLD 8 // ^^ see bug 1449 #include "main.h" template void matrixRedux(const MatrixType& m) { typedef typename MatrixType::Scalar Scalar; typedef typename MatrixType::RealScalar RealScalar; Index rows = m.rows(); Index cols = m.cols(); MatrixType m1 = MatrixType::Random(rows, cols); // The entries of m1 are uniformly distributed in [-1,1), so m1.prod() is very small. This may lead to test // failures if we underflow into denormals. Thus, we scale so that entries are close to 1. MatrixType m1_for_prod = MatrixType::Ones(rows, cols) + RealScalar(0.2) * m1; Matrix m2(rows, rows); m2.setRandom(); // Prevent overflows for integer types. if (Eigen::NumTraits::IsInteger) { Scalar kMaxVal = Scalar(8); m1.array() = m1.array() - kMaxVal * (m1.array() / kMaxVal); m2.array() = m2.array() - kMaxVal * (m2.array() / kMaxVal); } VERIFY_IS_EQUAL(MatrixType::Zero(rows, cols).sum(), Scalar(0)); Scalar sizeAsScalar = internal::cast(rows * cols); VERIFY_IS_APPROX(MatrixType::Ones(rows, cols).sum(), sizeAsScalar); Scalar s(0), p(1), minc(numext::real(m1.coeff(0))), maxc(numext::real(m1.coeff(0))); for (int j = 0; j < cols; j++) for (int i = 0; i < rows; i++) { s += m1(i, j); p *= m1_for_prod(i, j); minc = (std::min)(numext::real(minc), numext::real(m1(i, j))); maxc = (std::max)(numext::real(maxc), numext::real(m1(i, j))); } const Scalar mean = s / Scalar(RealScalar(rows * cols)); VERIFY_IS_APPROX(m1.sum(), s); VERIFY_IS_APPROX(m1.mean(), mean); VERIFY_IS_APPROX(m1_for_prod.prod(), p); VERIFY_IS_APPROX(m1.real().minCoeff(), numext::real(minc)); VERIFY_IS_APPROX(m1.real().maxCoeff(), numext::real(maxc)); // test that partial reduction works if nested expressions is forced to evaluate early VERIFY_IS_APPROX((m1.matrix() * m1.matrix().transpose()).cwiseProduct(m2.matrix()).rowwise().sum().sum(), (m1.matrix() * m1.matrix().transpose()).eval().cwiseProduct(m2.matrix()).rowwise().sum().sum()); // test slice vectorization assuming assign is ok Index r0 = internal::random(0, rows - 1); Index c0 = internal::random(0, cols - 1); Index r1 = internal::random(r0 + 1, rows) - r0; Index c1 = internal::random(c0 + 1, cols) - c0; VERIFY_IS_APPROX(m1.block(r0, c0, r1, c1).sum(), m1.block(r0, c0, r1, c1).eval().sum()); VERIFY_IS_APPROX(m1.block(r0, c0, r1, c1).mean(), m1.block(r0, c0, r1, c1).eval().mean()); VERIFY_IS_APPROX(m1_for_prod.block(r0, c0, r1, c1).prod(), m1_for_prod.block(r0, c0, r1, c1).eval().prod()); VERIFY_IS_APPROX(m1.block(r0, c0, r1, c1).real().minCoeff(), m1.block(r0, c0, r1, c1).real().eval().minCoeff()); VERIFY_IS_APPROX(m1.block(r0, c0, r1, c1).real().maxCoeff(), m1.block(r0, c0, r1, c1).real().eval().maxCoeff()); // regression for bug 1090 const int R1 = MatrixType::RowsAtCompileTime >= 2 ? MatrixType::RowsAtCompileTime / 2 : 6; const int C1 = MatrixType::ColsAtCompileTime >= 2 ? MatrixType::ColsAtCompileTime / 2 : 6; if (R1 <= rows - r0 && C1 <= cols - c0) { VERIFY_IS_APPROX((m1.template block(r0, c0).sum()), m1.block(r0, c0, R1, C1).sum()); } // test empty objects VERIFY_IS_APPROX(m1.block(r0, c0, 0, 0).sum(), Scalar(0)); VERIFY_IS_APPROX(m1.block(r0, c0, 0, 0).prod(), Scalar(1)); // test nesting complex expression VERIFY_EVALUATION_COUNT((m1.matrix() * m1.matrix().transpose()).sum(), (MatrixType::IsVectorAtCompileTime && MatrixType::SizeAtCompileTime != 1 ? 0 : 1)); VERIFY_EVALUATION_COUNT(((m1.matrix() * m1.matrix().transpose()) + m2).sum(), (MatrixType::IsVectorAtCompileTime && MatrixType::SizeAtCompileTime != 1 ? 0 : 1)); } template void vectorRedux(const VectorType& w) { using std::abs; typedef typename VectorType::Scalar Scalar; typedef typename NumTraits::Real RealScalar; Index size = w.size(); VectorType v = VectorType::Random(size); VectorType v_for_prod = VectorType::Ones(size) + Scalar(0.2) * v; // see comment above declaration of m1_for_prod if (Eigen::NumTraits::IsInteger) { Scalar kMaxVal = Scalar(8); v.array() = v.array() - kMaxVal * (v.array() / kMaxVal); v_for_prod = VectorType::Ones(size) + Scalar(0.2) * v; } for (int i = 1; i < size; i++) { Scalar s(0), p(1); RealScalar minc(numext::real(v.coeff(0))), maxc(numext::real(v.coeff(0))); for (int j = 0; j < i; j++) { s += v[j]; p *= v_for_prod[j]; minc = (std::min)(minc, numext::real(v[j])); maxc = (std::max)(maxc, numext::real(v[j])); } VERIFY_IS_MUCH_SMALLER_THAN(abs(s - v.head(i).sum()), Scalar(1)); VERIFY_IS_APPROX(p, v_for_prod.head(i).prod()); VERIFY_IS_APPROX(minc, v.real().head(i).minCoeff()); VERIFY_IS_APPROX(maxc, v.real().head(i).maxCoeff()); } for (int i = 0; i < size - 1; i++) { Scalar s(0), p(1); RealScalar minc(numext::real(v.coeff(i))), maxc(numext::real(v.coeff(i))); for (int j = i; j < size; j++) { s += v[j]; p *= v_for_prod[j]; minc = (std::min)(minc, numext::real(v[j])); maxc = (std::max)(maxc, numext::real(v[j])); } VERIFY_IS_MUCH_SMALLER_THAN(abs(s - v.tail(size - i).sum()), Scalar(1)); VERIFY_IS_APPROX(p, v_for_prod.tail(size - i).prod()); VERIFY_IS_APPROX(minc, v.real().tail(size - i).minCoeff()); VERIFY_IS_APPROX(maxc, v.real().tail(size - i).maxCoeff()); } for (int i = 0; i < size / 2; i++) { Scalar s(0), p(1); RealScalar minc(numext::real(v.coeff(i))), maxc(numext::real(v.coeff(i))); for (int j = i; j < size - i; j++) { s += v[j]; p *= v_for_prod[j]; minc = (std::min)(minc, numext::real(v[j])); maxc = (std::max)(maxc, numext::real(v[j])); } VERIFY_IS_MUCH_SMALLER_THAN(abs(s - v.segment(i, size - 2 * i).sum()), Scalar(1)); VERIFY_IS_APPROX(p, v_for_prod.segment(i, size - 2 * i).prod()); VERIFY_IS_APPROX(minc, v.real().segment(i, size - 2 * i).minCoeff()); VERIFY_IS_APPROX(maxc, v.real().segment(i, size - 2 * i).maxCoeff()); } // test empty objects VERIFY_IS_APPROX(v.head(0).sum(), Scalar(0)); VERIFY_IS_APPROX(v.tail(0).prod(), Scalar(1)); VERIFY_RAISES_ASSERT(v.head(0).mean()); VERIFY_RAISES_ASSERT(v.head(0).minCoeff()); VERIFY_RAISES_ASSERT(v.head(0).maxCoeff()); } void boolRedux(Index rows, Index cols) { // Test boolean reductions: all(), any(), count() typedef Array BoolArray; // All-true BoolArray all_true = BoolArray::Constant(rows, cols, true); VERIFY(all_true.all()); VERIFY(all_true.any()); VERIFY_IS_EQUAL(all_true.count(), rows * cols); // All-false BoolArray all_false = BoolArray::Constant(rows, cols, false); if (rows > 0 && cols > 0) { VERIFY(!all_false.all()); VERIFY(!all_false.any()); } VERIFY_IS_EQUAL(all_false.count(), Index(0)); // Mixed: set a checkerboard pattern BoolArray mixed(rows, cols); Index expected_count = 0; for (Index j = 0; j < cols; ++j) for (Index i = 0; i < rows; ++i) { mixed(i, j) = ((i + j) % 2 == 0); if (mixed(i, j)) expected_count++; } VERIFY_IS_EQUAL(mixed.count(), expected_count); if (rows > 0 && cols > 0) { VERIFY(mixed.any()); VERIFY(mixed.all() == (expected_count == rows * cols)); } // Partial reductions if (rows > 0 && cols > 0) { auto col_counts = mixed.colwise().count(); for (Index k = 0; k < cols; ++k) VERIFY_IS_EQUAL(col_counts(k), mixed.col(k).count()); auto row_counts = mixed.rowwise().count(); for (Index k = 0; k < rows; ++k) VERIFY_IS_EQUAL(row_counts(k), mixed.row(k).count()); } } // Test reductions at sizes that hit vectorization boundaries in Redux.h: // LinearVectorizedTraversal with 2-way unrolled packet loop, scalar pre/post loops. template void redux_vec_boundary() { const Index PS = internal::packet_traits::size; // Critical sizes: around packet multiples and at 2-way unroll boundaries const Index sizes[] = {1, PS - 1, PS, PS + 1, 2 * PS - 1, 2 * PS, 2 * PS + 1, 3 * PS, 3 * PS + 1, 4 * PS - 1, 4 * PS, 4 * PS + 1, 8 * PS, 8 * PS + 1}; for (int si = 0; si < 14; ++si) { const Index n = sizes[si]; if (n <= 0) continue; typedef Matrix Vec; Vec v = Vec::Random(n); // For prod, use values near 1 to avoid underflow (float) or overflow (int). Vec v_for_prod = Vec::Ones(n) + Scalar(typename NumTraits::Real(0.2)) * v; // Reference: scalar loops Scalar ref_sum(0), ref_prod(1); typename NumTraits::Real ref_min = numext::real(v(0)), ref_max = numext::real(v(0)); for (Index k = 0; k < n; ++k) { ref_sum += v(k); ref_prod *= v_for_prod(k); ref_min = (std::min)(ref_min, numext::real(v(k))); ref_max = (std::max)(ref_max, numext::real(v(k))); } VERIFY_IS_APPROX(v.sum(), ref_sum); VERIFY_IS_APPROX(v_for_prod.prod(), ref_prod); VERIFY_IS_APPROX(v.real().minCoeff(), ref_min); VERIFY_IS_APPROX(v.real().maxCoeff(), ref_max); } } // Test reductions on strided (non-contiguous) mapped data. // This exercises SliceVectorizedTraversal or DefaultTraversal in Redux.h // depending on stride and packet size. template void redux_strided() { const Index n = 64; typedef Matrix Vec; Vec data = Vec::Random(2 * n); // Map with inner stride of 2 — every other element Map> strided(data.data(), n); Scalar ref_sum(0); typename NumTraits::Real ref_min = numext::real(strided(0)), ref_max = numext::real(strided(0)); for (Index k = 0; k < n; ++k) { ref_sum += strided(k); ref_min = (std::min)(ref_min, numext::real(strided(k))); ref_max = (std::max)(ref_max, numext::real(strided(k))); } VERIFY_IS_APPROX(strided.sum(), ref_sum); VERIFY_IS_APPROX(strided.real().minCoeff(), ref_min); VERIFY_IS_APPROX(strided.real().maxCoeff(), ref_max); // Also test reduction on a non-contiguous matrix block (SliceVectorizedTraversal) typedef Matrix Mat; Mat m = Mat::Random(16, 16); for (Index bsz = 1; bsz <= 8; bsz *= 2) { Scalar block_sum(0); for (Index j = 0; j < bsz; ++j) for (Index i = 0; i < bsz; ++i) block_sum += m(1 + i, 1 + j); VERIFY_IS_APPROX(m.block(1, 1, bsz, bsz).sum(), block_sum); } } EIGEN_DECLARE_TEST(redux) { // the max size cannot be too large, otherwise reduxion operations obviously generate large errors. int maxsize = (std::min)(100, EIGEN_TEST_MAX_SIZE); TEST_SET_BUT_UNUSED_VARIABLE(maxsize); for (int i = 0; i < g_repeat; i++) { int rows = internal::random(1, maxsize); int cols = internal::random(1, maxsize); EIGEN_UNUSED_VARIABLE(rows); EIGEN_UNUSED_VARIABLE(cols); CALL_SUBTEST_1(matrixRedux(Matrix())); CALL_SUBTEST_1(matrixRedux(Array())); CALL_SUBTEST_2(matrixRedux(Matrix2f())); CALL_SUBTEST_2(matrixRedux(Array2f())); CALL_SUBTEST_2(matrixRedux(Array22f())); CALL_SUBTEST_3(matrixRedux(Matrix4d())); CALL_SUBTEST_3(matrixRedux(Array4d())); CALL_SUBTEST_3(matrixRedux(Array44d())); CALL_SUBTEST_4(matrixRedux(MatrixXf(rows, cols))); CALL_SUBTEST_4(matrixRedux(ArrayXXf(rows, cols))); CALL_SUBTEST_4(matrixRedux(MatrixXd(rows, cols))); CALL_SUBTEST_4(matrixRedux(ArrayXXd(rows, cols))); /* TODO: fix test for boolean */ /*CALL_SUBTEST_5(matrixRedux(MatrixX(rows, cols)));*/ /*CALL_SUBTEST_5(matrixRedux(ArrayXX(rows, cols)));*/ CALL_SUBTEST_5(matrixRedux(MatrixXi(rows, cols))); CALL_SUBTEST_5(matrixRedux(ArrayXXi(rows, cols))); CALL_SUBTEST_5(matrixRedux(MatrixX(rows, cols))); CALL_SUBTEST_5(matrixRedux(ArrayXX(rows, cols))); CALL_SUBTEST_6(matrixRedux(MatrixXcf(rows, cols))); CALL_SUBTEST_6(matrixRedux(ArrayXXcf(rows, cols))); CALL_SUBTEST_7(matrixRedux(MatrixXcd(rows, cols))); CALL_SUBTEST_7(matrixRedux(ArrayXXcd(rows, cols))); } for (int i = 0; i < g_repeat; i++) { int size = internal::random(1, maxsize); EIGEN_UNUSED_VARIABLE(size); CALL_SUBTEST_8(vectorRedux(Vector4f())); CALL_SUBTEST_8(vectorRedux(Array4f())); CALL_SUBTEST_9(vectorRedux(VectorXf(size))); CALL_SUBTEST_9(vectorRedux(ArrayXf(size))); CALL_SUBTEST_10(vectorRedux(VectorXd(size))); CALL_SUBTEST_10(vectorRedux(ArrayXd(size))); /* TODO: fix test for boolean */ /*CALL_SUBTEST_10(vectorRedux(VectorX(size)));*/ /*CALL_SUBTEST_10(vectorRedux(ArrayX(size)));*/ CALL_SUBTEST_10(vectorRedux(VectorXi(size))); CALL_SUBTEST_10(vectorRedux(ArrayXi(size))); CALL_SUBTEST_10(vectorRedux(VectorX(size))); CALL_SUBTEST_10(vectorRedux(ArrayX(size))); } // Bool reductions (deterministic, outside g_repeat) CALL_SUBTEST_11(boolRedux(1, 1)); CALL_SUBTEST_11(boolRedux(4, 4)); CALL_SUBTEST_11(boolRedux(7, 13)); CALL_SUBTEST_11(boolRedux(63, 63)); // Bool reductions at vectorization boundary sizes. // all()/any()/count() use packet-level visitors with remainder handling. { // bool packets are typically 16 bytes (SSE) or 32 bytes (AVX). // Test sizes around common packet sizes to catch off-by-one in remainder loops. const Index bsizes[] = {1, 2, 3, 7, 8, 9, 15, 16, 17, 31, 32, 33, 63, 64, 65, 127, 128, 129}; EIGEN_UNUSED_VARIABLE(bsizes); for (int si = 0; si < 18; ++si) { CALL_SUBTEST_11(boolRedux(bsizes[si], 1)); // column vector CALL_SUBTEST_11(boolRedux(1, bsizes[si])); // row vector CALL_SUBTEST_11(boolRedux(bsizes[si], 3)); // thin matrix } } // Vectorization boundary sizes — deterministic, run once. // Integer types are excluded: full-range random ints overflow in sum/prod (UB). // Integer reductions are already tested by matrixRedux/vectorRedux with clamped values. CALL_SUBTEST_12(redux_vec_boundary()); CALL_SUBTEST_12(redux_vec_boundary()); // Strided (non-contiguous) reductions. CALL_SUBTEST_13(redux_strided()); CALL_SUBTEST_13(redux_strided()); CALL_SUBTEST_13(redux_strided>()); }