// This file is part of Eigen, a lightweight C++ template library // for linear algebra. // // Copyright (C) 2006-2008 Benoit Jacob // // This Source Code Form is subject to the terms of the Mozilla // Public License v. 2.0. If a copy of the MPL was not distributed // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. #include "main.h" template void product_extra(const MatrixType& m) { typedef typename MatrixType::Scalar Scalar; typedef Matrix RowVectorType; typedef Matrix ColVectorType; typedef Matrix OtherMajorMatrixType; Index rows = m.rows(); Index cols = m.cols(); MatrixType m1 = MatrixType::Random(rows, cols), m2 = MatrixType::Random(rows, cols), m3(rows, cols), mzero = MatrixType::Zero(rows, cols), identity = MatrixType::Identity(rows, rows), square = MatrixType::Random(rows, rows), res = MatrixType::Random(rows, rows), square2 = MatrixType::Random(cols, cols), res2 = MatrixType::Random(cols, cols); RowVectorType v1 = RowVectorType::Random(rows), vrres(rows); ColVectorType vc2 = ColVectorType::Random(cols), vcres(cols); OtherMajorMatrixType tm1 = m1; Scalar s1 = internal::random(), s2 = internal::random(), s3 = internal::random(); VERIFY_IS_APPROX(m3.noalias() = m1 * m2.adjoint(), m1 * m2.adjoint().eval()); VERIFY_IS_APPROX(m3.noalias() = m1.adjoint() * square.adjoint(), m1.adjoint().eval() * square.adjoint().eval()); VERIFY_IS_APPROX(m3.noalias() = m1.adjoint() * m2, m1.adjoint().eval() * m2); VERIFY_IS_APPROX(m3.noalias() = (s1 * m1.adjoint()) * m2, (s1 * m1.adjoint()).eval() * m2); VERIFY_IS_APPROX(m3.noalias() = ((s1 * m1).adjoint()) * m2, (numext::conj(s1) * m1.adjoint()).eval() * m2); VERIFY_IS_APPROX(m3.noalias() = (-m1.adjoint() * s1) * (s3 * m2), (-m1.adjoint() * s1).eval() * (s3 * m2).eval()); VERIFY_IS_APPROX(m3.noalias() = (s2 * m1.adjoint() * s1) * m2, (s2 * m1.adjoint() * s1).eval() * m2); VERIFY_IS_APPROX(m3.noalias() = (-m1 * s2) * s1 * m2.adjoint(), (-m1 * s2).eval() * (s1 * m2.adjoint()).eval()); // a very tricky case where a scale factor has to be automatically conjugated: VERIFY_IS_APPROX(m1.adjoint() * (s1 * m2).conjugate(), (m1.adjoint()).eval() * ((s1 * m2).conjugate()).eval()); // test all possible conjugate combinations for the four matrix-vector product cases: VERIFY_IS_APPROX((-m1.conjugate() * s2) * (s1 * vc2), (-m1.conjugate() * s2).eval() * (s1 * vc2).eval()); VERIFY_IS_APPROX((-m1 * s2) * (s1 * vc2.conjugate()), (-m1 * s2).eval() * (s1 * vc2.conjugate()).eval()); VERIFY_IS_APPROX((-m1.conjugate() * s2) * (s1 * vc2.conjugate()), (-m1.conjugate() * s2).eval() * (s1 * vc2.conjugate()).eval()); VERIFY_IS_APPROX((s1 * vc2.transpose()) * (-m1.adjoint() * s2), (s1 * vc2.transpose()).eval() * (-m1.adjoint() * s2).eval()); VERIFY_IS_APPROX((s1 * vc2.adjoint()) * (-m1.transpose() * s2), (s1 * vc2.adjoint()).eval() * (-m1.transpose() * s2).eval()); VERIFY_IS_APPROX((s1 * vc2.adjoint()) * (-m1.adjoint() * s2), (s1 * vc2.adjoint()).eval() * (-m1.adjoint() * s2).eval()); VERIFY_IS_APPROX((-m1.adjoint() * s2) * (s1 * v1.transpose()), (-m1.adjoint() * s2).eval() * (s1 * v1.transpose()).eval()); VERIFY_IS_APPROX((-m1.transpose() * s2) * (s1 * v1.adjoint()), (-m1.transpose() * s2).eval() * (s1 * v1.adjoint()).eval()); VERIFY_IS_APPROX((-m1.adjoint() * s2) * (s1 * v1.adjoint()), (-m1.adjoint() * s2).eval() * (s1 * v1.adjoint()).eval()); VERIFY_IS_APPROX((s1 * v1) * (-m1.conjugate() * s2), (s1 * v1).eval() * (-m1.conjugate() * s2).eval()); VERIFY_IS_APPROX((s1 * v1.conjugate()) * (-m1 * s2), (s1 * v1.conjugate()).eval() * (-m1 * s2).eval()); VERIFY_IS_APPROX((s1 * v1.conjugate()) * (-m1.conjugate() * s2), (s1 * v1.conjugate()).eval() * (-m1.conjugate() * s2).eval()); VERIFY_IS_APPROX((-m1.adjoint() * s2) * (s1 * v1.adjoint()), (-m1.adjoint() * s2).eval() * (s1 * v1.adjoint()).eval()); // test the vector-matrix product with non aligned starts Index i = internal::random(0, m1.rows() - 2); Index j = internal::random(0, m1.cols() - 2); Index r = internal::random(1, m1.rows() - i); Index c = internal::random(1, m1.cols() - j); Index i2 = internal::random(0, m1.rows() - 1); Index j2 = internal::random(0, m1.cols() - 1); VERIFY_IS_APPROX(m1.col(j2).adjoint() * m1.block(0, j, m1.rows(), c), m1.col(j2).adjoint().eval() * m1.block(0, j, m1.rows(), c).eval()); VERIFY_IS_APPROX(m1.block(i, 0, r, m1.cols()) * m1.row(i2).adjoint(), m1.block(i, 0, r, m1.cols()).eval() * m1.row(i2).adjoint().eval()); // test negative strides { Map > map1(&m1(rows - 1, cols - 1), rows, cols, Stride(-m1.outerStride(), -1)); Map > map2(&m2(rows - 1, cols - 1), rows, cols, Stride(-m2.outerStride(), -1)); Map > mapv1(&v1(v1.size() - 1), v1.size(), InnerStride<-1>(-1)); Map > mapvc2(&vc2(vc2.size() - 1), vc2.size(), InnerStride<-1>(-1)); VERIFY_IS_APPROX(MatrixType(map1), m1.reverse()); VERIFY_IS_APPROX(MatrixType(map2), m2.reverse()); VERIFY_IS_APPROX(m3.noalias() = MatrixType(map1) * MatrixType(map2).adjoint(), m1.reverse() * m2.reverse().adjoint()); VERIFY_IS_APPROX(m3.noalias() = map1 * map2.adjoint(), m1.reverse() * m2.reverse().adjoint()); VERIFY_IS_APPROX(map1 * vc2, m1.reverse() * vc2); VERIFY_IS_APPROX(m1 * mapvc2, m1 * mapvc2); VERIFY_IS_APPROX(map1.adjoint() * v1.transpose(), m1.adjoint().reverse() * v1.transpose()); VERIFY_IS_APPROX(m1.adjoint() * mapv1.transpose(), m1.adjoint() * v1.reverse().transpose()); } // regression test MatrixType tmp = m1 * m1.adjoint() * s1; VERIFY_IS_APPROX(tmp, m1 * m1.adjoint() * s1); // regression test for bug 1343, assignment to arrays Array a1 = m1 * vc2; VERIFY_IS_APPROX(a1.matrix(), m1 * vc2); Array a2 = s1 * (m1 * vc2); VERIFY_IS_APPROX(a2.matrix(), s1 * m1 * vc2); Array a3 = v1 * m1; VERIFY_IS_APPROX(a3.matrix(), v1 * m1); Array a4 = m1 * m2.adjoint(); VERIFY_IS_APPROX(a4.matrix(), m1 * m2.adjoint()); } // Regression test for bug reported at http://forum.kde.org/viewtopic.php?f=74&t=96947 void mat_mat_scalar_scalar_product() { Eigen::Matrix2Xd dNdxy(2, 3); dNdxy << -0.5, 0.5, 0, -0.3, 0, 0.3; double det = 6.0, wt = 0.5; VERIFY_IS_APPROX(dNdxy.transpose() * dNdxy * det * wt, det * wt * dNdxy.transpose() * dNdxy); } template void zero_sized_objects(const MatrixType& m) { typedef typename MatrixType::Scalar Scalar; const int PacketSize = internal::packet_traits::size; const int PacketSize1 = PacketSize > 1 ? PacketSize - 1 : 1; Index rows = m.rows(); Index cols = m.cols(); { MatrixType res, a(rows, 0), b(0, cols); VERIFY_IS_APPROX((res = a * b), MatrixType::Zero(rows, cols)); VERIFY_IS_APPROX((res = a * a.transpose()), MatrixType::Zero(rows, rows)); VERIFY_IS_APPROX((res = b.transpose() * b), MatrixType::Zero(cols, cols)); VERIFY_IS_APPROX((res = b.transpose() * a.transpose()), MatrixType::Zero(cols, rows)); } { MatrixType res, a(rows, cols), b(cols, 0); res = a * b; VERIFY(res.rows() == rows && res.cols() == 0); b.resize(0, rows); res = b * a; VERIFY(res.rows() == 0 && res.cols() == cols); } { Matrix a; Matrix b; Matrix res; VERIFY_IS_APPROX((res = a * b), MatrixType::Zero(PacketSize, 1)); VERIFY_IS_APPROX((res = a.lazyProduct(b)), MatrixType::Zero(PacketSize, 1)); } { Matrix a; Matrix b; Matrix res; VERIFY_IS_APPROX((res = a * b), MatrixType::Zero(PacketSize1, 1)); VERIFY_IS_APPROX((res = a.lazyProduct(b)), MatrixType::Zero(PacketSize1, 1)); } { Matrix a(PacketSize, 0); Matrix b(0, 1); Matrix res; VERIFY_IS_APPROX((res = a * b), MatrixType::Zero(PacketSize, 1)); VERIFY_IS_APPROX((res = a.lazyProduct(b)), MatrixType::Zero(PacketSize, 1)); } { Matrix a(PacketSize1, 0); Matrix b(0, 1); Matrix res; VERIFY_IS_APPROX((res = a * b), MatrixType::Zero(PacketSize1, 1)); VERIFY_IS_APPROX((res = a.lazyProduct(b)), MatrixType::Zero(PacketSize1, 1)); } } template void bug_127() { // Bug 127 // // a product of the form lhs*rhs with // // lhs: // rows = 1, cols = 4 // RowsAtCompileTime = 1, ColsAtCompileTime = -1 // MaxRowsAtCompileTime = 1, MaxColsAtCompileTime = 5 // // rhs: // rows = 4, cols = 0 // RowsAtCompileTime = -1, ColsAtCompileTime = -1 // MaxRowsAtCompileTime = 5, MaxColsAtCompileTime = 1 // // was failing on a runtime assertion, because it had been mis-compiled as a dot product because Product.h was using // the max-sizes to detect size 1 indicating vectors, and that didn't account for 0-sized object with max-size 1. Matrix a(1, 4); Matrix b(4, 0); a* b; } template void bug_817() { ArrayXXf B = ArrayXXf::Random(10, 10), C; VectorXf x = VectorXf::Random(10); C = (x.transpose() * B.matrix()); B = (x.transpose() * B.matrix()); VERIFY_IS_APPROX(B, C); } template void unaligned_objects() { // Regression test for the bug reported here: // http://forum.kde.org/viewtopic.php?f=74&t=107541 // Recall the matrix*vector kernel avoid unaligned loads by loading two packets and then reassemble then. // There was a mistake in the computation of the valid range for fully unaligned objects: in some rare cases, // memory was read outside the allocated matrix memory. Though the values were not used, this might raise segfault. for (int m = 450; m < 460; ++m) { for (int n = 8; n < 12; ++n) { MatrixXf M(m, n); VectorXf v1(n), r1(500); RowVectorXf v2(m), r2(16); M.setRandom(); v1.setRandom(); v2.setRandom(); for (int o = 0; o < 4; ++o) { r1.segment(o, m).noalias() = M * v1; VERIFY_IS_APPROX(r1.segment(o, m), M * MatrixXf(v1)); r2.segment(o, n).noalias() = v2 * M; VERIFY_IS_APPROX(r2.segment(o, n), MatrixXf(v2) * M); } } } } template EIGEN_DONT_INLINE Index test_compute_block_size(Index m, Index n, Index k) { Index mc(m), nc(n), kc(k); internal::computeProductBlockingSizes(kc, mc, nc); return kc + mc + nc; } template Index compute_block_size() { Index ret = 0; // Zero-sized inputs: verify they compile and don't crash. ret += test_compute_block_size(0, 1, 1); ret += test_compute_block_size(1, 0, 1); ret += test_compute_block_size(1, 1, 0); ret += test_compute_block_size(0, 0, 1); ret += test_compute_block_size(0, 1, 0); ret += test_compute_block_size(1, 0, 0); ret += test_compute_block_size(0, 0, 0); // Sanity checks: blocking sizes must be positive and not exceed the original. { Index m = 200, n = 200, k = 200; Index mc = m, nc = n, kc = k; internal::computeProductBlockingSizes(kc, mc, nc); VERIFY(kc > 0 && kc <= k); VERIFY(mc > 0 && mc <= m); VERIFY(nc > 0 && nc <= n); } // With EIGEN_DEBUG_SMALL_PRODUCT_BLOCKS (l1=9KB, l2=32KB, l3=512KB), // large sizes must be actually blocked (not returned as-is). { Index m = 500, n = 500, k = 500; Index mc = m, nc = n, kc = k; internal::computeProductBlockingSizes(kc, mc, nc); VERIFY(kc < k); } return ret; } // Verify correctness of GEMM at sizes that require multiple blocking passes // under EIGEN_DEBUG_SMALL_PRODUCT_BLOCKS (l1=9KB, l2=32KB, l3=512KB). // The blocking early-return threshold is max(k,m,n) < 48, so sizes >= 48 // trigger actual multi-pass blocking with these tiny cache sizes. // Verifies GEMM against column-by-column GEMV (a different code path). template void test_small_block_correctness() { const int sizes[] = {48, 64, 96, 128, 200}; for (int si = 0; si < 5; ++si) { int n = sizes[si]; MatrixXd A = MatrixXd::Random(n, n); MatrixXd B = MatrixXd::Random(n, n); MatrixXd C(n, n); C.noalias() = A * B; MatrixXd Cref(n, n); for (int j = 0; j < n; ++j) Cref.col(j) = A * B.col(j); VERIFY_IS_APPROX(C, Cref); } // Non-square: exercise different blocking in m, n, k dimensions. { MatrixXd A = MatrixXd::Random(200, 64); MatrixXd B = MatrixXd::Random(64, 300); MatrixXd C(200, 300); C.noalias() = A * B; MatrixXd Cref(200, 300); for (int j = 0; j < 300; ++j) Cref.col(j) = A * B.col(j); VERIFY_IS_APPROX(C, Cref); } } template void aliasing_with_resize() { Index m = internal::random(10, 50); Index n = internal::random(10, 50); MatrixXd A, B, C(m, n), D(m, m); VectorXd a, b, c(n); C.setRandom(); D.setRandom(); c.setRandom(); double s = internal::random(1, 10); A = C; B = A * A.transpose(); A = A * A.transpose(); VERIFY_IS_APPROX(A, B); A = C; B = (A * A.transpose()) / s; A = (A * A.transpose()) / s; VERIFY_IS_APPROX(A, B); A = C; B = (A * A.transpose()) + D; A = (A * A.transpose()) + D; VERIFY_IS_APPROX(A, B); A = C; B = D + (A * A.transpose()); A = D + (A * A.transpose()); VERIFY_IS_APPROX(A, B); A = C; B = s * (A * A.transpose()); A = s * (A * A.transpose()); VERIFY_IS_APPROX(A, B); A = C; a = c; b = (A * a) / s; a = (A * a) / s; VERIFY_IS_APPROX(a, b); } template void bug_1308() { int n = 10; MatrixXd r(n, n); VectorXd v = VectorXd::Random(n); r = v * RowVectorXd::Ones(n); VERIFY_IS_APPROX(r, v.rowwise().replicate(n)); r = VectorXd::Ones(n) * v.transpose(); VERIFY_IS_APPROX(r, v.rowwise().replicate(n).transpose()); Matrix4d ones44 = Matrix4d::Ones(); Matrix4d m44 = Matrix4d::Ones() * Matrix4d::Ones(); VERIFY_IS_APPROX(m44, Matrix4d::Constant(4)); VERIFY_IS_APPROX(m44.noalias() = ones44 * Matrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(m44.noalias() = ones44.transpose() * Matrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(m44.noalias() = Matrix4d::Ones() * ones44, Matrix4d::Constant(4)); VERIFY_IS_APPROX(m44.noalias() = Matrix4d::Ones() * ones44.transpose(), Matrix4d::Constant(4)); typedef Matrix RMatrix4d; RMatrix4d r44 = Matrix4d::Ones() * Matrix4d::Ones(); VERIFY_IS_APPROX(r44, Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = ones44 * Matrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = ones44.transpose() * Matrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = Matrix4d::Ones() * ones44, Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = Matrix4d::Ones() * ones44.transpose(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = ones44 * RMatrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = ones44.transpose() * RMatrix4d::Ones(), Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = RMatrix4d::Ones() * ones44, Matrix4d::Constant(4)); VERIFY_IS_APPROX(r44.noalias() = RMatrix4d::Ones() * ones44.transpose(), Matrix4d::Constant(4)); // RowVector4d r4; m44.setOnes(); r44.setZero(); VERIFY_IS_APPROX(r44.noalias() += m44.row(0).transpose() * RowVector4d::Ones(), ones44); r44.setZero(); VERIFY_IS_APPROX(r44.noalias() += m44.col(0) * RowVector4d::Ones(), ones44); r44.setZero(); VERIFY_IS_APPROX(r44.noalias() += Vector4d::Ones() * m44.row(0), ones44); r44.setZero(); VERIFY_IS_APPROX(r44.noalias() += Vector4d::Ones() * m44.col(0).transpose(), ones44); } // Regression test for issue #3059: GEBP asm register constraints fail // for custom (non-vectorizable) scalar types. Type T has a non-trivial // destructor (making sizeof(T) > sizeof(double)), while type U is a // simple wrapper. Both must compile and produce correct products. namespace issue_3059 { class Ptr { public: ~Ptr() {} double* m_ptr = nullptr; }; class T { public: T() = default; T(double v) : m_value(v) {} friend T operator*(const T& a, const T& b) { return T(a.m_value * b.m_value); } T& operator*=(const T& o) { m_value *= o.m_value; return *this; } friend T operator/(const T& a, const T& b) { return T(a.m_value / b.m_value); } T& operator/=(const T& o) { m_value /= o.m_value; return *this; } friend T operator+(const T& a, const T& b) { return T(a.m_value + b.m_value); } T& operator+=(const T& o) { m_value += o.m_value; return *this; } friend T operator-(const T& a, const T& b) { return T(a.m_value - b.m_value); } T& operator-=(const T& o) { m_value -= o.m_value; return *this; } friend T operator-(const T& a) { return T(-a.m_value); } bool operator==(const T& o) const { return m_value == o.m_value; } bool operator<(const T& o) const { return m_value < o.m_value; } bool operator<=(const T& o) const { return m_value <= o.m_value; } bool operator>(const T& o) const { return m_value > o.m_value; } bool operator>=(const T& o) const { return m_value >= o.m_value; } bool operator!=(const T& o) const { return m_value != o.m_value; } double value() const { return m_value; } private: double m_value = 0.0; Ptr m_ptr; // Makes sizeof(T) > sizeof(double) }; T sqrt(const T& x) { return T(std::sqrt(x.value())); } T abs(const T& x) { return T(std::abs(x.value())); } T abs2(const T& x) { return T(x.value() * x.value()); } class U { public: U() = default; U(double v) : m_value(v) {} friend U operator*(const U& a, const U& b) { return U(a.m_value * b.m_value); } U& operator*=(const U& o) { m_value *= o.m_value; return *this; } friend U operator/(const U& a, const U& b) { return U(a.m_value / b.m_value); } U& operator/=(const U& o) { m_value /= o.m_value; return *this; } friend U operator+(const U& a, const U& b) { return U(a.m_value + b.m_value); } U& operator+=(const U& o) { m_value += o.m_value; return *this; } friend U operator-(const U& a, const U& b) { return U(a.m_value - b.m_value); } U& operator-=(const U& o) { m_value -= o.m_value; return *this; } friend U operator-(const U& a) { return U(-a.m_value); } bool operator==(const U& o) const { return m_value == o.m_value; } bool operator<(const U& o) const { return m_value < o.m_value; } bool operator<=(const U& o) const { return m_value <= o.m_value; } bool operator>(const U& o) const { return m_value > o.m_value; } bool operator>=(const U& o) const { return m_value >= o.m_value; } bool operator!=(const U& o) const { return m_value != o.m_value; } double value() const { return m_value; } private: double m_value = 0.0; }; U sqrt(const U& x) { return U(std::sqrt(x.value())); } U abs(const U& x) { return U(std::abs(x.value())); } U abs2(const U& x) { return U(x.value() * x.value()); } } // namespace issue_3059 namespace Eigen { template <> struct NumTraits : NumTraits { using Real = issue_3059::T; using NonInteger = issue_3059::T; using Nested = issue_3059::T; enum { IsComplex = 0, RequireInitialization = 1 }; }; template <> struct NumTraits : NumTraits { using Real = issue_3059::U; using NonInteger = issue_3059::U; using Nested = issue_3059::U; enum { IsComplex = 0, RequireInitialization = 0 }; }; } // namespace Eigen template void product_custom_scalar_types() { using namespace issue_3059; // Type T: has non-trivial destructor, sizeof(T) > sizeof(double) { Matrix A(4, 4), B(4, 4), C(4, 4); for (int i = 0; i < 4; ++i) for (int j = 0; j < 4; ++j) { A(i, j) = T(static_cast(i + 1)); B(i, j) = T(static_cast(j + 1)); } C.noalias() = A * B; // A*B: C(i,j) = sum_k (i+1)*(k+1) * ... no, A(i,k)=(i+1), B(k,j)=(j+1) // so C(i,j) = sum_k (i+1)*(j+1) = 4*(i+1)*(j+1) for (int i = 0; i < 4; ++i) for (int j = 0; j < 4; ++j) VERIFY(C(i, j) == T(4.0 * (i + 1) * (j + 1))); } // Type U: simple wrapper, sizeof(U) == sizeof(double) { Matrix A(4, 4), B(4, 4), C(4, 4); for (int i = 0; i < 4; ++i) for (int j = 0; j < 4; ++j) { A(i, j) = U(static_cast(i + 1)); B(i, j) = U(static_cast(j + 1)); } C.noalias() = A * B; for (int i = 0; i < 4; ++i) for (int j = 0; j < 4; ++j) VERIFY(C(i, j) == U(4.0 * (i + 1) * (j + 1))); } // Larger matrices to exercise GEBP blocking. { const int n = 33; Matrix A(n, n), B(n, n), C(n, n); for (int i = 0; i < n; ++i) for (int j = 0; j < n; ++j) { A(i, j) = U(static_cast((i * 7 + j * 3) % 13)); B(i, j) = U(static_cast((i * 5 + j * 11) % 17)); } C.noalias() = A * B; // Verify against explicit triple loop. for (int i = 0; i < n; ++i) for (int j = 0; j < n; ++j) { double sum = 0; for (int k = 0; k < n; ++k) sum += A(i, k).value() * B(k, j).value(); VERIFY(C(i, j) == U(sum)); } } } // Test complex GEMV with all conjugation combinations at sizes that // exercise full, half, and quarter packet code paths. // The GEMV kernels in GeneralMatrixVector.h use conj_helper at three // packet levels. The existing product_extra tests cover conjugation // but only at random sizes, never systematically at packet boundaries. template void gemv_complex_conjugate() { typedef std::complex Scf; typedef std::complex Scd; const Index PS_f = internal::packet_traits::size; const Index PS_d = internal::packet_traits::size; // Sizes chosen to exercise packet boundaries for both float and double. const Index sizes[] = {1, 2, 3, 4, 5, 7, 8, 9, 15, 16, 17, 31, 32, 33}; for (int si = 0; si < 14; ++si) { Index m = sizes[si]; // Test complex GEMV with all conjugation combos. { typedef Matrix Mat; typedef Matrix Vec; Mat A = Mat::Random(m, m); Vec v = Vec::Random(m); Vec res(m); // A * v (no conjugation) res.noalias() = A * v; VERIFY_IS_APPROX(res, (A.eval() * v.eval()).eval()); // A.conjugate() * v res.noalias() = A.conjugate() * v; VERIFY_IS_APPROX(res, (A.conjugate().eval() * v.eval()).eval()); // A * v.conjugate() res.noalias() = A * v.conjugate(); VERIFY_IS_APPROX(res, (A.eval() * v.conjugate().eval()).eval()); // A.conjugate() * v.conjugate() res.noalias() = A.conjugate() * v.conjugate(); VERIFY_IS_APPROX(res, (A.conjugate().eval() * v.conjugate().eval()).eval()); // A.adjoint() * v (transpose + conjugate of lhs) Vec res2(m); res2.noalias() = A.adjoint() * v; VERIFY_IS_APPROX(res2, (A.adjoint().eval() * v.eval()).eval()); // Row-major complex GEMV typedef Matrix RMat; RMat B = A; res.noalias() = B * v; VERIFY_IS_APPROX(res, (A.eval() * v.eval()).eval()); res.noalias() = B.conjugate() * v; VERIFY_IS_APPROX(res, (A.conjugate().eval() * v.eval()).eval()); } // Test complex GEMV with conjugation. { typedef Matrix Mat; typedef Matrix Vec; Mat A = Mat::Random(m, m); Vec v = Vec::Random(m); Vec res(m); res.noalias() = A.conjugate() * v; VERIFY_IS_APPROX(res, (A.conjugate().eval() * v.eval()).eval()); res.noalias() = A * v.conjugate(); VERIFY_IS_APPROX(res, (A.eval() * v.conjugate().eval()).eval()); // Non-square: wide matrix × vector (exercises different cols path). Mat C = Mat::Random(m, m + 3); Vec w = Vec::Random(m + 3); Vec res3(m); res3.noalias() = C.conjugate() * w; VERIFY_IS_APPROX(res3, (C.conjugate().eval() * w.eval()).eval()); } } (void)PS_f; (void)PS_d; } EIGEN_DECLARE_TEST(product_extra) { for (int i = 0; i < g_repeat; i++) { CALL_SUBTEST_1(product_extra( MatrixXf(internal::random(1, EIGEN_TEST_MAX_SIZE), internal::random(1, EIGEN_TEST_MAX_SIZE)))); CALL_SUBTEST_2(product_extra( MatrixXd(internal::random(1, EIGEN_TEST_MAX_SIZE), internal::random(1, EIGEN_TEST_MAX_SIZE)))); CALL_SUBTEST_2(mat_mat_scalar_scalar_product()); CALL_SUBTEST_3(product_extra(MatrixXcf(internal::random(1, EIGEN_TEST_MAX_SIZE / 2), internal::random(1, EIGEN_TEST_MAX_SIZE / 2)))); CALL_SUBTEST_4(product_extra(MatrixXcd(internal::random(1, EIGEN_TEST_MAX_SIZE / 2), internal::random(1, EIGEN_TEST_MAX_SIZE / 2)))); CALL_SUBTEST_1(zero_sized_objects( MatrixXf(internal::random(1, EIGEN_TEST_MAX_SIZE), internal::random(1, EIGEN_TEST_MAX_SIZE)))); } CALL_SUBTEST_5(bug_127<0>()); CALL_SUBTEST_5(bug_817<0>()); CALL_SUBTEST_5(bug_1308<0>()); CALL_SUBTEST_6(unaligned_objects<0>()); CALL_SUBTEST_7(compute_block_size()); CALL_SUBTEST_7(compute_block_size()); CALL_SUBTEST_7(compute_block_size >()); CALL_SUBTEST_8(aliasing_with_resize()); CALL_SUBTEST_9(product_custom_scalar_types<0>()); CALL_SUBTEST_10(test_small_block_correctness<0>()); // Complex GEMV conjugation at varied sizes (deterministic, outside g_repeat). CALL_SUBTEST_11(gemv_complex_conjugate<0>()); }