// This file is part of Eigen, a lightweight C++ template library // for linear algebra. // // Copyright (C) 2009-2010 Gael Guennebaud // // This Source Code Form is subject to the terms of the Mozilla // Public License v. 2.0. If a copy of the MPL was not distributed // with this file, You can obtain one at http://mozilla.org/MPL/2.0/. #include "common.h" /** ZHEMV performs the matrix-vector operation * * y := alpha*A*x + beta*y, * * where alpha and beta are scalars, x and y are n element vectors and * A is an n by n hermitian matrix. */ EIGEN_BLAS_FUNC(hemv) (const char *uplo, const int *n, const RealScalar *palpha, const RealScalar *pa, const int *lda, const RealScalar *px, const int *incx, const RealScalar *pbeta, RealScalar *py, const int *incy) { typedef void (*functype)(int, const Scalar *, int, const Scalar *, Scalar *, Scalar); static const functype func[2] = { // array index: UP (Eigen::internal::selfadjoint_matrix_vector_product::run), // array index: LO (Eigen::internal::selfadjoint_matrix_vector_product::run), }; const Scalar *a = reinterpret_cast(pa); const Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); Scalar alpha = *reinterpret_cast(palpha); Scalar beta = *reinterpret_cast(pbeta); // check arguments int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*lda < std::max(1, *n)) info = 5; else if (*incx == 0) info = 7; else if (*incy == 0) info = 10; if (info) return xerbla_(SCALAR_SUFFIX_UP "HEMV ", &info); if (*n == 0) return; const Scalar *actual_x = get_compact_vector(x, *n, *incx); Scalar *actual_y = get_compact_vector(y, *n, *incy); if (beta != Scalar(1)) { if (beta == Scalar(0)) make_vector(actual_y, *n).setZero(); else make_vector(actual_y, *n) *= beta; } if (alpha != Scalar(0)) { int code = UPLO(*uplo); if (code >= 2 || func[code] == 0) return; func[code](*n, a, *lda, actual_x, actual_y, alpha); } if (actual_x != x) delete[] actual_x; if (actual_y != y) delete[] copy_back(actual_y, y, *n, *incy); } /** HBMV performs the matrix-vector operation * * y := alpha*A*x + beta*y, * * where alpha and beta are scalars, x and y are n element vectors and * A is an n by n hermitian band matrix, with k super-diagonals. * Diagonal elements are real; off-diagonal contributions use conjugation. */ EIGEN_BLAS_FUNC(hbmv) (char *uplo, int *n, int *k, RealScalar *palpha, RealScalar *pa, int *lda, RealScalar *px, int *incx, RealScalar *pbeta, RealScalar *py, int *incy) { const Scalar alpha = *reinterpret_cast(palpha); const Scalar beta = *reinterpret_cast(pbeta); const Scalar *a = reinterpret_cast(pa); const Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*k < 0) info = 3; else if (*lda < *k + 1) info = 6; else if (*incx == 0) info = 8; else if (*incy == 0) info = 11; if (info) return xerbla_(SCALAR_SUFFIX_UP "HBMV ", &info); if (*n == 0 || (alpha == Scalar(0) && beta == Scalar(1))) return; const Scalar *actual_x = get_compact_vector(x, *n, *incx); Scalar *actual_y = get_compact_vector(y, *n, *incy); // First form y := beta*y. if (beta != Scalar(1)) { if (beta == Scalar(0)) make_vector(actual_y, *n).setZero(); else make_vector(actual_y, *n) *= beta; } if (alpha == Scalar(0)) { if (actual_x != x) delete[] actual_x; if (actual_y != y) delete[] copy_back(actual_y, y, *n, *incy); return; } if (*k >= 8) { // Vectorized path: use Eigen Map segments for the inner band operations. ConstMatrixType band(a, *k + 1, *n, *lda); if (UPLO(*uplo) == UP) { for (int j = 0; j < *n; ++j) { int start = std::max(0, j - *k); int len = j - start; int offset = *k - (j - start); Scalar temp1 = alpha * actual_x[j]; actual_y[j] += Scalar(Eigen::numext::real(band(*k, j))) * temp1; if (len > 0) { make_vector(actual_y + start, len) += temp1 * band.col(j).segment(offset, len); actual_y[j] += alpha * band.col(j).segment(offset, len).dot(make_vector(actual_x + start, len)); } } } else { for (int j = 0; j < *n; ++j) { int len = std::min(*n - 1, j + *k) - j; Scalar temp1 = alpha * actual_x[j]; actual_y[j] += Scalar(Eigen::numext::real(band(0, j))) * temp1; if (len > 0) { make_vector(actual_y + j + 1, len) += temp1 * band.col(j).segment(1, len); actual_y[j] += alpha * band.col(j).segment(1, len).dot(make_vector(actual_x + j + 1, len)); } } } } else { // Scalar path: for narrow bandwidth, avoid Map overhead. if (UPLO(*uplo) == UP) { for (int j = 0; j < *n; ++j) { Scalar temp1 = alpha * actual_x[j]; Scalar temp2 = Scalar(0); for (int i = std::max(0, j - *k); i < j; ++i) { Scalar aij = a[(*k + i - j) + j * *lda]; actual_y[i] += temp1 * aij; temp2 += Eigen::numext::conj(aij) * actual_x[i]; } actual_y[j] += Scalar(Eigen::numext::real(a[*k + j * *lda])) * temp1 + alpha * temp2; } } else { for (int j = 0; j < *n; ++j) { Scalar temp1 = alpha * actual_x[j]; Scalar temp2 = Scalar(0); actual_y[j] += Scalar(Eigen::numext::real(a[j * *lda])) * temp1; for (int i = j + 1; i <= std::min(*n - 1, j + *k); ++i) { Scalar aij = a[(i - j) + j * *lda]; actual_y[i] += temp1 * aij; temp2 += Eigen::numext::conj(aij) * actual_x[i]; } actual_y[j] += alpha * temp2; } } } if (actual_x != x) delete[] actual_x; if (actual_y != y) delete[] copy_back(actual_y, y, *n, *incy); } /** HPMV performs the matrix-vector operation * * y := alpha*A*x + beta*y, * * where alpha and beta are scalars, x and y are n element vectors and * A is an n by n hermitian matrix, supplied in packed form. * Diagonal elements are real; off-diagonal contributions use conjugation. */ EIGEN_BLAS_FUNC(hpmv) (char *uplo, int *n, RealScalar *palpha, RealScalar *pap, RealScalar *px, int *incx, RealScalar *pbeta, RealScalar *py, int *incy) { const Scalar alpha = *reinterpret_cast(palpha); const Scalar beta = *reinterpret_cast(pbeta); const Scalar *ap = reinterpret_cast(pap); const Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 6; else if (*incy == 0) info = 9; if (info) return xerbla_(SCALAR_SUFFIX_UP "HPMV ", &info); if (*n == 0 || (alpha == Scalar(0) && beta == Scalar(1))) return; const Scalar *actual_x = get_compact_vector(x, *n, *incx); Scalar *actual_y = get_compact_vector(y, *n, *incy); // First form y := beta*y. if (beta != Scalar(1)) { if (beta == Scalar(0)) make_vector(actual_y, *n).setZero(); else make_vector(actual_y, *n) *= beta; } if (alpha == Scalar(0)) { if (actual_x != x) delete[] actual_x; if (actual_y != y) delete[] copy_back(actual_y, y, *n, *incy); return; } int kk = 0; if (UPLO(*uplo) == UP) { // Upper triangle packed: column j occupies ap[kk..kk+j]. for (int j = 0; j < *n; ++j) { Scalar temp1 = alpha * actual_x[j]; // Diagonal is real. actual_y[j] += Scalar(Eigen::numext::real(ap[kk + j])) * temp1; if (j > 0) { make_vector(actual_y, j) += temp1 * make_vector(ap + kk, j); actual_y[j] += alpha * make_vector(ap + kk, j).dot(make_vector(actual_x, j)); } kk += j + 1; } } else { // Lower triangle packed: column j occupies ap[kk..kk+(n-j-1)]. for (int j = 0; j < *n; ++j) { int len = *n - j - 1; Scalar temp1 = alpha * actual_x[j]; // Diagonal is real. actual_y[j] += Scalar(Eigen::numext::real(ap[kk])) * temp1; if (len > 0) { make_vector(actual_y + j + 1, len) += temp1 * make_vector(ap + kk + 1, len); actual_y[j] += alpha * make_vector(ap + kk + 1, len).dot(make_vector(actual_x + j + 1, len)); } kk += *n - j; } } if (actual_x != x) delete[] actual_x; if (actual_y != y) delete[] copy_back(actual_y, y, *n, *incy); } /** ZHPR performs the hermitian rank 1 operation * * A := alpha*x*conjg( x' ) + A, * * where alpha is a real scalar, x is an n element vector and A is an * n by n hermitian matrix, supplied in packed form. */ EIGEN_BLAS_FUNC(hpr)(char *uplo, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *pap) { typedef void (*functype)(int, Scalar *, const Scalar *, RealScalar); static const functype func[2] = { // array index: UP (Eigen::internal::selfadjoint_packed_rank1_update::run), // array index: LO (Eigen::internal::selfadjoint_packed_rank1_update::run), }; Scalar *x = reinterpret_cast(px); Scalar *ap = reinterpret_cast(pap); RealScalar alpha = *palpha; int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; if (info) return xerbla_(SCALAR_SUFFIX_UP "HPR ", &info); if (alpha == Scalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *n, *incx); int code = UPLO(*uplo); if (code >= 2 || func[code] == 0) return; func[code](*n, ap, x_cpy, alpha); if (x_cpy != x) delete[] x_cpy; } /** ZHPR2 performs the hermitian rank 2 operation * * A := alpha*x*conjg( y' ) + conjg( alpha )*y*conjg( x' ) + A, * * where alpha is a scalar, x and y are n element vectors and A is an * n by n hermitian matrix, supplied in packed form. */ EIGEN_BLAS_FUNC(hpr2) (char *uplo, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *py, int *incy, RealScalar *pap) { typedef void (*functype)(int, Scalar *, const Scalar *, const Scalar *, Scalar); static const functype func[2] = { // array index: UP (Eigen::internal::packed_rank2_update_selector::run), // array index: LO (Eigen::internal::packed_rank2_update_selector::run), }; Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); Scalar *ap = reinterpret_cast(pap); Scalar alpha = *reinterpret_cast(palpha); int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; else if (*incy == 0) info = 7; if (info) return xerbla_(SCALAR_SUFFIX_UP "HPR2 ", &info); if (alpha == Scalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *n, *incx); Scalar *y_cpy = get_compact_vector(y, *n, *incy); int code = UPLO(*uplo); if (code >= 2 || func[code] == 0) return; func[code](*n, ap, x_cpy, y_cpy, alpha); if (x_cpy != x) delete[] x_cpy; if (y_cpy != y) delete[] y_cpy; } /** ZHER performs the hermitian rank 1 operation * * A := alpha*x*conjg( x' ) + A, * * where alpha is a real scalar, x is an n element vector and A is an * n by n hermitian matrix. */ EIGEN_BLAS_FUNC(her)(char *uplo, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *pa, int *lda) { typedef void (*functype)(int, Scalar *, int, const Scalar *, const Scalar *, const Scalar &); static const functype func[2] = { // array index: UP (Eigen::selfadjoint_rank1_update::run), // array index: LO (Eigen::selfadjoint_rank1_update::run), }; Scalar *x = reinterpret_cast(px); Scalar *a = reinterpret_cast(pa); RealScalar alpha = *reinterpret_cast(palpha); int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; else if (*lda < std::max(1, *n)) info = 7; if (info) return xerbla_(SCALAR_SUFFIX_UP "HER ", &info); if (alpha == RealScalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *n, *incx); int code = UPLO(*uplo); if (code >= 2 || func[code] == 0) return; func[code](*n, a, *lda, x_cpy, x_cpy, alpha); matrix(a, *n, *n, *lda).diagonal().imag().setZero(); if (x_cpy != x) delete[] x_cpy; } /** ZHER2 performs the hermitian rank 2 operation * * A := alpha*x*conjg( y' ) + conjg( alpha )*y*conjg( x' ) + A, * * where alpha is a scalar, x and y are n element vectors and A is an n * by n hermitian matrix. */ EIGEN_BLAS_FUNC(her2) (char *uplo, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *py, int *incy, RealScalar *pa, int *lda) { typedef void (*functype)(int, Scalar *, int, const Scalar *, const Scalar *, Scalar); static const functype func[2] = { // array index: UP (Eigen::internal::rank2_update_selector::run), // array index: LO (Eigen::internal::rank2_update_selector::run), }; Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); Scalar *a = reinterpret_cast(pa); Scalar alpha = *reinterpret_cast(palpha); int info = 0; if (UPLO(*uplo) == INVALID) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; else if (*incy == 0) info = 7; else if (*lda < std::max(1, *n)) info = 9; if (info) return xerbla_(SCALAR_SUFFIX_UP "HER2 ", &info); if (alpha == Scalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *n, *incx); Scalar *y_cpy = get_compact_vector(y, *n, *incy); int code = UPLO(*uplo); if (code >= 2 || func[code] == 0) return; func[code](*n, a, *lda, x_cpy, y_cpy, alpha); matrix(a, *n, *n, *lda).diagonal().imag().setZero(); if (x_cpy != x) delete[] x_cpy; if (y_cpy != y) delete[] y_cpy; } /** ZGERU performs the rank 1 operation * * A := alpha*x*y' + A, * * where alpha is a scalar, x is an m element vector, y is an n element * vector and A is an m by n matrix. */ EIGEN_BLAS_FUNC(geru) (int *m, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *py, int *incy, RealScalar *pa, int *lda) { Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); Scalar *a = reinterpret_cast(pa); Scalar alpha = *reinterpret_cast(palpha); int info = 0; if (*m < 0) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; else if (*incy == 0) info = 7; else if (*lda < std::max(1, *m)) info = 9; if (info) return xerbla_(SCALAR_SUFFIX_UP "GERU ", &info); if (alpha == Scalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *m, *incx); Scalar *y_cpy = get_compact_vector(y, *n, *incy); Eigen::internal::general_rank1_update::run(*m, *n, a, *lda, x_cpy, y_cpy, alpha); if (x_cpy != x) delete[] x_cpy; if (y_cpy != y) delete[] y_cpy; } /** ZGERC performs the rank 1 operation * * A := alpha*x*conjg( y' ) + A, * * where alpha is a scalar, x is an m element vector, y is an n element * vector and A is an m by n matrix. */ EIGEN_BLAS_FUNC(gerc) (int *m, int *n, RealScalar *palpha, RealScalar *px, int *incx, RealScalar *py, int *incy, RealScalar *pa, int *lda) { Scalar *x = reinterpret_cast(px); Scalar *y = reinterpret_cast(py); Scalar *a = reinterpret_cast(pa); Scalar alpha = *reinterpret_cast(palpha); int info = 0; if (*m < 0) info = 1; else if (*n < 0) info = 2; else if (*incx == 0) info = 5; else if (*incy == 0) info = 7; else if (*lda < std::max(1, *m)) info = 9; if (info) return xerbla_(SCALAR_SUFFIX_UP "GERC ", &info); if (alpha == Scalar(0)) return; Scalar *x_cpy = get_compact_vector(x, *m, *incx); Scalar *y_cpy = get_compact_vector(y, *n, *incy); Eigen::internal::general_rank1_update::run(*m, *n, a, *lda, x_cpy, y_cpy, alpha); if (x_cpy != x) delete[] x_cpy; if (y_cpy != y) delete[] y_cpy; }