#ifndef SCITBX_MATRIX_HOUSEHOLDER_H
#define SCITBX_MATRIX_HOUSEHOLDER_H

// NOTE(review): this copy of the file is damaged. Text that originally sat
// between a '<' immediately followed by an identifier and the next '>' appears
// to have been stripped. Consequences visible below:
//   - the fifteen #include directives have lost their header names;
//   - every `template` keyword has lost its parameter list, and most template
//     arguments (af::ref, af::versa, std::vector, ...) are gone;
//   - loops written as `i<n` are cut at the '<', together with everything up
//     to the next '>' (often the rest of the function and the start of the
//     next one).
// Each such spot is flagged with NOTE(review). Restore the missing text from
// the upstream file before attempting to compile.
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include
#include

namespace scitbx { namespace matrix { namespace householder {

// Tag types used to select among the reflection constructors below, which
// size the vectors v and w differently for each tag.
struct applied_on_left_tag {};
struct applied_on_right_tag {};
struct applied_on_left_and_right_tag {};

// Values accepted as the reflection_order argument of
// reflection::accumulate_factored_form_in_rows.
enum { product_in_row_order, product_in_reverse_row_order };

/// Householder reflection P = I - beta v v^T
/** Reference: Golub and Van Loan 5.1.2 to 5.1.4

    Implementation note: only row-major storage is supported and this code
    is optimised accordingly (only relevant for big matrices).
 */
// NOTE(review): template parameter list stripped; the typedef of FloatType
// below suggests a single type parameter named FloatType -- confirm.
template struct reflection {
  typedef FloatType scalar_t;
  typedef af::c_grid<2> dim;
  // NOTE(review): the template arguments of the five typedefs below were
  // stripped.
  typedef af::versa matrix_t;
  typedef af::ref matrix_ref_t;
  typedef af::const_ref matrix_const_ref_t;
  typedef af::versa symmetric_matrix_packed_u_t;
  typedef af::ref symmetric_matrix_packed_u_ref_t;

  /// Normalisation of the Householder vector
  scalar_t beta;

  /// Normalisation of the vector x passed to the constructor
  scalar_t norm_x;

  /// Essential part of the Householder vector
  // NOTE(review): element type of the vector stripped.
  std::vector v;

  /// Working vector for applying the Householder reflection to a matrix
  // NOTE(review): element type of the vector stripped.
  std::vector w;

  /** @name Constructors
      One may think that the working array v should be of size n-1 for a
      problem of size n since the real vector v is actually
      [ 1 v[0] v[1] ... ] but we actually use transformations in place in
      several places where v is loaded with [ x[0] x[1] ... ] and then
      transformed to [ 1 v[0] v[1] ... ]. Hence the need for one more element.
  */
  //@{
  /// Size v after x and immediately build the reflection zeroing x(1:)
  // NOTE(review): template parameter list and af::ref arguments stripped.
  template reflection(af::ref const &x) : v(x.size()) { zero_vector(x); }

  /// Only allocate v, with n elements; w is left empty
  reflection(int n) : v(n) {}

  /// Allocate storage for reflections applied on the left of an m x n matrix
  /** v gets m elements; w gets n elements, or max(m,n) if accumulate is true.
   */
  reflection(int m, int n, applied_on_left_tag, bool accumulate)
    : v(m), w(accumulate ? std::max(m,n) : n)
  {}

  /// Allocate storage for reflections applied on the right of an m x n matrix
  /** v gets n elements; w gets m elements, or max(m,n) if accumulate is true.
   */
  reflection(int m, int n, applied_on_right_tag, bool accumulate)
    : v(n), w(accumulate ? std::max(m,n) : m)
  {}

  /// Allocate storage for reflections applied on both sides
  /** Both v and w get max(m,n) elements. */
  reflection(int m, int n, applied_on_left_and_right_tag)
    : v(std::max(m,n)), w(std::max(m,n))
  {}
  //@}

  /// Construct the Householder reflection P s.t. Px = ||x||_2 e_1
  /** If requested, x(0) is overwritten with the first element of Px
      whereas x(1:) is overwritten with the essential part of
      the Householder vector.

      Since operator() is used to access the elements of x, that code works
      even if x is stored with a stride different from 1.

      v is filled with the essential part of the Householder vector.

      Reference: Algorithm 5.1.1
      (with the substitution sigma -> sqrt(sigma))
   */
  // NOTE(review): template parameter list and af::ref arguments stripped.
  template void zero_vector(af::ref const &x, bool overwrite=true) {
    using namespace math::accumulator;

    // compute beta and v(0)
    int n = x.size();
    // NOTE(review): template argument of norm_accumulator stripped.
    norm_accumulator norm_accu;
    // NOTE(review): text lost here. The loop below is cut at its condition;
    // the remainder of zero_vector is missing, and the surviving tail
    // `(&v[0], n), false); }` seems to belong to a later definition that
    // forwards a view of v to zero_vector -- confirm against upstream.
    for (int i=1; i(&v[0], n), false); }

  /// Replace A(i:, j:) by PA(i:, j:)
  /** Uses v as the essential part of the Householder vector (its implicit
      leading 1 acts on row i) and w as scratch space for n-j values.
   */
  void apply_on_left_to_lower_right_block(matrix_ref_t const &a, int i, int j) {
    int m = a.n_rows(), n=a.n_columns();

    // w = beta A(i:, j:)^T v
    // Row i is multiplied by the implicit leading 1 of the Householder vector
    for (int jj=j; jj < n; ++jj) w[jj-j] = a(i,jj);
    // Remaining rows, traversed row by row
    for (int ii=i+1; ii < m; ++ii) for (int jj=j; jj < n; ++jj) {
      w[jj-j] += a(ii,jj)*v[ii-i-1];
    }
    for (int k=0; k < n-j; ++k) w[k] *= beta;

    // A(i:, j:) -= v(i:) w(j:)^T
    for (int jj=j; jj < n; ++jj) a(i,jj) -= w[jj-j];
    for (int ii=i+1; ii < m; ++ii) {
      for (int jj=j; jj < n; ++jj) a(ii,jj) -= v[ii-i-1]*w[jj-j];
    }
  }

  /// Replace A(i:, j:) by A(i:, j:)P
  /** Uses v as the essential part of the Householder vector (its implicit
      leading 1 acts on column j) and w as scratch space for m-i values.
   */
  void apply_on_right_to_lower_right_block(matrix_ref_t const &a, int i, int j) {
    int m = a.n_rows(), n=a.n_columns();

    // w = beta A(i:, j:) v
    for (int ii=i; ii < m; ++ii) {
      // Column j is multiplied by the implicit leading 1
      w[ii-i] = a(ii, j);
      for (int jj=j+1; jj < n; ++jj) w[ii-i] += a(ii,jj)*v[jj-j-1];
      w[ii-i] *= beta;
    }

    // A(i:, j:) -= w(i:) v(j:)^T
    for (int ii=i; ii < m; ++ii) {
      a(ii,j) -= w[ii-i];
      for (int jj=j+1; jj < n; ++jj) a(ii,jj) -= w[ii-i]*v[jj-j-1];
    }
  }

  /// Replace A(i:, i:) by PA(i:,i:)P for a symmetric matrix A
  void apply_to_lower_right_block(symmetric_matrix_packed_u_ref_t const &a_,
                                  int i0)
  {
    int n = a_.accessor().n;
    // Raw pointer to the diagonal element (i0,i0) of the packed storage
    scalar_t *a0 = &a_(i0,i0);

    // w = beta A(i:,i:) v
    scalar_t *a = a0;
    w[0] = *a++;
    // NOTE(review): text lost here. The loop below is cut at its condition;
    // the rest of apply_to_lower_right_block and the beginning of the next
    // definition (documentation, name and leading parameters) are missing.
    // Callers further down invoke the next definition as
    // accumulate_factored_form_in_columns(q, a, beta[, off_diag]).
    for (int k=i0+1; k const &beta, int const off_diag=0) {
    int m = a.n_rows();
    SCITBX_ASSERT(q.n_rows() == m)(q.n_rows())(m);

    // A = Q x ...
    q.set_identity(false); // Q may be rectangular
    // Apply the reflections to q from the last one to the first one
    for (int j=beta.size()-1; j >= 0; --j) {
      // Load v from column j of a, below row j + off_diag
      for (int i=j + off_diag + 1; i < m; ++i) v[i - j - off_diag - 1] = a(i,j);
      this->beta = beta[j];
      apply_on_left_to_lower_right_block(q, j+off_diag, j+off_diag);
    }
  }

  /// Accumulate the k Householder reflection stored in factored form in the
  /// columns of the matrix a, in place into a
  /** The first n columns of the product H(0) H(1) .. H(k-1) are stored
      in the first n columns of \c a

      Reference: LAPACK DORG2R
   */
  // NOTE(review): template argument of af::const_ref stripped.
  void accumulate_in_place_factored_form_in_columns(
    matrix_ref_t const &a, af::const_ref const &beta)
  {
    int m = a.n_rows(), n = a.n_columns();
    // Don't forget Q and A occupy the same memory locations!
    if (m <= n) {
      // the last reduced column of A does not contain any Householder vector
      // and it will therefore not be touched by the coming loop
      // NOTE(review): text lost here. The loop below is cut at its condition;
      // its body, the end of this if-block and the header of the main loop
      // over j (which runs downwards, judging by the surviving
      // `= 0; --j)`) are missing.
      for (int i=0; i= 0; --j) {
      // A(j+1:, j) starts as the essential part of the vector of H(j)
      // Q(j:, j) starts as [ 1 0 ... 0 ]^T
      // Copy the former to v and perform Q(j:, j) = H(j) Q(j:, j)
      // in one loop.
      for (int i=j+1; i < m; ++i) {
        v[i-j-1] = a(i,j);
        a(i,j) *= -beta[j];
      }
      this->beta = beta[j];
      a(j,j) = 1 - beta[j];

      // Q(j:, j+1:) = H(j) Q(j:, j+1:)
      if (j < n-1) apply_on_left_to_lower_right_block(a, j, j+1);

      // Q(:j, j) = 0
      // NOTE(review): text lost here. The loop below is cut at its condition;
      // the end of this function and the beginning of the next definition
      // (documentation, name and leading parameters) are missing. Callers
      // further down invoke the next definition as
      // accumulate_factored_form_in_rows(q, a, beta, order[, off_diag]).
      for (int i=0; i const &beta, int reflection_order, int const off_diag=0) {
    int n = a.n_columns();
    SCITBX_ASSERT(   reflection_order == product_in_row_order
                  || reflection_order == product_in_reverse_row_order);
    // The dimension of q that must match n depends on the requested order
    switch (reflection_order) {
      case product_in_row_order:
        // the reduction of A is done by A -> A Q
        SCITBX_ASSERT(q.n_rows() == n)(q.n_rows())(n);
        break;
      case product_in_reverse_row_order:
        // the reduction of A is done by A -> A Q^T
        SCITBX_ASSERT(q.n_columns() == n)(q.n_columns())(n);
        break;
    }

    q.set_identity(false); // Q may be rectangular
    // Apply the reflections to q from the last one to the first one
    for (int i=beta.size()-1; i >= 0; --i) {
      // Load v from row i of a, right of column i + off_diag
      for (int j=i + off_diag + 1; j < n; ++j) v[j - i - off_diag - 1] = a(i,j);
      this->beta = beta[i];
      switch (reflection_order) {
        case product_in_row_order:
          apply_on_left_to_lower_right_block(q, i+off_diag, i+off_diag);
          break;
        case product_in_reverse_row_order:
          apply_on_right_to_lower_right_block(q, i+off_diag, i+off_diag);
          break;
      }
    }
  }

  /// Accumulate the k Householder reflection stored in factored form in the
  /// rows of the matrix a, in place into a
  /** The first m rows of the product H(k-1) H(k-2) .. H(0) are stored
      in the first m rows of \c a
   */
  // NOTE(review): template argument of af::const_ref stripped.
  void accumulate_in_place_factored_form_in_rows(
    matrix_ref_t const &a, af::const_ref const &beta)
  {
    int m = a.n_rows(), n = a.n_columns();
    // Don't forget Q and A occupy the same memory locations!
    if (m >= n) {
      // the last reduced row of A does not contain any Householder vector
      // and it will therefore not be touched by the coming loop
      // NOTE(review): text lost here. The loop below is cut at its condition;
      // its body, the end of this if-block and the header of the main loop
      // over i (which runs downwards, judging by the surviving
      // `= 0; --i)`) are missing.
      for (int j=0; j= 0; --i) {
      // A(i, i+1:) starts as the essential part of the vector of H(i)
      // Q(i, i:) starts as [ 1 0 ... 0 ]^T
      // Copy the former to v and perform Q(i, i:) = H(i) Q(i, i:)
      // in one loop.
      for (int j=i+1; j < n; ++j) {
        v[j-i-1] = a(i,j);
        a(i,j) *= -beta[i];
      }
      this->beta = beta[i];
      a(i,i) = 1 - beta[i];

      // Q(i+1:, i:) = Q(i+1:, i:) H(i)
      if (i < m-1) apply_on_right_to_lower_right_block(a, i+1, i);

      // Q(i, :i) = 0
      // NOTE(review): text lost here. The loop below is cut at its condition;
      // the end of this function and the opening of the documentation
      // comment of accumulate_random_normal_matrix are missing. What follows
      // the truncated `j` up to the closing `*/` is the surviving tail of
      // that documentation comment, kept verbatim.
      for (int j=0; j n, then Q only consists of the first n columns of a random
      normal matrix;
      - if m < n, then Q only consists of the first m rows of a random
      normal matrix.

      The distribution is uniform on the set of normal matrices.
      (For mathematically minded people, it is the Haar measure).

      Reference:
      G.W. Stewart, The efficient generation of random orthogonal
      matrices with an application to condition estimators, SIAM Journal on
      Numerical Analysis 17 (1980), no. 3, 403-409.

      This is the method used in LAPACK test tool DLAGGE for example.
   */
  // NOTE(review): template parameter list and the template arguments of
  // boost::variate_generator stripped.
  template void accumulate_random_normal_matrix(
    boost::variate_generator > &normal,
    matrix_ref_t const &q)
  {
    int m = q.n_rows(), n = q.n_columns();
    q.set_identity(false);
    for (int i=std::min(m, n) - 1; i >= 0; --i) {
      if (i < n-1) {
        // NOTE(review): text lost here. The loop below is cut at its
        // condition; the rest of this function and the documentation and
        // template header of the next one are missing.
        for (int k=0; k void accumulate_random_matrix_with_singular_values(
    boost::variate_generator > &normal,
    af::const_ref const &sigma,
    matrix_ref_t const &a)
  {
    int m = a.n_rows(), n = a.n_columns();
    // Start from the matrix carrying sigma on its diagonal
    a.set_diagonal(sigma, false);
    for (int i=std::min(m, n) - 1; i >= 0; --i) {
      if (i < m-1) {
        // NOTE(review): text lost here. The loop below is cut at its
        // condition; the rest of this function and the documentation and
        // template header of the next one are missing.
        for (int k=0; k void accumulate_random_symmetric_matrix_with_eigenvalues(
    boost::variate_generator > &normal,
    af::const_ref const &lambda,
    symmetric_matrix_packed_u_ref_t const &a)
  {
    int n = a.n_columns();
    // Start from the matrix carrying lambda on its diagonal
    a.set_diagonal(lambda);
    for (int i=n-2; i>=0; --i) {
      // NOTE(review): text lost here. The loop below is cut at its
      // condition; the rest of this function, the closing of struct
      // reflection, and the documentation and template header of
      // qr_decomposition are missing.
      for (int k=0; k struct qr_decomposition {
  typedef FloatType scalar_t;
  typedef af::c_grid<2> dim;
  // NOTE(review): template arguments of the two typedefs below stripped.
  typedef af::versa matrix_t;
  typedef af::ref matrix_ref_t;

  /// Whether the working storage was sized to allow accumulating Q later
  bool may_accumulate_q;
  /// The matrix being factorised, overwritten in place
  matrix_ref_t a;
  /// Reflection object reused for every column
  // NOTE(review): template arguments of reflection and std::vector stripped.
  reflection p;
  /// Normalisations of the successive Householder vectors
  std::vector beta;

  /// Construct the QR decomposition of the m x n matrix A in place.
  /** The lower diagonal part of R is zero and its non-zero part is stored
      above and on the diagonal of A.
      Q is a product of Householder reflections whose vectors are
      stored below the diagonal of A.

      The argument may_accumulate_q_ must be set to true if Q is to be
      accumulated later.
   */
  qr_decomposition(matrix_ref_t const &a_, bool may_accumulate_q_=true)
    : a(a_), may_accumulate_q(may_accumulate_q_),
      p(a.n_rows(), a.n_columns(), applied_on_left_tag(), may_accumulate_q)
  {
    // k is the number of reflections: n if m > n, m-1 otherwise
    int m = a.n_rows(), n = a.n_columns(), k=(m > n ? n : m-1);
    beta.reserve(k);
    // NOTE(review): text lost here. The loop below is cut at its condition;
    // the rest of the constructor and the opening of the documentation
    // comment of q() are missing. What follows the truncated `j` up to the
    // closing `*/` is the surviving tail of that comment, kept verbatim.
    // NOTE(review): with dim(m, thin ? min(m,n) : m) below, the thin result
    // differs from the full one only when m > n, so the surviving
    // "m <= n" wording looks inverted -- confirm against upstream.
    for (int j=0; j= n): Q is m x n and R is n x n

      If \c thin is true, then the thin q is returned if m <= n and
      the full Q otherwise.
      If \c thin is false, the full Q is returned.
   */
  matrix_t q(bool thin=true) {
    int m = a.n_rows(), n = a.n_columns();
    SCITBX_ASSERT(may_accumulate_q);
    // Non-owning view of the stored normalisations
    // NOTE(review): template argument of af::const_ref stripped.
    af::const_ref beta_(&beta[0], beta.size());
    matrix_t q(dim(m, thin ? std::min(m,n) : m), af::init_functor_null());
    p.accumulate_factored_form_in_columns(q.ref(), a, beta_);
    return q;
  }

  /// Accumulate the thin Q inside A in-place
  /** R is therefore lost. Requires m >= n and may_accumulate_q. */
  void accumulate_q_in_place() {
    int m = a.n_rows(), n = a.n_columns();
    SCITBX_ASSERT(may_accumulate_q);
    SCITBX_ASSERT(m >= n);
    // NOTE(review): template argument of af::const_ref stripped.
    af::const_ref beta_(&beta[0], beta.size());
    p.accumulate_in_place_factored_form_in_columns(a, beta_);
  }
};


/// Householder LQ decomposition
// NOTE(review): template parameter list stripped.
template struct lq_decomposition {
  typedef FloatType scalar_t;
  typedef af::c_grid<2> dim;
  // NOTE(review): template arguments of the two typedefs below stripped.
  typedef af::versa matrix_t;
  typedef af::ref matrix_ref_t;

  /// Whether the working storage was sized to allow accumulating Q later
  bool may_accumulate_q;
  /// The matrix being factorised, overwritten in place
  matrix_ref_t a;
  /// Reflection object reused for every row
  // NOTE(review): template arguments of reflection and std::vector stripped.
  reflection p;
  /// Normalisations of the successive Householder vectors
  std::vector beta;

  /// Construct the LQ decomposition of A
  /** The upper diagonal part of L is zero and its non-zero part is stored
      below and on the diagonal of A.
      Q is a product of Householder reflections whose vectors are
      stored above the diagonal of A.

      The argument may_accumulate_q_ must be set to true if Q is to be
      accumulated later.
   */
  lq_decomposition(matrix_ref_t const &a_, bool may_accumulate_q_=true)
    : a(a_), may_accumulate_q(may_accumulate_q_),
      p(a.n_rows(), a.n_columns(), applied_on_right_tag(), may_accumulate_q)
  {
    // k is the number of reflections: m if n > m, n-1 otherwise
    int m = a.n_rows(), n = a.n_columns(), k=(n > m ? m : n-1);
    beta.reserve(k);
    // NOTE(review): text lost here. The loop below is cut at its condition;
    // the rest of the constructor and the beginning of the method returning
    // Q (documentation, signature, first statements) are missing. The
    // surviving tail builds a (thin ? min(m,n) : n) x n matrix and returns it.
    for (int i=0; i beta_(&beta[0], beta.size());
    matrix_t q(dim(thin ? std::min(m, n) : n, n), af::init_functor_null());
    p.accumulate_factored_form_in_rows(q.ref(), a, beta_,
                                       product_in_reverse_row_order);
    return q;
  }

  /// Accumulate Q inside A in-place
  /** L is therefore lost. Requires m <= n and may_accumulate_q. */
  void accumulate_q_in_place() {
    int m = a.n_rows(), n = a.n_columns();
    SCITBX_ASSERT(may_accumulate_q);
    SCITBX_ASSERT(m <= n);
    // NOTE(review): template argument of af::const_ref stripped.
    af::const_ref beta_(&beta[0], beta.size());
    p.accumulate_in_place_factored_form_in_rows(a, beta_);
  }
};


/// Decomposition U^T A V = B where B is bidiagonal and U,V orthogonal
/** B is upper diagonal if m >= n and lower diagonal if m < n.

    Reference: Golub and Van Loan, Algorithm 5.4.2
 */
// NOTE(review): template parameter list stripped.
template struct bidiagonalisation {
  typedef FloatType scalar_t;
  typedef af::c_grid<2> dim;
  // NOTE(review): template arguments of the two typedefs below stripped.
  typedef af::versa matrix_t;
  typedef af::ref matrix_ref_t;

  /// The matrix being reduced, overwritten in place
  matrix_ref_t a;
  /// Reflection object reused for every row and column
  // NOTE(review): template arguments of reflection and std::vector stripped.
  reflection p;
  /// Normalisations of the reflections applied on the left and on the right
  std::vector beta_left, beta_right;

  /// Overwrite a in-place with its bidiagonalisation
  /** The bidiagonal is that of B whereas the rest of a stores the essential
      part of the Householder vectors making U and V
   */
  bidiagonalisation(matrix_ref_t const &a_)
    : a(a_), p(a.n_rows(), a.n_columns(), applied_on_left_and_right_tag())
  {
    int m = a.n_rows(), n = a.n_columns();
    if (m >= n) {
      // Number of reflections to apply on each side
      int k_left = m > n ? n : n-1;
      int k_right = n-2;
      beta_left.reserve(k_left);
      beta_right.reserve(k_right);
      // NOTE(review): text lost here. The loop below is cut at its
      // condition; the rest of the constructor (including the m < n branch)
      // and the beginning of the method returning U (documentation,
      // signature, first statements) are missing.
      for (int j=0; j beta_left_(&beta_left[0], beta_left.size());
    matrix_t u(dim(m, thin ? std::min(m, n) : m), af::init_functor_null());
    // The Householder vectors start one row lower when m < n
    p.accumulate_factored_form_in_columns(u.ref(), a, beta_left_,
                                          m >= n ? 0 : 1);
    return u;
  }

  /// The matrix V, either full or thin (c.f. class \c lq_decomposition)
  matrix_t v(bool thin=true) {
    int m = a.n_rows(), n = a.n_columns();
    // NOTE(review): template argument of af::const_ref stripped.
    af::const_ref beta_right_(&beta_right[0], beta_right.size());
    matrix_t v(dim(n, thin ? std::min(m,n) : n), af::init_functor_null());
    // The Householder vectors start one column further right when m >= n
    p.accumulate_factored_form_in_rows(v.ref(), a, beta_right_,
                                       product_in_row_order,
                                       m >= n ? 1 : 0);
    return v;
  }
};


/// Random sequences of normal matrices,
/// or of matrices with given eigen or singular values.
/** Reference: G.W. Stewart, SIAM J. Numer. Anal., 17:403--409, 1980.

    The method relies on a multinormal random vector whose dimension is
    the number of rows of the matrices to generate.

    This class is modelled on the Boost random framework.
 */
// NOTE(review): template parameter list stripped; the members below use the
// names FloatType and UniformRandomNumberGenerator.
template struct random_normal_matrix_generator {
  typedef FloatType scalar_t;
  typedef af::c_grid<2> dim;
  // NOTE(review): template arguments of the four typedefs below stripped.
  typedef af::versa matrix_t;
  typedef af::ref matrix_ref_t;
  typedef af::versa symmetric_matrix_packed_u_t;
  typedef af::ref symmetric_matrix_packed_u_ref_t;

  /// Source of uniform random numbers, held by value
  UniformRandomNumberGenerator uniform_gen;
  /// Normal distribution, constructed with arguments (0, 1)
  // NOTE(review): template arguments of the two Boost types below stripped.
  boost::normal_distribution normal_dist;
  /// Generator built from uniform_gen and normal_dist
  boost::variate_generator > normal_gen;
  /// Number of rows and columns of the generated matrices
  int m, n;
  /// Reflection object doing the actual accumulation
  // NOTE(review): template argument of reflection stripped.
  reflection p;

  /// Construct a generator for matrices with the given dimensions.
  /** The given generator of uniformly distributed numbers on [0,1) is used
      as the source of the multinormal random generator.
   */
  random_normal_matrix_generator(UniformRandomNumberGenerator &uniform,
                                 int rows, int columns)
    : uniform_gen(uniform),
      normal_dist(0, 1),
      normal_gen(uniform_gen, normal_dist),
      m(rows), n(columns),
      p(m, n, applied_on_left_and_right_tag())
  {}

  /// Construct a generator for matrices with the given dimensions.
  /** An internal generator of uniformly distributed numbers on [0,1) is used
      as the source of the multinormal random generator. All objects made
      by this constructor produce the same random sequences.
   */
  random_normal_matrix_generator(int rows, int columns)
    : normal_dist(0, 1),
      normal_gen(uniform_gen, normal_dist),
      m(rows), n(columns),
      p(m, n, applied_on_left_and_right_tag())
  {}

  /// Generate a random normal matrix.
  /** Returns a newly allocated m x n matrix filled by
      reflection::accumulate_random_normal_matrix.
   */
  matrix_t normal_matrix() {
    matrix_t result(dim(m, n), af::init_functor_null());
    matrix_ref_t q = result.ref();
    p.accumulate_random_normal_matrix(normal_gen, q);
    return result;
  }

  /// Generate a random matrix with the given singular values.
  /** Returns a newly allocated m x n matrix filled by
      reflection::accumulate_random_matrix_with_singular_values.
   */
  // NOTE(review): template argument of af::const_ref stripped.
  matrix_t matrix_with_singular_values(af::const_ref const &sigma) {
    matrix_t result(dim(m, n), af::init_functor_null());
    matrix_ref_t a = result.ref();
    p.accumulate_random_matrix_with_singular_values(normal_gen, sigma, a);
    return result;
  }

  /// Generate a random symmetric matrix with the given eigenvalues.
  /** Asserts that the generator was constructed with m == n. */
  // NOTE(review): template argument of af::const_ref stripped.
  symmetric_matrix_packed_u_t
  symmetric_matrix_with_eigenvalues(af::const_ref const& lambda) {
    SCITBX_ASSERT(m == n)(m)(n);
    symmetric_matrix_packed_u_t result(n, af::init_functor_null());
    symmetric_matrix_packed_u_ref_t a = result.ref();
    p.accumulate_random_symmetric_matrix_with_eigenvalues(normal_gen,
                                                          lambda, a);
    return result;
  }
};


}}} // scitbx::matrix::householder

#endif // GUARD