4325 lines
117 KiB
C++
4325 lines
117 KiB
C++
// Copyright (C) 2008-2015 National ICT Australia (NICTA)
|
|
//
|
|
// This Source Code Form is subject to the terms of the Mozilla Public
|
|
// License, v. 2.0. If a copy of the MPL was not distributed with this
|
|
// file, You can obtain one at http://mozilla.org/MPL/2.0/.
|
|
// -------------------------------------------------------------------
|
|
//
|
|
// Written by Conrad Sanderson - http://conradsanderson.id.au
|
|
// Written by James Sanders
|
|
// Written by Stanislav Funiak
|
|
// Written by Eric Jon Sundstrom
|
|
// Written by Michael McNeil Forbes
|
|
// Written by Keith O'Hara
|
|
|
|
|
|
//! \addtogroup auxlib
|
|
//! @{
|
|
|
|
|
|
|
|
//! matrix inverse
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::inv(Mat<eT>& out, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
out = X.get_ref();
|
|
|
|
arma_debug_check( (out.is_square() == false), "inv(): given matrix must be square sized" );
|
|
|
|
const uword N = out.n_rows;
|
|
|
|
if(N <= 4)
|
|
{
|
|
Mat<eT> tmp(N,N);
|
|
|
|
const bool status = auxlib::inv_noalias_tinymat(tmp, out, N);
|
|
|
|
if(status == true)
|
|
{
|
|
arrayops::copy( out.memptr(), tmp.memptr(), tmp.n_elem );
|
|
|
|
return true;
|
|
}
|
|
}
|
|
|
|
return auxlib::inv_inplace_lapack(out);
|
|
}
|
|
|
|
|
|
|
|
template<typename eT>
|
|
inline
|
|
bool
|
|
auxlib::inv(Mat<eT>& out, const Mat<eT>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
arma_debug_check( (X.is_square() == false), "inv(): given matrix must be square sized" );
|
|
|
|
const uword N = X.n_rows;
|
|
|
|
if(N <= 4)
|
|
{
|
|
if(&out != &X)
|
|
{
|
|
out.set_size(N,N);
|
|
|
|
const bool status = auxlib::inv_noalias_tinymat(out, X, N);
|
|
|
|
if(status == true) { return true; }
|
|
}
|
|
else
|
|
{
|
|
Mat<eT> tmp(N,N);
|
|
|
|
const bool status = auxlib::inv_noalias_tinymat(tmp, X, N);
|
|
|
|
if(status == true)
|
|
{
|
|
arrayops::copy( out.memptr(), tmp.memptr(), tmp.n_elem );
|
|
|
|
return true;
|
|
}
|
|
}
|
|
}
|
|
|
|
out = X;
|
|
|
|
return auxlib::inv_inplace_lapack(out);
|
|
}
|
|
|
|
|
|
|
|
template<typename eT>
|
|
inline
|
|
bool
|
|
auxlib::inv_noalias_tinymat(Mat<eT>& out, const Mat<eT>& X, const uword N)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
typedef typename get_pod_type<eT>::result T;
|
|
|
|
const T det_min = std::numeric_limits<T>::epsilon();
|
|
|
|
bool calc_ok = false;
|
|
|
|
const eT* Xm = X.memptr();
|
|
eT* outm = out.memptr(); // NOTE: the output matrix is assumed to have the correct size
|
|
|
|
switch(N)
|
|
{
|
|
case 1:
|
|
{
|
|
outm[0] = eT(1) / Xm[0];
|
|
|
|
calc_ok = true;
|
|
};
|
|
break;
|
|
|
|
case 2:
|
|
{
|
|
const eT a = Xm[pos<0,0>::n2];
|
|
const eT b = Xm[pos<0,1>::n2];
|
|
const eT c = Xm[pos<1,0>::n2];
|
|
const eT d = Xm[pos<1,1>::n2];
|
|
|
|
const eT det_val = (a*d - b*c);
|
|
|
|
if(std::abs(det_val) >= det_min)
|
|
{
|
|
outm[pos<0,0>::n2] = d / det_val;
|
|
outm[pos<0,1>::n2] = -b / det_val;
|
|
outm[pos<1,0>::n2] = -c / det_val;
|
|
outm[pos<1,1>::n2] = a / det_val;
|
|
|
|
calc_ok = true;
|
|
}
|
|
};
|
|
break;
|
|
|
|
case 3:
|
|
{
|
|
const eT det_val = auxlib::det_tinymat(X,3);
|
|
|
|
if(std::abs(det_val) >= det_min)
|
|
{
|
|
outm[pos<0,0>::n3] = (Xm[pos<2,2>::n3]*Xm[pos<1,1>::n3] - Xm[pos<2,1>::n3]*Xm[pos<1,2>::n3]) / det_val;
|
|
outm[pos<1,0>::n3] = -(Xm[pos<2,2>::n3]*Xm[pos<1,0>::n3] - Xm[pos<2,0>::n3]*Xm[pos<1,2>::n3]) / det_val;
|
|
outm[pos<2,0>::n3] = (Xm[pos<2,1>::n3]*Xm[pos<1,0>::n3] - Xm[pos<2,0>::n3]*Xm[pos<1,1>::n3]) / det_val;
|
|
|
|
outm[pos<0,1>::n3] = -(Xm[pos<2,2>::n3]*Xm[pos<0,1>::n3] - Xm[pos<2,1>::n3]*Xm[pos<0,2>::n3]) / det_val;
|
|
outm[pos<1,1>::n3] = (Xm[pos<2,2>::n3]*Xm[pos<0,0>::n3] - Xm[pos<2,0>::n3]*Xm[pos<0,2>::n3]) / det_val;
|
|
outm[pos<2,1>::n3] = -(Xm[pos<2,1>::n3]*Xm[pos<0,0>::n3] - Xm[pos<2,0>::n3]*Xm[pos<0,1>::n3]) / det_val;
|
|
|
|
outm[pos<0,2>::n3] = (Xm[pos<1,2>::n3]*Xm[pos<0,1>::n3] - Xm[pos<1,1>::n3]*Xm[pos<0,2>::n3]) / det_val;
|
|
outm[pos<1,2>::n3] = -(Xm[pos<1,2>::n3]*Xm[pos<0,0>::n3] - Xm[pos<1,0>::n3]*Xm[pos<0,2>::n3]) / det_val;
|
|
outm[pos<2,2>::n3] = (Xm[pos<1,1>::n3]*Xm[pos<0,0>::n3] - Xm[pos<1,0>::n3]*Xm[pos<0,1>::n3]) / det_val;
|
|
|
|
const eT check_val = Xm[pos<0,0>::n3]*outm[pos<0,0>::n3] + Xm[pos<0,1>::n3]*outm[pos<1,0>::n3] + Xm[pos<0,2>::n3]*outm[pos<2,0>::n3];
|
|
|
|
const T max_diff = (is_float<T>::value) ? T(1e-4) : T(1e-10); // empirically determined; may need tuning
|
|
|
|
if(std::abs(T(1) - check_val) < max_diff)
|
|
{
|
|
calc_ok = true;
|
|
}
|
|
}
|
|
};
|
|
break;
|
|
|
|
case 4:
|
|
{
|
|
const eT det_val = auxlib::det_tinymat(X,4);
|
|
|
|
if(std::abs(det_val) >= det_min)
|
|
{
|
|
outm[pos<0,0>::n4] = ( Xm[pos<1,2>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,1>::n4] - Xm[pos<1,3>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,1>::n4] + Xm[pos<1,3>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,2>::n4] - Xm[pos<1,1>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,2>::n4] - Xm[pos<1,2>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,3>::n4] + Xm[pos<1,1>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<1,0>::n4] = ( Xm[pos<1,3>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,0>::n4] - Xm[pos<1,2>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<1,3>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,2>::n4] + Xm[pos<1,0>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,2>::n4] + Xm[pos<1,2>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,3>::n4] - Xm[pos<1,0>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<2,0>::n4] = ( Xm[pos<1,1>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<1,3>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,0>::n4] + Xm[pos<1,3>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,1>::n4] - Xm[pos<1,0>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,1>::n4] - Xm[pos<1,1>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,3>::n4] + Xm[pos<1,0>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<3,0>::n4] = ( Xm[pos<1,2>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,0>::n4] - Xm[pos<1,1>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,0>::n4] - Xm[pos<1,2>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,1>::n4] + Xm[pos<1,0>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,1>::n4] + Xm[pos<1,1>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,2>::n4] - Xm[pos<1,0>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,2>::n4] ) / det_val;
|
|
|
|
outm[pos<0,1>::n4] = ( Xm[pos<0,3>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,2>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,3>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,2>::n4] + Xm[pos<0,1>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,2>::n4] + Xm[pos<0,2>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,3>::n4] - Xm[pos<0,1>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<1,1>::n4] = ( Xm[pos<0,2>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,0>::n4] + Xm[pos<0,3>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,2>::n4] - Xm[pos<0,0>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,2>::n4] - Xm[pos<0,2>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,3>::n4] + Xm[pos<0,0>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<2,1>::n4] = ( Xm[pos<0,3>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,1>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,1>::n4] + Xm[pos<0,0>::n4]*Xm[pos<2,3>::n4]*Xm[pos<3,1>::n4] + Xm[pos<0,1>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,3>::n4] - Xm[pos<0,0>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<3,1>::n4] = ( Xm[pos<0,1>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,2>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,0>::n4] + Xm[pos<0,2>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,0>::n4]*Xm[pos<2,2>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,1>::n4]*Xm[pos<2,0>::n4]*Xm[pos<3,2>::n4] + Xm[pos<0,0>::n4]*Xm[pos<2,1>::n4]*Xm[pos<3,2>::n4] ) / det_val;
|
|
|
|
outm[pos<0,2>::n4] = ( Xm[pos<0,2>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,1>::n4] + Xm[pos<0,3>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,2>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,2>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,3>::n4] + Xm[pos<0,1>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<1,2>::n4] = ( Xm[pos<0,3>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,2>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,2>::n4] + Xm[pos<0,2>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,3>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<2,2>::n4] = ( Xm[pos<0,1>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,0>::n4] + Xm[pos<0,3>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,3>::n4]*Xm[pos<3,1>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,3>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,3>::n4] ) / det_val;
|
|
outm[pos<3,2>::n4] = ( Xm[pos<0,2>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,0>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,1>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,2>::n4]*Xm[pos<3,1>::n4] + Xm[pos<0,1>::n4]*Xm[pos<1,0>::n4]*Xm[pos<3,2>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,1>::n4]*Xm[pos<3,2>::n4] ) / det_val;
|
|
|
|
outm[pos<0,3>::n4] = ( Xm[pos<0,3>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,1>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,1>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,2>::n4] + Xm[pos<0,1>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,2>::n4] + Xm[pos<0,2>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,3>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,3>::n4] ) / det_val;
|
|
outm[pos<1,3>::n4] = ( Xm[pos<0,2>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,0>::n4] + Xm[pos<0,3>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,2>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,2>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,3>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,3>::n4] ) / det_val;
|
|
outm[pos<2,3>::n4] = ( Xm[pos<0,3>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,0>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,0>::n4] - Xm[pos<0,3>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,1>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,3>::n4]*Xm[pos<2,1>::n4] + Xm[pos<0,1>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,3>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,3>::n4] ) / det_val;
|
|
outm[pos<3,3>::n4] = ( Xm[pos<0,1>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,0>::n4] - Xm[pos<0,2>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,0>::n4] + Xm[pos<0,2>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,1>::n4] - Xm[pos<0,0>::n4]*Xm[pos<1,2>::n4]*Xm[pos<2,1>::n4] - Xm[pos<0,1>::n4]*Xm[pos<1,0>::n4]*Xm[pos<2,2>::n4] + Xm[pos<0,0>::n4]*Xm[pos<1,1>::n4]*Xm[pos<2,2>::n4] ) / det_val;
|
|
|
|
const eT check_val = Xm[pos<0,0>::n4]*outm[pos<0,0>::n4] + Xm[pos<0,1>::n4]*outm[pos<1,0>::n4] + Xm[pos<0,2>::n4]*outm[pos<2,0>::n4] + Xm[pos<0,3>::n4]*outm[pos<3,0>::n4];
|
|
|
|
const T max_diff = (is_float<T>::value) ? T(1e-4) : T(1e-10); // empirically determined; may need tuning
|
|
|
|
if(std::abs(T(1) - check_val) < max_diff)
|
|
{
|
|
calc_ok = true;
|
|
}
|
|
}
|
|
};
|
|
break;
|
|
|
|
default:
|
|
;
|
|
}
|
|
|
|
return calc_ok;
|
|
}
|
|
|
|
|
|
|
|
template<typename eT>
|
|
inline
|
|
bool
|
|
auxlib::inv_inplace_lapack(Mat<eT>& out)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
if(out.is_empty()) { return true; }
|
|
|
|
#if defined(ARMA_USE_ATLAS)
|
|
{
|
|
arma_debug_assert_atlas_size(out);
|
|
|
|
podarray<int> ipiv(out.n_rows);
|
|
|
|
int info = 0;
|
|
|
|
arma_extra_debug_print("atlas::clapack_getrf()");
|
|
info = atlas::clapack_getrf(atlas::CblasColMajor, out.n_rows, out.n_cols, out.memptr(), out.n_rows, ipiv.memptr());
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("atlas::clapack_getri()");
|
|
info = atlas::clapack_getri(atlas::CblasColMajor, out.n_rows, out.memptr(), out.n_rows, ipiv.memptr());
|
|
|
|
return (info == 0);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
arma_debug_assert_blas_size(out);
|
|
|
|
blas_int n_rows = out.n_rows;
|
|
blas_int lwork = (std::max)(blas_int(podarray_prealloc_n_elem::val), n_rows);
|
|
blas_int info = 0;
|
|
|
|
podarray<blas_int> ipiv(out.n_rows);
|
|
|
|
if(n_rows > 16)
|
|
{
|
|
eT work_query[2];
|
|
blas_int lwork_query = -1;
|
|
|
|
arma_extra_debug_print("lapack::getri()");
|
|
lapack::getri(&n_rows, out.memptr(), &n_rows, ipiv.memptr(), &work_query[0], &lwork_query, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork_proposed = static_cast<blas_int>( access::tmp_real(work_query[0]) );
|
|
|
|
lwork = (std::max)(lwork_proposed, lwork);
|
|
}
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::getrf()");
|
|
lapack::getrf(&n_rows, &n_rows, out.memptr(), &n_rows, ipiv.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("lapack::getri()");
|
|
lapack::getri(&n_rows, out.memptr(), &n_rows, ipiv.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_stop("inv(): use of ATLAS or LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::inv_tr(Mat<eT>& out, const Base<eT,T1>& X, const uword layout)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
out = X.get_ref();
|
|
|
|
arma_debug_check( (out.is_square() == false), "inv(): given matrix must be square sized" );
|
|
|
|
if(out.is_empty()) { return true; }
|
|
|
|
arma_debug_assert_blas_size(out);
|
|
|
|
char uplo = (layout == 0) ? 'U' : 'L';
|
|
char diag = 'N';
|
|
blas_int n = blas_int(out.n_rows);
|
|
blas_int info = 0;
|
|
|
|
arma_extra_debug_print("lapack::trtri()");
|
|
lapack::trtri(&uplo, &diag, &n, out.memptr(), &n, &info);
|
|
|
|
if(layout == 0)
|
|
{
|
|
out = trimatu(out); // upper triangular
|
|
}
|
|
else
|
|
{
|
|
out = trimatl(out); // lower triangular
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(X);
|
|
arma_ignore(layout);
|
|
arma_stop("inv(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::inv_sym(Mat<eT>& out, const Base<eT,T1>& X, const uword layout)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
out = X.get_ref();
|
|
|
|
arma_debug_check( (out.is_square() == false), "inv(): given matrix must be square sized" );
|
|
|
|
if(out.is_empty()) { return true; }
|
|
|
|
arma_debug_assert_blas_size(out);
|
|
|
|
char uplo = (layout == 0) ? 'U' : 'L';
|
|
blas_int n = blas_int(out.n_rows);
|
|
blas_int lwork = (std::max)(blas_int(podarray_prealloc_n_elem::val), 2*n);
|
|
blas_int info = 0;
|
|
|
|
podarray<blas_int> ipiv;
|
|
ipiv.set_size(out.n_rows);
|
|
|
|
podarray<eT> work;
|
|
work.set_size( uword(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::sytrf()");
|
|
lapack::sytrf(&uplo, &n, out.memptr(), &n, ipiv.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("lapack::sytri()");
|
|
lapack::sytri(&uplo, &n, out.memptr(), &n, ipiv.memptr(), work.memptr(), &info);
|
|
|
|
if(layout == 0)
|
|
{
|
|
out = symmatu(out);
|
|
}
|
|
else
|
|
{
|
|
out = symmatl(out);
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(X);
|
|
arma_ignore(layout);
|
|
arma_stop("inv(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::inv_sympd(Mat<eT>& out, const Base<eT,T1>& X, const uword layout)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
out = X.get_ref();
|
|
|
|
arma_debug_check( (out.is_square() == false), "inv_sympd(): given matrix must be square sized" );
|
|
|
|
if(out.is_empty()) { return true; }
|
|
|
|
arma_debug_assert_blas_size(out);
|
|
|
|
char uplo = (layout == 0) ? 'U' : 'L';
|
|
blas_int n = blas_int(out.n_rows);
|
|
blas_int info = 0;
|
|
|
|
arma_extra_debug_print("lapack::potrf()");
|
|
lapack::potrf(&uplo, &n, out.memptr(), &n, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("lapack::potri()");
|
|
lapack::potri(&uplo, &n, out.memptr(), &n, &info);
|
|
|
|
if(layout == 0)
|
|
{
|
|
out = symmatu(out);
|
|
}
|
|
else
|
|
{
|
|
out = symmatl(out);
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(X);
|
|
arma_ignore(layout);
|
|
arma_stop("inv_sympd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
eT
|
|
auxlib::det(const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
typedef typename get_pod_type<eT>::result T;
|
|
|
|
const bool make_copy = (is_Mat<T1>::value) ? true : false;
|
|
|
|
const unwrap<T1> tmp(X.get_ref());
|
|
const Mat<eT>& A = tmp.M;
|
|
|
|
arma_debug_check( (A.is_square() == false), "det(): given matrix must be square sized" );
|
|
|
|
const uword N = A.n_rows;
|
|
|
|
if(N <= 4)
|
|
{
|
|
const eT det_val = auxlib::det_tinymat(A, N);
|
|
|
|
const T det_min = std::numeric_limits<T>::epsilon();
|
|
|
|
if(std::abs(det_val) >= det_min) { return det_val; }
|
|
}
|
|
|
|
return auxlib::det_lapack(A, make_copy);
|
|
}
|
|
|
|
|
|
|
|
template<typename eT>
|
|
inline
|
|
eT
|
|
auxlib::det_tinymat(const Mat<eT>& X, const uword N)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
switch(N)
|
|
{
|
|
case 0:
|
|
return eT(1);
|
|
break;
|
|
|
|
case 1:
|
|
return X[0];
|
|
break;
|
|
|
|
case 2:
|
|
{
|
|
const eT* Xm = X.memptr();
|
|
|
|
return ( Xm[pos<0,0>::n2]*Xm[pos<1,1>::n2] - Xm[pos<0,1>::n2]*Xm[pos<1,0>::n2] );
|
|
}
|
|
break;
|
|
|
|
case 3:
|
|
{
|
|
// const double tmp1 = X.at(0,0) * X.at(1,1) * X.at(2,2);
|
|
// const double tmp2 = X.at(0,1) * X.at(1,2) * X.at(2,0);
|
|
// const double tmp3 = X.at(0,2) * X.at(1,0) * X.at(2,1);
|
|
// const double tmp4 = X.at(2,0) * X.at(1,1) * X.at(0,2);
|
|
// const double tmp5 = X.at(2,1) * X.at(1,2) * X.at(0,0);
|
|
// const double tmp6 = X.at(2,2) * X.at(1,0) * X.at(0,1);
|
|
// return (tmp1+tmp2+tmp3) - (tmp4+tmp5+tmp6);
|
|
|
|
const eT* Xm = X.memptr();
|
|
|
|
const eT val1 = Xm[pos<0,0>::n3]*(Xm[pos<2,2>::n3]*Xm[pos<1,1>::n3] - Xm[pos<2,1>::n3]*Xm[pos<1,2>::n3]);
|
|
const eT val2 = Xm[pos<1,0>::n3]*(Xm[pos<2,2>::n3]*Xm[pos<0,1>::n3] - Xm[pos<2,1>::n3]*Xm[pos<0,2>::n3]);
|
|
const eT val3 = Xm[pos<2,0>::n3]*(Xm[pos<1,2>::n3]*Xm[pos<0,1>::n3] - Xm[pos<1,1>::n3]*Xm[pos<0,2>::n3]);
|
|
|
|
return ( val1 - val2 + val3 );
|
|
}
|
|
break;
|
|
|
|
case 4:
|
|
{
|
|
const eT* Xm = X.memptr();
|
|
|
|
const eT val = \
|
|
Xm[pos<0,3>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,0>::n4] \
|
|
- Xm[pos<0,2>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,0>::n4] \
|
|
- Xm[pos<0,3>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,0>::n4] \
|
|
+ Xm[pos<0,1>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,0>::n4] \
|
|
+ Xm[pos<0,2>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,0>::n4] \
|
|
- Xm[pos<0,1>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,0>::n4] \
|
|
- Xm[pos<0,3>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,1>::n4] \
|
|
+ Xm[pos<0,2>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,1>::n4] \
|
|
+ Xm[pos<0,3>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,1>::n4] \
|
|
- Xm[pos<0,0>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,1>::n4] \
|
|
- Xm[pos<0,2>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,1>::n4] \
|
|
+ Xm[pos<0,0>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,1>::n4] \
|
|
+ Xm[pos<0,3>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,2>::n4] \
|
|
- Xm[pos<0,1>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,2>::n4] \
|
|
- Xm[pos<0,3>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,2>::n4] \
|
|
+ Xm[pos<0,0>::n4] * Xm[pos<1,3>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,2>::n4] \
|
|
+ Xm[pos<0,1>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,2>::n4] \
|
|
- Xm[pos<0,0>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,3>::n4] * Xm[pos<3,2>::n4] \
|
|
- Xm[pos<0,2>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,3>::n4] \
|
|
+ Xm[pos<0,1>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,0>::n4] * Xm[pos<3,3>::n4] \
|
|
+ Xm[pos<0,2>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,3>::n4] \
|
|
- Xm[pos<0,0>::n4] * Xm[pos<1,2>::n4] * Xm[pos<2,1>::n4] * Xm[pos<3,3>::n4] \
|
|
- Xm[pos<0,1>::n4] * Xm[pos<1,0>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,3>::n4] \
|
|
+ Xm[pos<0,0>::n4] * Xm[pos<1,1>::n4] * Xm[pos<2,2>::n4] * Xm[pos<3,3>::n4] \
|
|
;
|
|
|
|
return val;
|
|
}
|
|
break;
|
|
|
|
default:
|
|
return eT(0);
|
|
;
|
|
}
|
|
}
|
|
|
|
|
|
|
|
//! determinant of a matrix
|
|
template<typename eT>
|
|
inline
|
|
eT
|
|
auxlib::det_lapack(const Mat<eT>& X, const bool make_copy)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
Mat<eT> X_copy;
|
|
|
|
if(make_copy) { X_copy = X; }
|
|
|
|
Mat<eT>& tmp = (make_copy) ? X_copy : const_cast< Mat<eT>& >(X);
|
|
|
|
if(tmp.is_empty()) { return eT(1); }
|
|
|
|
#if defined(ARMA_USE_ATLAS)
|
|
{
|
|
arma_debug_assert_atlas_size(tmp);
|
|
|
|
podarray<int> ipiv(tmp.n_rows);
|
|
|
|
arma_extra_debug_print("atlas::clapack_getrf()");
|
|
//const int info =
|
|
atlas::clapack_getrf(atlas::CblasColMajor, tmp.n_rows, tmp.n_cols, tmp.memptr(), tmp.n_rows, ipiv.memptr());
|
|
|
|
// on output tmp appears to be L+U_alt, where U_alt is U with the main diagonal set to zero
|
|
eT val = tmp.at(0,0);
|
|
for(uword i=1; i < tmp.n_rows; ++i)
|
|
{
|
|
val *= tmp.at(i,i);
|
|
}
|
|
|
|
int sign = +1;
|
|
for(uword i=0; i < tmp.n_rows; ++i)
|
|
{
|
|
if( int(i) != ipiv.mem[i] ) // NOTE: no adjustment required, as the clapack version of getrf() assumes counting from 0
|
|
{
|
|
sign *= -1;
|
|
}
|
|
}
|
|
|
|
return ( (sign < 0) ? -val : val );
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
arma_debug_assert_blas_size(tmp);
|
|
|
|
podarray<blas_int> ipiv(tmp.n_rows);
|
|
|
|
blas_int info = 0;
|
|
blas_int n_rows = blas_int(tmp.n_rows);
|
|
blas_int n_cols = blas_int(tmp.n_cols);
|
|
|
|
arma_extra_debug_print("lapack::getrf()");
|
|
lapack::getrf(&n_rows, &n_cols, tmp.memptr(), &n_rows, ipiv.memptr(), &info);
|
|
|
|
// on output tmp appears to be L+U_alt, where U_alt is U with the main diagonal set to zero
|
|
eT val = tmp.at(0,0);
|
|
for(uword i=1; i < tmp.n_rows; ++i)
|
|
{
|
|
val *= tmp.at(i,i);
|
|
}
|
|
|
|
blas_int sign = +1;
|
|
for(uword i=0; i < tmp.n_rows; ++i)
|
|
{
|
|
if( blas_int(i) != (ipiv.mem[i] - 1) ) // NOTE: adjustment of -1 is required as Fortran counts from 1
|
|
{
|
|
sign *= -1;
|
|
}
|
|
}
|
|
|
|
return ( (sign < 0) ? -val : val );
|
|
}
|
|
#else
|
|
{
|
|
arma_stop("det(): use of ATLAS or LAPACK must be enabled");
|
|
return eT(0);
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! log determinant of a matrix
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::log_det(eT& out_val, typename get_pod_type<eT>::result& out_sign, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
typedef typename get_pod_type<eT>::result T;
|
|
|
|
#if defined(ARMA_USE_ATLAS)
|
|
{
|
|
Mat<eT> tmp(X.get_ref());
|
|
arma_debug_check( (tmp.is_square() == false), "log_det(): given matrix must be square sized" );
|
|
|
|
if(tmp.is_empty())
|
|
{
|
|
out_val = eT(0);
|
|
out_sign = T(1);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_atlas_size(tmp);
|
|
|
|
podarray<int> ipiv(tmp.n_rows);
|
|
|
|
arma_extra_debug_print("atlas::clapack_getrf()");
|
|
const int info = atlas::clapack_getrf(atlas::CblasColMajor, tmp.n_rows, tmp.n_cols, tmp.memptr(), tmp.n_rows, ipiv.memptr());
|
|
|
|
// on output tmp appears to be L+U_alt, where U_alt is U with the main diagonal set to zero
|
|
|
|
sword sign = (is_complex<eT>::value == false) ? ( (access::tmp_real( tmp.at(0,0) ) < T(0)) ? -1 : +1 ) : +1;
|
|
eT val = (is_complex<eT>::value == false) ? std::log( (access::tmp_real( tmp.at(0,0) ) < T(0)) ? tmp.at(0,0)*T(-1) : tmp.at(0,0) ) : std::log( tmp.at(0,0) );
|
|
|
|
for(uword i=1; i < tmp.n_rows; ++i)
|
|
{
|
|
const eT x = tmp.at(i,i);
|
|
|
|
sign *= (is_complex<eT>::value == false) ? ( (access::tmp_real(x) < T(0)) ? -1 : +1 ) : +1;
|
|
val += (is_complex<eT>::value == false) ? std::log( (access::tmp_real(x) < T(0)) ? x*T(-1) : x ) : std::log(x);
|
|
}
|
|
|
|
for(uword i=0; i < tmp.n_rows; ++i)
|
|
{
|
|
if( int(i) != ipiv.mem[i] ) // NOTE: no adjustment required, as the clapack version of getrf() assumes counting from 0
|
|
{
|
|
sign *= -1;
|
|
}
|
|
}
|
|
|
|
out_val = val;
|
|
out_sign = T(sign);
|
|
|
|
return (info == 0);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> tmp(X.get_ref());
|
|
arma_debug_check( (tmp.is_square() == false), "log_det(): given matrix must be square sized" );
|
|
|
|
if(tmp.is_empty())
|
|
{
|
|
out_val = eT(0);
|
|
out_sign = T(1);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(tmp);
|
|
|
|
podarray<blas_int> ipiv(tmp.n_rows);
|
|
|
|
blas_int info = 0;
|
|
blas_int n_rows = blas_int(tmp.n_rows);
|
|
blas_int n_cols = blas_int(tmp.n_cols);
|
|
|
|
arma_extra_debug_print("lapack::getrf()");
|
|
lapack::getrf(&n_rows, &n_cols, tmp.memptr(), &n_rows, ipiv.memptr(), &info);
|
|
|
|
// on output tmp appears to be L+U_alt, where U_alt is U with the main diagonal set to zero
|
|
|
|
sword sign = (is_complex<eT>::value == false) ? ( (access::tmp_real( tmp.at(0,0) ) < T(0)) ? -1 : +1 ) : +1;
|
|
eT val = (is_complex<eT>::value == false) ? std::log( (access::tmp_real( tmp.at(0,0) ) < T(0)) ? tmp.at(0,0)*T(-1) : tmp.at(0,0) ) : std::log( tmp.at(0,0) );
|
|
|
|
for(uword i=1; i < tmp.n_rows; ++i)
|
|
{
|
|
const eT x = tmp.at(i,i);
|
|
|
|
sign *= (is_complex<eT>::value == false) ? ( (access::tmp_real(x) < T(0)) ? -1 : +1 ) : +1;
|
|
val += (is_complex<eT>::value == false) ? std::log( (access::tmp_real(x) < T(0)) ? x*T(-1) : x ) : std::log(x);
|
|
}
|
|
|
|
for(uword i=0; i < tmp.n_rows; ++i)
|
|
{
|
|
if( blas_int(i) != (ipiv.mem[i] - 1) ) // NOTE: adjustment of -1 is required as Fortran counts from 1
|
|
{
|
|
sign *= -1;
|
|
}
|
|
}
|
|
|
|
out_val = val;
|
|
out_sign = T(sign);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(X);
|
|
|
|
out_val = eT(0);
|
|
out_sign = T(0);
|
|
|
|
arma_stop("log_det(): use of ATLAS or LAPACK must be enabled");
|
|
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! LU decomposition of a matrix
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::lu(Mat<eT>& L, Mat<eT>& U, podarray<blas_int>& ipiv, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
U = X.get_ref();
|
|
|
|
const uword U_n_rows = U.n_rows;
|
|
const uword U_n_cols = U.n_cols;
|
|
|
|
if(U.is_empty())
|
|
{
|
|
L.set_size(U_n_rows, 0);
|
|
U.set_size(0, U_n_cols);
|
|
ipiv.reset();
|
|
return true;
|
|
}
|
|
|
|
#if defined(ARMA_USE_ATLAS) || defined(ARMA_USE_LAPACK)
|
|
{
|
|
bool status = false;
|
|
|
|
#if defined(ARMA_USE_ATLAS)
|
|
{
|
|
arma_debug_assert_atlas_size(U);
|
|
|
|
ipiv.set_size( (std::min)(U_n_rows, U_n_cols) );
|
|
|
|
arma_extra_debug_print("atlas::clapack_getrf()");
|
|
int info = atlas::clapack_getrf(atlas::CblasColMajor, U_n_rows, U_n_cols, U.memptr(), U_n_rows, ipiv.memptr());
|
|
|
|
status = (info == 0);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
arma_debug_assert_blas_size(U);
|
|
|
|
ipiv.set_size( (std::min)(U_n_rows, U_n_cols) );
|
|
|
|
blas_int info = 0;
|
|
|
|
blas_int n_rows = blas_int(U_n_rows);
|
|
blas_int n_cols = blas_int(U_n_cols);
|
|
|
|
arma_extra_debug_print("lapack::getrf()");
|
|
lapack::getrf(&n_rows, &n_cols, U.memptr(), &n_rows, ipiv.memptr(), &info);
|
|
|
|
// take into account that Fortran counts from 1
|
|
arrayops::inplace_minus(ipiv.memptr(), blas_int(1), ipiv.n_elem);
|
|
|
|
status = (info == 0);
|
|
}
|
|
#endif
|
|
|
|
L.copy_size(U);
|
|
|
|
for(uword col=0; col < U_n_cols; ++col)
|
|
{
|
|
for(uword row=0; (row < col) && (row < U_n_rows); ++row)
|
|
{
|
|
L.at(row,col) = eT(0);
|
|
}
|
|
|
|
if( L.in_range(col,col) == true )
|
|
{
|
|
L.at(col,col) = eT(1);
|
|
}
|
|
|
|
for(uword row = (col+1); row < U_n_rows; ++row)
|
|
{
|
|
L.at(row,col) = U.at(row,col);
|
|
U.at(row,col) = eT(0);
|
|
}
|
|
}
|
|
|
|
return status;
|
|
}
|
|
#else
|
|
{
|
|
arma_stop("lu(): use of ATLAS or LAPACK must be enabled");
|
|
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::lu(Mat<eT>& L, Mat<eT>& U, Mat<eT>& P, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
podarray<blas_int> ipiv1;
|
|
const bool status = auxlib::lu(L, U, ipiv1, X);
|
|
|
|
if(status == false) { return false; }
|
|
|
|
if(U.is_empty())
|
|
{
|
|
// L and U have been already set to the correct empty matrices
|
|
P.eye(L.n_rows, L.n_rows);
|
|
return true;
|
|
}
|
|
|
|
const uword n = ipiv1.n_elem;
|
|
const uword P_rows = U.n_rows;
|
|
|
|
podarray<blas_int> ipiv2(P_rows);
|
|
|
|
const blas_int* ipiv1_mem = ipiv1.memptr();
|
|
blas_int* ipiv2_mem = ipiv2.memptr();
|
|
|
|
for(uword i=0; i<P_rows; ++i)
|
|
{
|
|
ipiv2_mem[i] = blas_int(i);
|
|
}
|
|
|
|
for(uword i=0; i<n; ++i)
|
|
{
|
|
const uword k = static_cast<uword>(ipiv1_mem[i]);
|
|
|
|
if( ipiv2_mem[i] != ipiv2_mem[k] )
|
|
{
|
|
std::swap( ipiv2_mem[i], ipiv2_mem[k] );
|
|
}
|
|
}
|
|
|
|
P.zeros(P_rows, P_rows);
|
|
|
|
for(uword row=0; row<P_rows; ++row)
|
|
{
|
|
P.at(row, static_cast<uword>(ipiv2_mem[row])) = eT(1);
|
|
}
|
|
|
|
if(L.n_cols > U.n_rows)
|
|
{
|
|
L.shed_cols(U.n_rows, L.n_cols-1);
|
|
}
|
|
|
|
if(U.n_rows > L.n_cols)
|
|
{
|
|
U.shed_rows(L.n_cols, U.n_rows-1);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::lu(Mat<eT>& L, Mat<eT>& U, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
podarray<blas_int> ipiv1;
|
|
const bool status = auxlib::lu(L, U, ipiv1, X);
|
|
|
|
if(status == false) { return false; }
|
|
|
|
if(U.is_empty())
|
|
{
|
|
// L and U have been already set to the correct empty matrices
|
|
return true;
|
|
}
|
|
|
|
const uword n = ipiv1.n_elem;
|
|
const uword P_rows = U.n_rows;
|
|
|
|
podarray<blas_int> ipiv2(P_rows);
|
|
|
|
const blas_int* ipiv1_mem = ipiv1.memptr();
|
|
blas_int* ipiv2_mem = ipiv2.memptr();
|
|
|
|
for(uword i=0; i<P_rows; ++i)
|
|
{
|
|
ipiv2_mem[i] = blas_int(i);
|
|
}
|
|
|
|
for(uword i=0; i<n; ++i)
|
|
{
|
|
const uword k = static_cast<uword>(ipiv1_mem[i]);
|
|
|
|
if( ipiv2_mem[i] != ipiv2_mem[k] )
|
|
{
|
|
std::swap( ipiv2_mem[i], ipiv2_mem[k] );
|
|
L.swap_rows( static_cast<uword>(ipiv2_mem[i]), static_cast<uword>(ipiv2_mem[k]) );
|
|
}
|
|
}
|
|
|
|
if(L.n_cols > U.n_rows)
|
|
{
|
|
L.shed_cols(U.n_rows, L.n_cols-1);
|
|
}
|
|
|
|
if(U.n_rows > L.n_cols)
|
|
{
|
|
U.shed_rows(L.n_cols, U.n_rows-1);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
|
|
|
|
|
|
//! eigen decomposition of general square matrix (real)
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_gen
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs,
|
|
const uword mode,
|
|
const Base<typename T1::pod_type,T1>& expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
|
|
Mat<T> X = expr.get_ref();
|
|
|
|
arma_debug_check( (X.is_square() == false), "eig_gen(): given matrix must be square sized" );
|
|
|
|
arma_debug_assert_blas_size(X);
|
|
|
|
if(X.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs.reset();
|
|
return true;
|
|
}
|
|
|
|
if(X.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(X.n_rows, 1);
|
|
|
|
Mat<T> tmp(1,1);
|
|
|
|
const bool calc_l = (mode == 1);
|
|
const bool calc_r = (mode == 2);
|
|
|
|
if(calc_l || calc_r)
|
|
{
|
|
vecs.set_size(X.n_rows, X.n_rows);
|
|
tmp.set_size(X.n_rows, X.n_rows);
|
|
}
|
|
|
|
podarray<T> junk(1);
|
|
|
|
char jobvl = (calc_l) ? 'V' : 'N';
|
|
char jobvr = (calc_r) ? 'V' : 'N';
|
|
blas_int N = blas_int(X.n_rows);
|
|
T* vl = (calc_l) ? tmp.memptr() : junk.memptr();
|
|
T* vr = (calc_r) ? tmp.memptr() : junk.memptr();
|
|
blas_int ldvl = (calc_l) ? blas_int(tmp.n_rows) : blas_int(1);
|
|
blas_int ldvr = (calc_r) ? blas_int(tmp.n_rows) : blas_int(1);
|
|
blas_int lwork = (calc_l || calc_r) ? (3 * ((std::max)(blas_int(1), 4*N)) ) : (3 * ((std::max)(blas_int(1), 3*N)) );
|
|
blas_int info = 0;
|
|
|
|
podarray<T> work( static_cast<uword>(lwork) );
|
|
|
|
podarray<T> vals_real(X.n_rows);
|
|
podarray<T> vals_imag(X.n_rows);
|
|
|
|
arma_extra_debug_print("lapack::geev() -- START");
|
|
lapack::geev(&jobvl, &jobvr, &N, X.memptr(), &N, vals_real.memptr(), vals_imag.memptr(), vl, &ldvl, vr, &ldvr, work.memptr(), &lwork, &info);
|
|
arma_extra_debug_print("lapack::geev() -- END");
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("reformatting eigenvalues and eigenvectors");
|
|
|
|
std::complex<T>* vals_mem = vals.memptr();
|
|
|
|
for(uword i=0; i < X.n_rows; ++i) { vals_mem[i] = std::complex<T>(vals_real[i], vals_imag[i]); }
|
|
|
|
if(calc_l || calc_r)
|
|
{
|
|
for(uword j=0; j < X.n_rows; ++j)
|
|
{
|
|
if( (j < (X.n_rows-1)) && (vals_mem[j] == std::conj(vals_mem[j+1])) )
|
|
{
|
|
for(uword i=0; i < X.n_rows; ++i)
|
|
{
|
|
vecs.at(i,j) = std::complex<T>( tmp.at(i,j), tmp.at(i,j+1) );
|
|
vecs.at(i,j+1) = std::complex<T>( tmp.at(i,j), -tmp.at(i,j+1) );
|
|
}
|
|
|
|
++j;
|
|
}
|
|
else
|
|
{
|
|
for(uword i=0; i<X.n_rows; ++i)
|
|
{
|
|
vecs.at(i,j) = std::complex<T>(tmp.at(i,j), T(0));
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs);
|
|
arma_ignore(mode);
|
|
arma_ignore(expr);
|
|
arma_stop("eig_gen(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigen decomposition of general square matrix (complex)
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_gen
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs,
|
|
const uword mode,
|
|
const Base< std::complex<typename T1::pod_type>, T1 >& expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename std::complex<T> eT;
|
|
|
|
Mat<eT> X = expr.get_ref();
|
|
|
|
arma_debug_check( (X.is_square() == false), "eig_gen(): given matrix must be square sized" );
|
|
|
|
arma_debug_assert_blas_size(X);
|
|
|
|
if(X.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs.reset();
|
|
return true;
|
|
}
|
|
|
|
if(X.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(X.n_rows, 1);
|
|
|
|
const bool calc_l = (mode == 1);
|
|
const bool calc_r = (mode == 2);
|
|
|
|
if(calc_l || calc_r) { vecs.set_size(X.n_rows, X.n_rows); }
|
|
|
|
podarray<eT> junk(1);
|
|
|
|
char jobvl = (calc_l) ? 'V' : 'N';
|
|
char jobvr = (calc_r) ? 'V' : 'N';
|
|
blas_int N = blas_int(X.n_rows);
|
|
eT* vl = (calc_l) ? vecs.memptr() : junk.memptr();
|
|
eT* vr = (calc_r) ? vecs.memptr() : junk.memptr();
|
|
blas_int ldvl = (calc_l) ? blas_int(vecs.n_rows) : blas_int(1);
|
|
blas_int ldvr = (calc_r) ? blas_int(vecs.n_rows) : blas_int(1);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1), 2*N));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray< T> rwork( static_cast<uword>(2*N) );
|
|
|
|
arma_extra_debug_print("lapack::cx_geev() -- START");
|
|
lapack::cx_geev(&jobvl, &jobvr, &N, X.memptr(), &N, vals.memptr(), vl, &ldvl, vr, &ldvr, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
arma_extra_debug_print("lapack::cx_geev() -- END");
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs);
|
|
arma_ignore(mode);
|
|
arma_ignore(expr);
|
|
arma_stop("eig_gen(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigen decomposition of general square matrix (real); calculate both left and right eigenvectors
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_gen_dual
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat<typename T1::pod_type>& vecs_l,
|
|
Mat<typename T1::pod_type>& vecs_r,
|
|
const Base<typename T1::pod_type,T1>& expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
|
|
Mat<T> X = expr.get_ref();
|
|
|
|
arma_debug_check( (X.is_square() == false), "eig_gen(): given matrix must be square sized" );
|
|
|
|
arma_debug_assert_blas_size(X);
|
|
|
|
if(X.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs_l.reset();
|
|
vecs_r.reset();
|
|
return true;
|
|
}
|
|
|
|
if(X.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(X.n_rows, 1);
|
|
|
|
vecs_l.set_size(X.n_rows, X.n_rows);
|
|
vecs_r.set_size(X.n_rows, X.n_rows);
|
|
|
|
char jobvl = 'V';
|
|
char jobvr = 'V';
|
|
blas_int N = blas_int(X.n_rows);
|
|
blas_int ldvl = blas_int(vecs_l.n_rows);
|
|
blas_int ldvr = blas_int(vecs_r.n_rows);
|
|
blas_int lwork = (3 * ((std::max)(blas_int(1), 4*N)) );
|
|
blas_int info = 0;
|
|
|
|
podarray<T> work( static_cast<uword>(lwork) );
|
|
|
|
podarray<T> vals_real(X.n_rows);
|
|
podarray<T> vals_imag(X.n_rows);
|
|
|
|
arma_extra_debug_print("lapack::geev() -- START");
|
|
lapack::geev(&jobvl, &jobvr, &N, X.memptr(), &N, vals_real.memptr(), vals_imag.memptr(), vecs_l.memptr(), &ldvl, vecs_r.memptr(), &ldvr, work.memptr(), &lwork, &info);
|
|
arma_extra_debug_print("lapack::geev() -- END");
|
|
|
|
std::complex<T>* vals_mem = vals.memptr();
|
|
|
|
for(uword i=0; i < X.n_rows; ++i) { vals_mem[i] = std::complex<T>(vals_real[i], vals_imag[i]); }
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs_l);
|
|
arma_ignore(vecs_r);
|
|
arma_ignore(expr);
|
|
arma_stop("eig_gen(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigen decomposition of general square matrix (complex); calculate both left and right eigenvectors
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_gen_dual
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs_l,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs_r,
|
|
const Base< std::complex<typename T1::pod_type>, T1 >& expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename std::complex<T> eT;
|
|
|
|
Mat<eT> X = expr.get_ref();
|
|
|
|
arma_debug_check( (X.is_square() == false), "eig_gen(): given matrix must be square sized" );
|
|
|
|
arma_debug_assert_blas_size(X);
|
|
|
|
if(X.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs_l.reset();
|
|
vecs_r.reset();
|
|
return true;
|
|
}
|
|
|
|
if(X.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(X.n_rows, 1);
|
|
|
|
vecs_l.set_size(X.n_rows, X.n_rows);
|
|
vecs_r.set_size(X.n_rows, X.n_rows);
|
|
|
|
char jobvl = 'V';
|
|
char jobvr = 'V';
|
|
blas_int N = blas_int(X.n_rows);
|
|
blas_int ldvl = blas_int(vecs_l.n_rows);
|
|
blas_int ldvr = blas_int(vecs_r.n_rows);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1), 2*N));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray< T> rwork( static_cast<uword>(2*N) );
|
|
|
|
arma_extra_debug_print("lapack::cx_geev() -- START");
|
|
lapack::cx_geev(&jobvl, &jobvr, &N, X.memptr(), &N, vals.memptr(), vecs_l.memptr(), &ldvl, vecs_r.memptr(), &ldvr, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
arma_extra_debug_print("lapack::cx_geev() -- END");
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs_l);
|
|
arma_ignore(vecs_r);
|
|
arma_ignore(expr);
|
|
arma_stop("eig_gen(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigendecomposition of general square real matrix pair (real)
|
|
template<typename T1, typename T2>
|
|
inline
|
|
bool
|
|
auxlib::eig_pair
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs,
|
|
const uword mode,
|
|
const Base<typename T1::pod_type,T1>& A_expr,
|
|
const Base<typename T1::pod_type,T2>& B_expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<T> A(A_expr.get_ref());
|
|
Mat<T> B(B_expr.get_ref());
|
|
|
|
arma_debug_check( ((A.is_square() == false) || (B.is_square() == false)), "eig_pair(): given matrices must be square sized" );
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "eig_pair(): given matrices must have the same size" );
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
if(A.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs.reset();
|
|
return true;
|
|
}
|
|
|
|
if(A.is_finite() == false) { return false; }
|
|
if(B.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(A.n_rows, 1);
|
|
|
|
Mat<T> tmp(1,1);
|
|
|
|
const bool calc_l = (mode == 1);
|
|
const bool calc_r = (mode == 2);
|
|
|
|
if(calc_l || calc_r)
|
|
{
|
|
vecs.set_size(A.n_rows, A.n_rows);
|
|
tmp.set_size(A.n_rows, A.n_rows);
|
|
}
|
|
|
|
podarray<T> junk(1);
|
|
|
|
char jobvl = (calc_l) ? 'V' : 'N';
|
|
char jobvr = (calc_r) ? 'V' : 'N';
|
|
blas_int N = blas_int(A.n_rows);
|
|
T* vl = (calc_l) ? tmp.memptr() : junk.memptr();
|
|
T* vr = (calc_r) ? tmp.memptr() : junk.memptr();
|
|
blas_int ldvl = (calc_l) ? blas_int(tmp.n_rows) : blas_int(1);
|
|
blas_int ldvr = (calc_r) ? blas_int(tmp.n_rows) : blas_int(1);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1), 8*N));
|
|
blas_int info = 0;
|
|
|
|
podarray<T> alphar(A.n_rows);
|
|
podarray<T> alphai(A.n_rows);
|
|
podarray<T> beta(A.n_rows);
|
|
|
|
podarray<T> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::ggev()");
|
|
lapack::ggev(&jobvl, &jobvr, &N, A.memptr(), &N, B.memptr(), &N, alphar.memptr(), alphai.memptr(), beta.memptr(), vl, &ldvl, vr, &ldvr, work.memptr(), &lwork, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
arma_extra_debug_print("reformatting eigenvalues and eigenvectors");
|
|
|
|
eT* vals_mem = vals.memptr();
|
|
const T* alphar_mem = alphar.memptr();
|
|
const T* alphai_mem = alphai.memptr();
|
|
const T* beta_mem = beta.memptr();
|
|
|
|
bool beta_has_zero = false;
|
|
|
|
for(uword j=0; j<A.n_rows; ++j)
|
|
{
|
|
const T alphai_val = alphai_mem[j];
|
|
const T beta_val = beta_mem[j];
|
|
|
|
const T re = alphar_mem[j] / beta_val;
|
|
const T im = alphai_val / beta_val;
|
|
|
|
beta_has_zero = (beta_has_zero || (beta_val == T(0)));
|
|
|
|
vals_mem[j] = std::complex<T>(re, im);
|
|
|
|
if( (alphai_val > T(0)) && (j < (A.n_rows-1)) )
|
|
{
|
|
++j;
|
|
vals_mem[j] = std::complex<T>(re,-im); // force exact conjugate
|
|
}
|
|
}
|
|
|
|
if(beta_has_zero) { arma_debug_warn("eig_pair(): given matrices appear ill-conditioned"); }
|
|
|
|
if(calc_l || calc_r)
|
|
{
|
|
for(uword j=0; j<A.n_rows; ++j)
|
|
{
|
|
if( (j < (A.n_rows-1)) && (vals_mem[j] == std::conj(vals_mem[j+1])) )
|
|
{
|
|
for(uword i=0; i<A.n_rows; ++i)
|
|
{
|
|
vecs.at(i,j) = std::complex<T>( tmp.at(i,j), tmp.at(i,j+1) );
|
|
vecs.at(i,j+1) = std::complex<T>( tmp.at(i,j), -tmp.at(i,j+1) );
|
|
}
|
|
|
|
++j;
|
|
}
|
|
else
|
|
{
|
|
for(uword i=0; i<A.n_rows; ++i)
|
|
{
|
|
vecs.at(i,j) = std::complex<T>(tmp.at(i,j), T(0));
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs);
|
|
arma_ignore(mode);
|
|
arma_ignore(A_expr);
|
|
arma_ignore(B_expr);
|
|
arma_stop("eig_pair(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigendecomposition of general square real matrix pair (complex)
|
|
template<typename T1, typename T2>
|
|
inline
|
|
bool
|
|
auxlib::eig_pair
|
|
(
|
|
Mat< std::complex<typename T1::pod_type> >& vals,
|
|
Mat< std::complex<typename T1::pod_type> >& vecs,
|
|
const uword mode,
|
|
const Base< std::complex<typename T1::pod_type>, T1 >& A_expr,
|
|
const Base< std::complex<typename T1::pod_type>, T2 >& B_expr
|
|
)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs);
|
|
arma_ignore(mode);
|
|
arma_ignore(A_expr);
|
|
arma_ignore(B_expr);
|
|
arma_stop("eig_pair() for complex matrices not available due to crippled LAPACK");
|
|
return false;
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename std::complex<T> eT;
|
|
|
|
Mat<eT> A(A_expr.get_ref());
|
|
Mat<eT> B(B_expr.get_ref());
|
|
|
|
arma_debug_check( ((A.is_square() == false) || (B.is_square() == false)), "eig_pair(): given matrices must be square sized" );
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "eig_pair(): given matrices must have the same size" );
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
if(A.is_empty())
|
|
{
|
|
vals.reset();
|
|
vecs.reset();
|
|
return true;
|
|
}
|
|
|
|
if(A.is_finite() == false) { return false; }
|
|
if(B.is_finite() == false) { return false; }
|
|
|
|
vals.set_size(A.n_rows, 1);
|
|
|
|
const bool calc_l = (mode == 1);
|
|
const bool calc_r = (mode == 2);
|
|
|
|
if(calc_l || calc_r) { vecs.set_size(A.n_rows, A.n_rows); }
|
|
|
|
podarray<eT> junk(1);
|
|
|
|
char jobvl = (calc_l) ? 'V' : 'N';
|
|
char jobvr = (calc_r) ? 'V' : 'N';
|
|
blas_int N = blas_int(A.n_rows);
|
|
eT* vl = (calc_l) ? vecs.memptr() : junk.memptr();
|
|
eT* vr = (calc_r) ? vecs.memptr() : junk.memptr();
|
|
blas_int ldvl = (calc_l) ? blas_int(vecs.n_rows) : blas_int(1);
|
|
blas_int ldvr = (calc_r) ? blas_int(vecs.n_rows) : blas_int(1);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1),2*N));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> alpha(A.n_rows);
|
|
podarray<eT> beta(A.n_rows);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray<T> rwork( static_cast<uword>(8*N) );
|
|
|
|
arma_extra_debug_print("lapack::cx_ggev()");
|
|
lapack::cx_ggev(&jobvl, &jobvr, &N, A.memptr(), &N, B.memptr(), &N, alpha.memptr(), beta.memptr(), vl, &ldvl, vr, &ldvr, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
eT* vals_mem = vals.memptr();
|
|
const eT* alpha_mem = alpha.memptr();
|
|
const eT* beta_mem = beta.memptr();
|
|
|
|
const std::complex<T> zero(T(0), T(0));
|
|
|
|
bool beta_has_zero = false;
|
|
|
|
for(uword i=0; i<A.n_rows; ++i)
|
|
{
|
|
const eT& beta_val = beta_mem[i];
|
|
|
|
vals_mem[i] = alpha_mem[i] / beta_val;
|
|
|
|
beta_has_zero = (beta_has_zero || (beta_val == zero));
|
|
}
|
|
|
|
if(beta_has_zero) { arma_debug_warn("eig_pair(): given matrices appear ill-conditioned"); }
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(vals);
|
|
arma_ignore(vecs);
|
|
arma_ignore(mode);
|
|
arma_ignore(A_expr);
|
|
arma_ignore(B_expr);
|
|
arma_stop("eig_pair(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues of a symmetric real matrix
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym(Col<eT>& eigval, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
arma_debug_check( (A.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(A.is_empty())
|
|
{
|
|
eigval.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
eigval.set_size(A.n_rows);
|
|
|
|
char jobz = 'N';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(A.n_rows);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 3*N-1) );
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::syev()");
|
|
lapack::syev(&jobz, &uplo, &N, A.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues of a hermitian complex matrix
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym(Col<T>& eigval, const Base<std::complex<T>,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
arma_debug_check( (A.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(A.is_empty())
|
|
{
|
|
eigval.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
eigval.set_size(A.n_rows);
|
|
|
|
char jobz = 'N';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(A.n_rows);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 2*N-1) );
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray<T> rwork( static_cast<uword>( (std::max)(blas_int(1), 3*N-2) ) );
|
|
|
|
arma_extra_debug_print("lapack::heev()");
|
|
lapack::heev(&jobz, &uplo, &N, A.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues and eigenvectors of a symmetric real matrix
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym(Col<eT>& eigval, Mat<eT>& eigvec, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
eigvec = X.get_ref();
|
|
|
|
arma_debug_check( (eigvec.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(eigvec.is_empty())
|
|
{
|
|
eigval.reset();
|
|
eigvec.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(eigvec);
|
|
|
|
eigval.set_size(eigvec.n_rows);
|
|
|
|
char jobz = 'V';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(eigvec.n_rows);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 3*N-1) );
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::syev()");
|
|
lapack::syev(&jobz, &uplo, &N, eigvec.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(eigvec);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues and eigenvectors of a hermitian complex matrix
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym(Col<T>& eigval, Mat< std::complex<T> >& eigvec, const Base<std::complex<T>,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename std::complex<T> eT;
|
|
|
|
eigvec = X.get_ref();
|
|
|
|
arma_debug_check( (eigvec.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(eigvec.is_empty())
|
|
{
|
|
eigval.reset();
|
|
eigvec.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(eigvec);
|
|
|
|
eigval.set_size(eigvec.n_rows);
|
|
|
|
char jobz = 'V';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(eigvec.n_rows);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 2*N-1) );
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray<T> rwork( static_cast<uword>((std::max)(blas_int(1), 3*N-2)) );
|
|
|
|
arma_extra_debug_print("lapack::heev()");
|
|
lapack::heev(&jobz, &uplo, &N, eigvec.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(eigvec);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues and eigenvectors of a symmetric real matrix (divide and conquer algorithm)
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym_dc(Col<eT>& eigval, Mat<eT>& eigvec, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
eigvec = X.get_ref();
|
|
|
|
arma_debug_check( (eigvec.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(eigvec.is_empty())
|
|
{
|
|
eigval.reset();
|
|
eigvec.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(eigvec);
|
|
|
|
eigval.set_size(eigvec.n_rows);
|
|
|
|
char jobz = 'V';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(eigvec.n_rows);
|
|
blas_int lwork = 2 * (1 + 6*N + 2*(N*N));
|
|
blas_int liwork = 3 * (3 + 5*N);
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>( lwork) );
|
|
podarray<blas_int> iwork( static_cast<uword>(liwork) );
|
|
|
|
arma_extra_debug_print("lapack::syevd()");
|
|
lapack::syevd(&jobz, &uplo, &N, eigvec.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, iwork.memptr(), &liwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(eigvec);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! eigenvalues and eigenvectors of a hermitian complex matrix (divide and conquer algorithm)
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::eig_sym_dc(Col<T>& eigval, Mat< std::complex<T> >& eigvec, const Base<std::complex<T>,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename std::complex<T> eT;
|
|
|
|
eigvec = X.get_ref();
|
|
|
|
arma_debug_check( (eigvec.is_square() == false), "eig_sym(): given matrix must be square sized" );
|
|
|
|
if(eigvec.is_empty())
|
|
{
|
|
eigval.reset();
|
|
eigvec.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(eigvec);
|
|
|
|
eigval.set_size(eigvec.n_rows);
|
|
|
|
char jobz = 'V';
|
|
char uplo = 'U';
|
|
|
|
blas_int N = blas_int(eigvec.n_rows);
|
|
blas_int lwork = 2 * (2*N + N*N);
|
|
blas_int lrwork = 2 * (1 + 5*N + 2*(N*N));
|
|
blas_int liwork = 3 * (3 + 5*N);
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray<T> rwork( static_cast<uword>(lrwork) );
|
|
podarray<blas_int> iwork( static_cast<uword>(liwork) );
|
|
|
|
arma_extra_debug_print("lapack::heevd()");
|
|
lapack::heevd(&jobz, &uplo, &N, eigvec.memptr(), &N, eigval.memptr(), work.memptr(), &lwork, rwork.memptr(), &lrwork, iwork.memptr(), &liwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(eigval);
|
|
arma_ignore(eigvec);
|
|
arma_ignore(X);
|
|
arma_stop("eig_sym(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::chol(Mat<eT>& out, const Base<eT,T1>& X, const uword layout)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
out = X.get_ref();
|
|
|
|
arma_debug_check( (out.is_square() == false), "chol(): given matrix must be square sized" );
|
|
|
|
if(out.is_empty()) { return true; }
|
|
|
|
arma_debug_assert_blas_size(out);
|
|
|
|
const uword out_n_rows = out.n_rows;
|
|
|
|
char uplo = (layout == 0) ? 'U' : 'L';
|
|
blas_int n = out_n_rows;
|
|
blas_int info = 0;
|
|
|
|
arma_extra_debug_print("lapack::potrf()");
|
|
lapack::potrf(&uplo, &n, out.memptr(), &n, &info);
|
|
|
|
if(layout == 0)
|
|
{
|
|
for(uword col=0; col < out_n_rows; ++col)
|
|
{
|
|
eT* colptr = out.colptr(col);
|
|
|
|
for(uword row=(col+1); row < out_n_rows; ++row) { colptr[row] = eT(0); }
|
|
}
|
|
}
|
|
else
|
|
{
|
|
for(uword col=1; col < out_n_rows; ++col)
|
|
{
|
|
eT* colptr = out.colptr(col);
|
|
|
|
for(uword row=0; row < col; ++row) { colptr[row] = eT(0); }
|
|
}
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(X);
|
|
arma_ignore(layout);
|
|
|
|
arma_stop("chol(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::qr(Mat<eT>& Q, Mat<eT>& R, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
R = X.get_ref();
|
|
|
|
const uword R_n_rows = R.n_rows;
|
|
const uword R_n_cols = R.n_cols;
|
|
|
|
if(R.is_empty())
|
|
{
|
|
Q.eye(R_n_rows, R_n_rows);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(R);
|
|
|
|
blas_int m = static_cast<blas_int>(R_n_rows);
|
|
blas_int n = static_cast<blas_int>(R_n_cols);
|
|
blas_int lwork = 0;
|
|
blas_int lwork_min = (std::max)(blas_int(1), (std::max)(m,n)); // take into account requirements of geqrf() _and_ orgqr()/ungqr()
|
|
blas_int k = (std::min)(m,n);
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> tau( static_cast<uword>(k) );
|
|
|
|
eT work_query[2];
|
|
blas_int lwork_query = -1;
|
|
|
|
arma_extra_debug_print("lapack::geqrf()");
|
|
lapack::geqrf(&m, &n, R.memptr(), &m, tau.memptr(), &work_query[0], &lwork_query, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork_proposed = static_cast<blas_int>( access::tmp_real(work_query[0]) );
|
|
|
|
lwork = (std::max)(lwork_proposed, lwork_min);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::geqrf()");
|
|
lapack::geqrf(&m, &n, R.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
Q.set_size(R_n_rows, R_n_rows);
|
|
|
|
arrayops::copy( Q.memptr(), R.memptr(), (std::min)(Q.n_elem, R.n_elem) );
|
|
|
|
//
|
|
// construct R
|
|
|
|
for(uword col=0; col < R_n_cols; ++col)
|
|
{
|
|
for(uword row=(col+1); row < R_n_rows; ++row)
|
|
{
|
|
R.at(row,col) = eT(0);
|
|
}
|
|
}
|
|
|
|
|
|
if( (is_float<eT>::value) || (is_double<eT>::value) )
|
|
{
|
|
arma_extra_debug_print("lapack::orgqr()");
|
|
lapack::orgqr(&m, &m, &k, Q.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
}
|
|
else
|
|
if( (is_supported_complex_float<eT>::value) || (is_supported_complex_double<eT>::value) )
|
|
{
|
|
arma_extra_debug_print("lapack::ungqr()");
|
|
lapack::ungqr(&m, &m, &k, Q.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(Q);
|
|
arma_ignore(R);
|
|
arma_ignore(X);
|
|
arma_stop("qr(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::qr_econ(Mat<eT>& Q, Mat<eT>& R, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
if(is_Mat<T1>::value)
|
|
{
|
|
const unwrap<T1> tmp(X.get_ref());
|
|
const Mat<eT>& M = tmp.M;
|
|
|
|
if(M.n_rows < M.n_cols)
|
|
{
|
|
return auxlib::qr(Q, R, X);
|
|
}
|
|
}
|
|
|
|
Q = X.get_ref();
|
|
|
|
const uword Q_n_rows = Q.n_rows;
|
|
const uword Q_n_cols = Q.n_cols;
|
|
|
|
if( Q_n_rows <= Q_n_cols )
|
|
{
|
|
return auxlib::qr(Q, R, Q);
|
|
}
|
|
|
|
if(Q.is_empty())
|
|
{
|
|
Q.set_size(Q_n_rows, 0 );
|
|
R.set_size(0, Q_n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(Q);
|
|
|
|
blas_int m = static_cast<blas_int>(Q_n_rows);
|
|
blas_int n = static_cast<blas_int>(Q_n_cols);
|
|
blas_int lwork = 0;
|
|
blas_int lwork_min = (std::max)(blas_int(1), (std::max)(m,n)); // take into account requirements of geqrf() _and_ orgqr()/ungqr()
|
|
blas_int k = (std::min)(m,n);
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> tau( static_cast<uword>(k) );
|
|
|
|
eT work_query[2];
|
|
blas_int lwork_query = -1;
|
|
|
|
arma_extra_debug_print("lapack::geqrf()");
|
|
lapack::geqrf(&m, &n, Q.memptr(), &m, tau.memptr(), &work_query[0], &lwork_query, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork_proposed = static_cast<blas_int>( access::tmp_real(work_query[0]) );
|
|
|
|
lwork = (std::max)(lwork_proposed, lwork_min);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::geqrf()");
|
|
lapack::geqrf(&m, &n, Q.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
R.set_size(Q_n_cols, Q_n_cols);
|
|
|
|
//
|
|
// construct R
|
|
|
|
for(uword col=0; col < Q_n_cols; ++col)
|
|
{
|
|
for(uword row=0; row <= col; ++row)
|
|
{
|
|
R.at(row,col) = Q.at(row,col);
|
|
}
|
|
|
|
for(uword row=(col+1); row < Q_n_cols; ++row)
|
|
{
|
|
R.at(row,col) = eT(0);
|
|
}
|
|
}
|
|
|
|
if( (is_float<eT>::value) || (is_double<eT>::value) )
|
|
{
|
|
arma_extra_debug_print("lapack::orgqr()");
|
|
lapack::orgqr(&m, &n, &k, Q.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
}
|
|
else
|
|
if( (is_supported_complex_float<eT>::value) || (is_supported_complex_double<eT>::value) )
|
|
{
|
|
arma_extra_debug_print("lapack::ungqr()");
|
|
lapack::ungqr(&m, &n, &k, Q.memptr(), &m, tau.memptr(), work.memptr(), &lwork, &info);
|
|
}
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(Q);
|
|
arma_ignore(R);
|
|
arma_ignore(X);
|
|
arma_stop("qr_econ(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Col<eT>& S, const Base<eT,T1>& X, uword& X_n_rows, uword& X_n_cols)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
X_n_rows = A.n_rows;
|
|
X_n_cols = A.n_cols;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
Mat<eT> U(1, 1);
|
|
Mat<eT> V(1, A.n_cols);
|
|
|
|
char jobu = 'N';
|
|
char jobvt = 'N';
|
|
|
|
blas_int m = A.n_rows;
|
|
blas_int n = A.n_cols;
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = A.n_rows;
|
|
blas_int ldu = U.n_rows;
|
|
blas_int ldvt = V.n_rows;
|
|
blas_int lwork = 0;
|
|
blas_int lwork_min = (std::max)( blas_int(1), (std::max)( (3*min_mn + (std::max)(m,n)), 5*min_mn ) );
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
eT work_query[2];
|
|
blas_int lwork_query = -1;
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, &work_query[0], &lwork_query, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork_proposed = static_cast<blas_int>( work_query[0] );
|
|
|
|
lwork = (std::max)(lwork_proposed, lwork_min);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(X_n_rows);
|
|
arma_ignore(X_n_cols);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Col<T>& S, const Base<std::complex<T>, T1>& X, uword& X_n_rows, uword& X_n_cols)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
X_n_rows = A.n_rows;
|
|
X_n_cols = A.n_cols;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
Mat<eT> U(1, 1);
|
|
Mat<eT> V(1, A.n_cols);
|
|
|
|
char jobu = 'N';
|
|
char jobvt = 'N';
|
|
|
|
blas_int m = A.n_rows;
|
|
blas_int n = A.n_cols;
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = A.n_rows;
|
|
blas_int ldu = U.n_rows;
|
|
blas_int ldvt = V.n_rows;
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 2*min_mn+(std::max)(m,n) ) );
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray< T> rwork( static_cast<uword>(5*min_mn) );
|
|
|
|
blas_int lwork_tmp = -1; // let gesvd_() calculate the optimum size of the workspace
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork_tmp, rwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int proposed_lwork = static_cast<blas_int>(real(work[0]));
|
|
|
|
if(proposed_lwork > lwork)
|
|
{
|
|
lwork = proposed_lwork;
|
|
work.set_size( static_cast<uword>(lwork) );
|
|
}
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(X_n_rows);
|
|
arma_ignore(X_n_cols);
|
|
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Col<eT>& S, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
uword junk;
|
|
return auxlib::svd(S, X, junk, junk);
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Col<T>& S, const Base<std::complex<T>, T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
uword junk;
|
|
return auxlib::svd(S, X, junk, junk);
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Mat<eT>& U, Col<eT>& S, Mat<eT>& V, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye(A.n_rows, A.n_rows);
|
|
S.reset();
|
|
V.eye(A.n_cols, A.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
U.set_size(A.n_rows, A.n_rows);
|
|
V.set_size(A.n_cols, A.n_cols);
|
|
|
|
char jobu = 'A';
|
|
char jobvt = 'A';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork_min = (std::max)( blas_int(1), (std::max)( (3*min_mn + (std::max)(m,n)), 5*min_mn ) );
|
|
blas_int lwork = 0;
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
// let gesvd_() calculate the optimum size of the workspace
|
|
eT work_query[2];
|
|
blas_int lwork_query = -1;
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, &work_query[0], &lwork_query, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork_proposed = static_cast<blas_int>( work_query[0] );
|
|
|
|
lwork = (std::max)(lwork_proposed, lwork_min);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, &info);
|
|
|
|
op_strans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd(Mat< std::complex<T> >& U, Col<T>& S, Mat< std::complex<T> >& V, const Base< std::complex<T>, T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye(A.n_rows, A.n_rows);
|
|
S.reset();
|
|
V.eye(A.n_cols, A.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
U.set_size(A.n_rows, A.n_rows);
|
|
V.set_size(A.n_cols, A.n_cols);
|
|
|
|
char jobu = 'A';
|
|
char jobvt = 'A';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), 2*min_mn + (std::max)(m,n) ) );
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<T> rwork( static_cast<uword>(5*min_mn) );
|
|
|
|
blas_int lwork_tmp = -1; // let gesvd_() calculate the optimum size of the workspace
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork_tmp, rwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int proposed_lwork = static_cast<blas_int>(real(work[0]));
|
|
|
|
if(proposed_lwork > lwork)
|
|
{
|
|
lwork = proposed_lwork;
|
|
work.set_size( static_cast<uword>(lwork) );
|
|
}
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
op_htrans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_econ(Mat<eT>& U, Col<eT>& S, Mat<eT>& V, const Base<eT,T1>& X, const char mode)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye();
|
|
S.reset();
|
|
V.eye();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
blas_int ldu = 0;
|
|
blas_int ldvt = 0;
|
|
|
|
char jobu = char(0);
|
|
char jobvt = char(0);
|
|
|
|
if(mode == 'l')
|
|
{
|
|
jobu = 'S';
|
|
jobvt = 'N';
|
|
|
|
ldu = m;
|
|
ldvt = 1;
|
|
|
|
U.set_size( static_cast<uword>(ldu), static_cast<uword>(min_mn) );
|
|
V.reset();
|
|
}
|
|
|
|
if(mode == 'r')
|
|
{
|
|
jobu = 'N';
|
|
jobvt = 'S';
|
|
|
|
ldu = 1;
|
|
ldvt = (std::min)(m,n);
|
|
|
|
U.reset();
|
|
V.set_size( static_cast<uword>(ldvt), static_cast<uword>(n) );
|
|
}
|
|
|
|
if(mode == 'b')
|
|
{
|
|
jobu = 'S';
|
|
jobvt = 'S';
|
|
|
|
ldu = m;
|
|
ldvt = (std::min)(m,n);
|
|
|
|
U.set_size( static_cast<uword>(ldu), static_cast<uword>(min_mn) );
|
|
V.set_size( static_cast<uword>(ldvt), static_cast<uword>(n ) );
|
|
}
|
|
|
|
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), (std::max)( (3*min_mn + (std::max)(m,n)), 5*min_mn ) ) );
|
|
blas_int info = 0;
|
|
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
blas_int lwork_tmp = -1; // let gesvd_() calculate the optimum size of the workspace
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork_tmp, &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int proposed_lwork = static_cast<blas_int>(work[0]);
|
|
|
|
if(proposed_lwork > lwork)
|
|
{
|
|
lwork = proposed_lwork;
|
|
work.set_size( static_cast<uword>(lwork) );
|
|
}
|
|
|
|
arma_extra_debug_print("lapack::gesvd()");
|
|
lapack::gesvd<eT>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, &info);
|
|
|
|
op_strans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_ignore(mode);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_econ(Mat< std::complex<T> >& U, Col<T>& S, Mat< std::complex<T> >& V, const Base< std::complex<T>, T1>& X, const char mode)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye();
|
|
S.reset();
|
|
V.eye();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
blas_int ldu = 0;
|
|
blas_int ldvt = 0;
|
|
|
|
char jobu = char(0);
|
|
char jobvt = char(0);
|
|
|
|
if(mode == 'l')
|
|
{
|
|
jobu = 'S';
|
|
jobvt = 'N';
|
|
|
|
ldu = m;
|
|
ldvt = 1;
|
|
|
|
U.set_size( static_cast<uword>(ldu), static_cast<uword>(min_mn) );
|
|
V.reset();
|
|
}
|
|
|
|
if(mode == 'r')
|
|
{
|
|
jobu = 'N';
|
|
jobvt = 'S';
|
|
|
|
ldu = 1;
|
|
ldvt = (std::min)(m,n);
|
|
|
|
U.reset();
|
|
V.set_size( static_cast<uword>(ldvt), static_cast<uword>(n) );
|
|
}
|
|
|
|
if(mode == 'b')
|
|
{
|
|
jobu = 'S';
|
|
jobvt = 'S';
|
|
|
|
ldu = m;
|
|
ldvt = (std::min)(m,n);
|
|
|
|
U.set_size( static_cast<uword>(ldu), static_cast<uword>(min_mn) );
|
|
V.set_size( static_cast<uword>(ldvt), static_cast<uword>(n) );
|
|
}
|
|
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), (std::max)( (3*min_mn + (std::max)(m,n)), 5*min_mn ) ) );
|
|
blas_int info = 0;
|
|
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<T> rwork( static_cast<uword>(5*min_mn) );
|
|
|
|
blas_int lwork_tmp = -1; // let gesvd_() calculate the optimum size of the workspace
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork_tmp, rwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int proposed_lwork = static_cast<blas_int>(real(work[0]));
|
|
|
|
if(proposed_lwork > lwork)
|
|
{
|
|
lwork = proposed_lwork;
|
|
work.set_size( static_cast<uword>(lwork) );
|
|
}
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvd()");
|
|
lapack::cx_gesvd<T>(&jobu, &jobvt, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), &info);
|
|
|
|
op_htrans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_ignore(mode);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Col<eT>& S, const Base<eT,T1>& X, uword& X_n_rows, uword& X_n_cols)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
X_n_rows = A.n_rows;
|
|
X_n_cols = A.n_cols;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
Mat<eT> U(1, 1);
|
|
Mat<eT> V(1, 1);
|
|
|
|
char jobz = 'N';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork = 3 * ( 3*min_mn + std::max( std::max(m,n), 7*min_mn ) );
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::gesdd()");
|
|
lapack::gesdd<eT>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, iwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(X_n_rows);
|
|
arma_ignore(X_n_cols);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Col<T>& S, const Base<std::complex<T>, T1>& X, uword& X_n_rows, uword& X_n_cols)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_extra_debug_print("auxlib::svd_dc(): redirecting to auxlib::svd() due to crippled LAPACK");
|
|
|
|
return auxlib::svd(S, X, X_n_rows, X_n_cols);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
X_n_rows = A.n_rows;
|
|
X_n_cols = A.n_cols;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
Mat<eT> U(1, 1);
|
|
Mat<eT> V(1, 1);
|
|
|
|
char jobz = 'N';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork = 3 * (2*min_mn + std::max(m,n));
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<T> rwork( static_cast<uword>(7*min_mn) ); // LAPACK 3.4.2 docs state 5*min(m,n), while zgesdd() seems to write past the end
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::cx_gesdd()");
|
|
lapack::cx_gesdd<T>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), iwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(X_n_rows);
|
|
arma_ignore(X_n_cols);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Col<eT>& S, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
uword junk;
|
|
return auxlib::svd_dc(S, X, junk, junk);
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Col<T>& S, const Base<std::complex<T>, T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
uword junk;
|
|
return auxlib::svd_dc(S, X, junk, junk);
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Mat<eT>& U, Col<eT>& S, Mat<eT>& V, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye(A.n_rows, A.n_rows);
|
|
S.reset();
|
|
V.eye(A.n_cols, A.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
U.set_size(A.n_rows, A.n_rows);
|
|
V.set_size(A.n_cols, A.n_cols);
|
|
|
|
char jobz = 'A';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int max_mn = (std::max)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork1 = 3*min_mn*min_mn + (std::max)( max_mn, 4*min_mn*min_mn + 4*min_mn );
|
|
blas_int lwork2 = 3*min_mn + (std::max)( max_mn, 4*min_mn*min_mn + 3*min_mn + max_mn );
|
|
blas_int lwork = 2 * ((std::max)(lwork1, lwork2)); // due to differences between lapack 3.1 and 3.4
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::gesdd()");
|
|
lapack::gesdd<eT>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, iwork.memptr(), &info);
|
|
|
|
op_strans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc(Mat< std::complex<T> >& U, Col<T>& S, Mat< std::complex<T> >& V, const Base< std::complex<T>, T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_extra_debug_print("auxlib::svd_dc(): redirecting to auxlib::svd() due to crippled LAPACK");
|
|
|
|
return auxlib::svd(U, S, V, X);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye(A.n_rows, A.n_rows);
|
|
S.reset();
|
|
V.eye(A.n_cols, A.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
U.set_size(A.n_rows, A.n_rows);
|
|
V.set_size(A.n_cols, A.n_cols);
|
|
|
|
char jobz = 'A';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int max_mn = (std::max)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = blas_int(U.n_rows);
|
|
blas_int ldvt = blas_int(V.n_rows);
|
|
blas_int lwork = 2 * (min_mn*min_mn + 2*min_mn + max_mn);
|
|
blas_int lrwork1 = 5*min_mn*min_mn + 7*min_mn;
|
|
blas_int lrwork2 = min_mn * ((std::max)(5*min_mn+7, 2*max_mn + 2*min_mn+1));
|
|
blas_int lrwork = (std::max)(lrwork1, lrwork2); // due to differences between lapack 3.1 and 3.4
|
|
blas_int info = 0;
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<T> rwork( static_cast<uword>(lrwork ) );
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::cx_gesdd()");
|
|
lapack::cx_gesdd<T>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), iwork.memptr(), &info);
|
|
|
|
op_htrans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc_econ(Mat<eT>& U, Col<eT>& S, Mat<eT>& V, const Base<eT,T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
char jobz = 'S';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int max_mn = (std::max)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = m;
|
|
blas_int ldvt = min_mn;
|
|
blas_int lwork1 = 3*min_mn*min_mn + (std::max)( max_mn, 4*min_mn*min_mn + 4*min_mn );
|
|
blas_int lwork2 = 3*min_mn + (std::max)( max_mn, 4*min_mn*min_mn + 3*min_mn + max_mn );
|
|
blas_int lwork = 2 * ((std::max)(lwork1, lwork2)); // due to differences between lapack 3.1 and 3.4
|
|
blas_int info = 0;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye();
|
|
S.reset();
|
|
V.eye( static_cast<uword>(n), static_cast<uword>(min_mn) );
|
|
return true;
|
|
}
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
U.set_size( static_cast<uword>(m), static_cast<uword>(min_mn) );
|
|
|
|
V.set_size( static_cast<uword>(min_mn), static_cast<uword>(n) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::gesdd()");
|
|
lapack::gesdd<eT>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, iwork.memptr(), &info);
|
|
|
|
op_strans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::svd_dc_econ(Mat< std::complex<T> >& U, Col<T>& S, Mat< std::complex<T> >& V, const Base< std::complex<T>, T1>& X)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_extra_debug_print("auxlib::svd_dc_econ(): redirecting to auxlib::svd_econ() due to crippled LAPACK");
|
|
|
|
return auxlib::svd_econ(U, S, V, X, 'b');
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
Mat<eT> A(X.get_ref());
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
char jobz = 'S';
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int min_mn = (std::min)(m,n);
|
|
blas_int max_mn = (std::max)(m,n);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldu = m;
|
|
blas_int ldvt = min_mn;
|
|
blas_int lwork = 2 * (min_mn*min_mn + 2*min_mn + max_mn);
|
|
blas_int lrwork1 = 5*min_mn*min_mn + 7*min_mn;
|
|
blas_int lrwork2 = min_mn * ((std::max)(5*min_mn+7, 2*max_mn + 2*min_mn+1));
|
|
blas_int lrwork = (std::max)(lrwork1, lrwork2); // due to differences between lapack 3.1 and 3.4
|
|
blas_int info = 0;
|
|
|
|
if(A.is_empty())
|
|
{
|
|
U.eye();
|
|
S.reset();
|
|
V.eye( static_cast<uword>(n), static_cast<uword>(min_mn) );
|
|
return true;
|
|
}
|
|
|
|
S.set_size( static_cast<uword>(min_mn) );
|
|
|
|
U.set_size( static_cast<uword>(m), static_cast<uword>(min_mn) );
|
|
|
|
V.set_size( static_cast<uword>(min_mn), static_cast<uword>(n) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork ) );
|
|
podarray<T> rwork( static_cast<uword>(lrwork ) );
|
|
podarray<blas_int> iwork( static_cast<uword>(8*min_mn) );
|
|
|
|
arma_extra_debug_print("lapack::cx_gesdd()");
|
|
lapack::cx_gesdd<T>(&jobz, &m, &n, A.memptr(), &lda, S.memptr(), U.memptr(), &ldu, V.memptr(), &ldvt, work.memptr(), &lwork, rwork.memptr(), iwork.memptr(), &info);
|
|
|
|
op_htrans::apply_mat_inplace(V);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(V);
|
|
arma_ignore(X);
|
|
arma_stop("svd(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! solve a system of linear equations via LU decomposition
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_square_fast(Mat<typename T1::elem_type>& out, Mat<typename T1::elem_type>& A, const Base<typename T1::elem_type,T1>& B_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
typedef typename T1::elem_type eT;
|
|
|
|
const uword A_n_rows = A.n_rows;
|
|
|
|
if(A_n_rows <= 4)
|
|
{
|
|
Mat<eT> A_inv(A_n_rows, A_n_rows);
|
|
|
|
const bool status = auxlib::inv_noalias_tinymat(A_inv, A, A_n_rows);
|
|
|
|
if(status == true)
|
|
{
|
|
const unwrap<T1> U(B_expr.get_ref());
|
|
const Mat<eT>& B = U.M;
|
|
|
|
const uword B_n_rows = B.n_rows;
|
|
const uword B_n_cols = B.n_cols;
|
|
|
|
arma_debug_check( (A_n_rows != B_n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B_n_cols);
|
|
return true;
|
|
}
|
|
|
|
if(&out != &B)
|
|
{
|
|
out.set_size(A_n_rows, B_n_cols);
|
|
|
|
gemm_emul<false,false,false,false>::apply(out, A_inv, B);
|
|
}
|
|
else
|
|
{
|
|
Mat<eT> tmp(A_n_rows, B_n_cols);
|
|
|
|
gemm_emul<false,false,false,false>::apply(tmp, A_inv, B);
|
|
|
|
out.steal_mem(tmp);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
}
|
|
|
|
out = B_expr.get_ref();
|
|
|
|
const uword B_n_rows = out.n_rows;
|
|
const uword B_n_cols = out.n_cols;
|
|
|
|
arma_debug_check( (A_n_rows != B_n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || out.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B_n_cols);
|
|
return true;
|
|
}
|
|
|
|
#if defined(ARMA_USE_ATLAS)
|
|
{
|
|
arma_debug_assert_atlas_size(A);
|
|
|
|
podarray<int> ipiv(A_n_rows + 2); // +2 for paranoia: old versions of Atlas might be trashing memory
|
|
|
|
arma_extra_debug_print("atlas::clapack_gesv()");
|
|
int info = atlas::clapack_gesv<eT>(atlas::CblasColMajor, A_n_rows, B_n_cols, A.memptr(), A_n_rows, ipiv.memptr(), out.memptr(), A_n_rows);
|
|
|
|
return (info == 0);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
blas_int n = blas_int(A_n_rows); // assuming A is square
|
|
blas_int lda = blas_int(A_n_rows);
|
|
blas_int ldb = blas_int(A_n_rows);
|
|
blas_int nrhs = blas_int(B_n_cols);
|
|
blas_int info = blas_int(0);
|
|
|
|
podarray<blas_int> ipiv(A_n_rows + 2); // +2 for paranoia: some versions of Lapack might be trashing memory
|
|
|
|
arma_extra_debug_print("lapack::gesv()");
|
|
lapack::gesv<eT>(&n, &nrhs, A.memptr(), &lda, ipiv.memptr(), out.memptr(), &ldb, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_stop("solve(): use of ATLAS or LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! solve a system of linear equations via LU decomposition with refinement (real matrices)
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_square_refine(Mat<typename T1::pod_type>& out, typename T1::pod_type& out_rcond, Mat<typename T1::pod_type>& A, const Base<typename T1::pod_type,T1>& B_expr, const bool equilibrate)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type eT;
|
|
|
|
Mat<eT> B = B_expr.get_ref(); // B is overwritten by lapack::gesvx()
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_rows, B.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,B);
|
|
|
|
out.set_size(A.n_rows, B.n_cols);
|
|
|
|
char fact = (equilibrate) ? 'E' : 'N';
|
|
char trans = 'N';
|
|
char equed = char(0);
|
|
blas_int n = blas_int(A.n_rows);
|
|
blas_int nrhs = blas_int(B.n_cols);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldaf = blas_int(A.n_rows);
|
|
blas_int ldb = blas_int(A.n_rows);
|
|
blas_int ldx = blas_int(A.n_rows);
|
|
blas_int info = blas_int(0);
|
|
eT rcond = eT(0);
|
|
|
|
Mat<eT> AF(A.n_rows, A.n_rows);
|
|
|
|
podarray<blas_int> IPIV( A.n_rows);
|
|
podarray<eT> R( A.n_rows);
|
|
podarray<eT> C( A.n_rows);
|
|
podarray<eT> FERR( B.n_cols);
|
|
podarray<eT> BERR( B.n_cols);
|
|
podarray<eT> WORK(4*A.n_rows);
|
|
podarray<blas_int> IWORK( A.n_rows);
|
|
|
|
arma_extra_debug_print("lapack::gesvx()");
|
|
lapack::gesvx
|
|
(
|
|
&fact, &trans, &n, &nrhs,
|
|
A.memptr(), &lda,
|
|
AF.memptr(), &ldaf,
|
|
IPIV.memptr(),
|
|
&equed,
|
|
R.memptr(),
|
|
C.memptr(),
|
|
B.memptr(), &ldb,
|
|
out.memptr(), &ldx,
|
|
&rcond,
|
|
FERR.memptr(),
|
|
BERR.memptr(),
|
|
WORK.memptr(),
|
|
IWORK.memptr(),
|
|
&info
|
|
);
|
|
|
|
// if(info == (n+1)) { arma_debug_warn("solve(): matrix appears singular to working precision; rcond = ", rcond); }
|
|
//
|
|
// const bool singular = ( (info > 0) && (info <= n) );
|
|
//
|
|
// return (singular == false);
|
|
|
|
out_rcond = rcond;
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(out_rcond);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! solve a system of linear equations via LU decomposition with refinement (complex matrices)
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_square_refine(Mat< std::complex<typename T1::pod_type> >& out, typename T1::pod_type& out_rcond, Mat< std::complex<typename T1::pod_type> >& A, const Base<std::complex<typename T1::pod_type>,T1>& B_expr, const bool equilibrate)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_ignore(out_rcond);
|
|
arma_ignore(equilibrate);
|
|
|
|
arma_debug_warn("solve(): refinement and/or equilibration not done due to crippled LAPACK");
|
|
|
|
return auxlib::solve_square_fast(out, A, B_expr);
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename std::complex<T> eT;
|
|
|
|
Mat<eT> B = B_expr.get_ref(); // B is overwritten by lapack::cx_gesvx()
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_rows, B.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,B);
|
|
|
|
out.set_size(A.n_rows, B.n_cols);
|
|
|
|
char fact = (equilibrate) ? 'E' : 'N';
|
|
char trans = 'N';
|
|
char equed = char(0);
|
|
blas_int n = blas_int(A.n_rows);
|
|
blas_int nrhs = blas_int(B.n_cols);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldaf = blas_int(A.n_rows);
|
|
blas_int ldb = blas_int(A.n_rows);
|
|
blas_int ldx = blas_int(A.n_rows);
|
|
blas_int info = blas_int(0);
|
|
T rcond = T(0);
|
|
|
|
Mat<eT> AF(A.n_rows, A.n_rows);
|
|
|
|
podarray<blas_int> IPIV( A.n_rows);
|
|
podarray< T> R( A.n_rows);
|
|
podarray< T> C( A.n_rows);
|
|
podarray< T> FERR( B.n_cols);
|
|
podarray< T> BERR( B.n_cols);
|
|
podarray<eT> WORK(2*A.n_rows);
|
|
podarray< T> RWORK(2*A.n_rows);
|
|
|
|
arma_extra_debug_print("lapack::cx_gesvx()");
|
|
lapack::cx_gesvx
|
|
(
|
|
&fact, &trans, &n, &nrhs,
|
|
A.memptr(), &lda,
|
|
AF.memptr(), &ldaf,
|
|
IPIV.memptr(),
|
|
&equed,
|
|
R.memptr(),
|
|
C.memptr(),
|
|
B.memptr(), &ldb,
|
|
out.memptr(), &ldx,
|
|
&rcond,
|
|
FERR.memptr(),
|
|
BERR.memptr(),
|
|
WORK.memptr(),
|
|
RWORK.memptr(),
|
|
&info
|
|
);
|
|
|
|
// if(info == (n+1)) { arma_debug_warn("solve(): matrix appears singular to working precision; rcond = ", rcond); }
|
|
//
|
|
// const bool singular = ( (info > 0) && (info <= n) );
|
|
//
|
|
// return (singular == false);
|
|
|
|
out_rcond = rcond;
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(out_rcond);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//! solve a non-square full-rank system via QR or LQ decomposition
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_approx_fast(Mat<typename T1::elem_type>& out, Mat<typename T1::elem_type>& A, const Base<typename T1::elem_type,T1>& B_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::elem_type eT;
|
|
|
|
const unwrap<T1> U(B_expr.get_ref());
|
|
const Mat<eT>& B = U.M;
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,B);
|
|
|
|
Mat<eT> tmp( (std::max)(A.n_rows, A.n_cols), B.n_cols );
|
|
|
|
if(size(tmp) == size(B))
|
|
{
|
|
tmp = B;
|
|
}
|
|
else
|
|
{
|
|
tmp.zeros();
|
|
tmp(0,0, size(B)) = B;
|
|
}
|
|
|
|
char trans = 'N';
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldb = blas_int(tmp.n_rows);
|
|
blas_int nrhs = blas_int(B.n_cols);
|
|
blas_int mn = (std::min)(m,n);
|
|
blas_int lwork = 3 * ( (std::max)(blas_int(1), mn + (std::max)(mn, nrhs)) );
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::gels()");
|
|
lapack::gels<eT>( &trans, &m, &n, &nrhs, A.memptr(), &lda, tmp.memptr(), &ldb, work.memptr(), &lwork, &info );
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
if(tmp.n_rows == A.n_cols)
|
|
{
|
|
out.steal_mem(tmp);
|
|
}
|
|
else
|
|
{
|
|
out = tmp.head_rows(A.n_cols);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_approx_svd(Mat<typename T1::pod_type>& out, Mat<typename T1::pod_type>& A, const Base<typename T1::pod_type,T1>& B_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type eT;
|
|
|
|
const unwrap<T1> U(B_expr.get_ref());
|
|
const Mat<eT>& B = U.M;
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,B);
|
|
|
|
Mat<eT> tmp( (std::max)(A.n_rows, A.n_cols), B.n_cols );
|
|
|
|
if(size(tmp) == size(B))
|
|
{
|
|
tmp = B;
|
|
}
|
|
else
|
|
{
|
|
tmp.zeros();
|
|
tmp(0,0, size(B)) = B;
|
|
}
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int nrhs = blas_int(B.n_cols);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldb = blas_int(tmp.n_rows);
|
|
eT rcond = eT(-1); // -1 means "use machine precision"
|
|
blas_int rank = blas_int(0);
|
|
blas_int info = blas_int(0);
|
|
|
|
const uword min_mn = (std::min)(A.n_rows, A.n_cols);
|
|
|
|
podarray<eT> S(min_mn);
|
|
|
|
|
|
blas_int ispec = blas_int(9);
|
|
|
|
const char* const_name = (is_float<eT>::value) ? "SGELSD" : "DGELSD";
|
|
const char* const_opts = "";
|
|
|
|
char* name = const_cast<char*>(const_name);
|
|
char* opts = const_cast<char*>(const_opts);
|
|
|
|
blas_int n1 = m;
|
|
blas_int n2 = n;
|
|
blas_int n3 = nrhs;
|
|
blas_int n4 = lda;
|
|
|
|
blas_int smlsiz = (std::max)( blas_int(25), lapack::laenv(&ispec, name, opts, &n1, &n2, &n3, &n4) ); // in case lapack::laenv() returns -1
|
|
blas_int smlsiz_p1 = blas_int(1) + smlsiz;
|
|
|
|
blas_int nlvl = (std::max)( blas_int(0), blas_int(1) + blas_int( std::log(double(min_mn) / double(smlsiz_p1))/double(0.69314718055994530942) ) );
|
|
blas_int liwork = (std::max)( blas_int(1), (blas_int(3)*blas_int(min_mn)*nlvl + blas_int(11)*blas_int(min_mn)) );
|
|
|
|
podarray<blas_int> iwork( static_cast<uword>(liwork) );
|
|
|
|
eT work_query[2];
|
|
blas_int lwork_query = blas_int(-1);
|
|
|
|
arma_extra_debug_print("lapack::gelsd()");
|
|
lapack::gelsd(&m, &n, &nrhs, A.memptr(), &lda, tmp.memptr(), &ldb, S.memptr(), &rcond, &rank, &work_query[0], &lwork_query, iwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork = static_cast<blas_int>( access::tmp_real(work_query[0]) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::gelsd()");
|
|
lapack::gelsd(&m, &n, &nrhs, A.memptr(), &lda, tmp.memptr(), &ldb, S.memptr(), &rcond, &rank, work.memptr(), &lwork, iwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
if(tmp.n_rows == A.n_cols)
|
|
{
|
|
out.steal_mem(tmp);
|
|
}
|
|
else
|
|
{
|
|
out = tmp.head_rows(A.n_cols);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_approx_svd(Mat< std::complex<typename T1::pod_type> >& out, Mat< std::complex<typename T1::pod_type> >& A, const Base<std::complex<typename T1::pod_type>,T1>& B_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_debug_warn("solve() for rank-deficient matrices not available due to crippled LAPACK");
|
|
return false;
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename std::complex<T> eT;
|
|
|
|
const unwrap<T1> U(B_expr.get_ref());
|
|
const Mat<eT>& B = U.M;
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || B.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B.n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,B);
|
|
|
|
Mat<eT> tmp( (std::max)(A.n_rows, A.n_cols), B.n_cols );
|
|
|
|
if(size(tmp) == size(B))
|
|
{
|
|
tmp = B;
|
|
}
|
|
else
|
|
{
|
|
tmp.zeros();
|
|
tmp(0,0, size(B)) = B;
|
|
}
|
|
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_cols);
|
|
blas_int nrhs = blas_int(B.n_cols);
|
|
blas_int lda = blas_int(A.n_rows);
|
|
blas_int ldb = blas_int(tmp.n_rows);
|
|
T rcond = T(-1); // -1 means "use machine precision"
|
|
blas_int rank = blas_int(0);
|
|
blas_int info = blas_int(0);
|
|
|
|
const uword min_mn = (std::min)(A.n_rows, A.n_cols);
|
|
|
|
podarray<T> S(min_mn);
|
|
|
|
blas_int ispec = blas_int(9);
|
|
|
|
const char* const_name = (is_float<T>::value) ? "CGELSD" : "ZGELSD";
|
|
const char* const_opts = "";
|
|
|
|
char* name = const_cast<char*>(const_name);
|
|
char* opts = const_cast<char*>(const_opts);
|
|
|
|
blas_int n1 = m;
|
|
blas_int n2 = n;
|
|
blas_int n3 = nrhs;
|
|
blas_int n4 = lda;
|
|
|
|
blas_int smlsiz = (std::max)( blas_int(25), lapack::laenv(&ispec, name, opts, &n1, &n2, &n3, &n4) ); // in case lapack::laenv() returns -1
|
|
blas_int smlsiz_p1 = blas_int(1) + smlsiz;
|
|
|
|
blas_int nlvl = (std::max)( blas_int(0), blas_int(1) + blas_int( std::log(double(min_mn) / double(smlsiz_p1))/double(0.69314718055994530942) ) );
|
|
|
|
blas_int lrwork = (m >= n)
|
|
? blas_int(10)*n + blas_int(2)*n*smlsiz + blas_int(8)*n*nlvl + blas_int(3)*smlsiz*nrhs + (std::max)( (smlsiz_p1)*(smlsiz_p1), n*(blas_int(1)+nrhs) + blas_int(2)*nrhs )
|
|
: blas_int(10)*m + blas_int(2)*m*smlsiz + blas_int(8)*m*nlvl + blas_int(3)*smlsiz*nrhs + (std::max)( (smlsiz_p1)*(smlsiz_p1), n*(blas_int(1)+nrhs) + blas_int(2)*nrhs );
|
|
|
|
blas_int liwork = (std::max)( blas_int(1), (blas_int(3)*blas_int(min_mn)*nlvl + blas_int(11)*blas_int(min_mn)) );
|
|
|
|
podarray<T> rwork( static_cast<uword>(lrwork) );
|
|
podarray<blas_int> iwork( static_cast<uword>(liwork) );
|
|
|
|
eT work_query[2];
|
|
blas_int lwork_query = blas_int(-1);
|
|
|
|
arma_extra_debug_print("lapack::cx_gelsd()");
|
|
lapack::cx_gelsd(&m, &n, &nrhs, A.memptr(), &lda, tmp.memptr(), &ldb, S.memptr(), &rcond, &rank, &work_query[0], &lwork_query, rwork.memptr(), iwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
blas_int lwork = static_cast<blas_int>( access::tmp_real( work_query[0]) );
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
|
|
arma_extra_debug_print("lapack::cx_gelsd()");
|
|
lapack::cx_gelsd(&m, &n, &nrhs, A.memptr(), &lda, tmp.memptr(), &ldb, S.memptr(), &rcond, &rank, work.memptr(), &lwork, rwork.memptr(), iwork.memptr(), &info);
|
|
|
|
if(info != 0) { return false; }
|
|
|
|
if(tmp.n_rows == A.n_cols)
|
|
{
|
|
out.steal_mem(tmp);
|
|
}
|
|
else
|
|
{
|
|
out = tmp.head_rows(A.n_cols);
|
|
}
|
|
|
|
return true;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T1>
|
|
inline
|
|
bool
|
|
auxlib::solve_tri(Mat<typename T1::elem_type>& out, const Mat<typename T1::elem_type>& A, const Base<typename T1::elem_type,T1>& B_expr, const uword layout)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
out = B_expr.get_ref();
|
|
|
|
const uword B_n_rows = out.n_rows;
|
|
const uword B_n_cols = out.n_cols;
|
|
|
|
arma_debug_check( (A.n_rows != B_n_rows), "solve(): number of rows in the given matrices must be the same" );
|
|
|
|
if(A.is_empty() || out.is_empty())
|
|
{
|
|
out.zeros(A.n_cols, B_n_cols);
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A,out);
|
|
|
|
char uplo = (layout == 0) ? 'U' : 'L';
|
|
char trans = 'N';
|
|
char diag = 'N';
|
|
blas_int n = blas_int(A.n_rows);
|
|
blas_int nrhs = blas_int(B_n_cols);
|
|
blas_int info = 0;
|
|
|
|
arma_extra_debug_print("lapack::trtrs()");
|
|
lapack::trtrs(&uplo, &trans, &diag, &n, &nrhs, A.memptr(), &n, out.memptr(), &n, &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(out);
|
|
arma_ignore(A);
|
|
arma_ignore(B_expr);
|
|
arma_ignore(layout);
|
|
arma_stop("solve(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//
|
|
// Schur decomposition
|
|
|
|
template<typename eT, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::schur(Mat<eT>& U, Mat<eT>& S, const Base<eT,T1>& X, const bool calc_U)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
S = X.get_ref();
|
|
|
|
arma_debug_check( (S.is_square() == false), "schur(): given matrix must be square sized" );
|
|
|
|
if(S.is_empty())
|
|
{
|
|
U.reset();
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(S);
|
|
|
|
const uword S_n_rows = S.n_rows;
|
|
|
|
if(calc_U) { U.set_size(S_n_rows, S_n_rows); } else { U.set_size(1,1); }
|
|
|
|
char jobvs = calc_U ? 'V' : 'N';
|
|
char sort = 'N';
|
|
void* select = 0;
|
|
blas_int n = blas_int(S_n_rows);
|
|
blas_int sdim = 0;
|
|
blas_int ldvs = calc_U ? n : blas_int(1);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1), 3*n));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> wr(S_n_rows);
|
|
podarray<eT> wi(S_n_rows);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray<blas_int> bwork(S_n_rows);
|
|
|
|
arma_extra_debug_print("lapack::gees()");
|
|
lapack::gees(&jobvs, &sort, select, &n, S.memptr(), &n, &sdim, wr.memptr(), wi.memptr(), U.memptr(), &ldvs, work.memptr(), &lwork, bwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_stop("schur(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T, typename T1>
|
|
inline
|
|
bool
|
|
auxlib::schur(Mat<std::complex<T> >& U, Mat<std::complex<T> >& S, const Base<std::complex<T>,T1>& X, const bool calc_U)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(calc_U);
|
|
arma_stop("schur() for complex matrices not available due to crippled LAPACK");
|
|
return false;
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef std::complex<T> eT;
|
|
|
|
S = X.get_ref();
|
|
|
|
arma_debug_check( (S.is_square() == false), "schur(): given matrix must be square sized" );
|
|
|
|
if(S.is_empty())
|
|
{
|
|
U.reset();
|
|
S.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(S);
|
|
|
|
const uword S_n_rows = S.n_rows;
|
|
|
|
if(calc_U) { U.set_size(S_n_rows, S_n_rows); } else { U.set_size(1,1); }
|
|
|
|
char jobvs = calc_U ? 'V' : 'N';
|
|
char sort = 'N';
|
|
void* select = 0;
|
|
blas_int n = blas_int(S_n_rows);
|
|
blas_int sdim = 0;
|
|
blas_int ldvs = calc_U ? n : blas_int(1);
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1), 2*n));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> w(S_n_rows);
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray< T> rwork(S_n_rows);
|
|
podarray<blas_int> bwork(S_n_rows);
|
|
|
|
arma_extra_debug_print("lapack::cx_gees()");
|
|
lapack::cx_gees(&jobvs, &sort, select, &n, S.memptr(), &n, &sdim, w.memptr(), U.memptr(), &ldvs, work.memptr(), &lwork, rwork.memptr(), bwork.memptr(), &info);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(U);
|
|
arma_ignore(S);
|
|
arma_ignore(X);
|
|
arma_ignore(calc_U);
|
|
arma_stop("schur(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//
|
|
// syl (solution of the Sylvester equation AX + XB = C)
|
|
|
|
template<typename eT>
|
|
inline
|
|
bool
|
|
auxlib::syl(Mat<eT>& X, const Mat<eT>& A, const Mat<eT>& B, const Mat<eT>& C)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
arma_debug_check( (A.is_square() == false) || (B.is_square() == false), "syl(): given matrices must be square sized" );
|
|
|
|
arma_debug_check( (C.n_rows != A.n_rows) || (C.n_cols != B.n_cols), "syl(): matrices are not conformant" );
|
|
|
|
if(A.is_empty() || B.is_empty() || C.is_empty())
|
|
{
|
|
X.reset();
|
|
return true;
|
|
}
|
|
|
|
Mat<eT> Z1, Z2, T1, T2;
|
|
|
|
const bool status_sd1 = auxlib::schur(Z1, T1, A);
|
|
const bool status_sd2 = auxlib::schur(Z2, T2, B);
|
|
|
|
if( (status_sd1 == false) || (status_sd2 == false) )
|
|
{
|
|
return false;
|
|
}
|
|
|
|
char trana = 'N';
|
|
char tranb = 'N';
|
|
blas_int isgn = +1;
|
|
blas_int m = blas_int(T1.n_rows);
|
|
blas_int n = blas_int(T2.n_cols);
|
|
|
|
eT scale = eT(0);
|
|
blas_int info = 0;
|
|
|
|
Mat<eT> Y = trans(Z1) * C * Z2;
|
|
|
|
arma_extra_debug_print("lapack::trsyl()");
|
|
lapack::trsyl<eT>(&trana, &tranb, &isgn, &m, &n, T1.memptr(), &m, T2.memptr(), &n, Y.memptr(), &m, &scale, &info);
|
|
|
|
//Y /= scale;
|
|
Y /= (-scale);
|
|
|
|
X = Z1 * Y * trans(Z2);
|
|
|
|
return (info >= 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(X);
|
|
arma_ignore(A);
|
|
arma_ignore(B);
|
|
arma_ignore(C);
|
|
arma_stop("syl(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//
|
|
// QZ decomposition of general square real matrix pair
|
|
|
|
template<typename T, typename T1, typename T2>
|
|
inline
|
|
bool
|
|
auxlib::qz(Mat<T>& A, Mat<T>& B, Mat<T>& vsl, Mat<T>& vsr, const Base<T,T1>& X_expr, const Base<T,T2>& Y_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
A = X_expr.get_ref();
|
|
B = Y_expr.get_ref();
|
|
|
|
arma_debug_check( ((A.is_square() == false) || (B.is_square() == false)), "qz(): given matrices must be square sized" );
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "qz(): given matrices must have the same size" );
|
|
|
|
if(A.is_empty())
|
|
{
|
|
A.reset();
|
|
B.reset();
|
|
vsl.reset();
|
|
vsr.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
vsl.set_size(A.n_rows, A.n_rows);
|
|
vsr.set_size(A.n_rows, A.n_rows);
|
|
|
|
char jobvsl = 'V';
|
|
char jobvsr = 'V';
|
|
char eigsort = 'N';
|
|
void* selctg = 0;
|
|
blas_int N = blas_int(A.n_rows);
|
|
blas_int sdim = 0;
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1),8*N+16));
|
|
blas_int info = 0;
|
|
|
|
podarray<T> alphar(A.n_rows);
|
|
podarray<T> alphai(A.n_rows);
|
|
podarray<T> beta(A.n_rows);
|
|
|
|
podarray<T> work( static_cast<uword>(lwork) );
|
|
podarray<T> bwork( static_cast<uword>(N) );
|
|
|
|
arma_extra_debug_print("lapack::gges()");
|
|
|
|
lapack::gges
|
|
(
|
|
&jobvsl, &jobvsr, &eigsort, selctg, &N,
|
|
A.memptr(), &N, B.memptr(), &N, &sdim,
|
|
alphar.memptr(), alphai.memptr(), beta.memptr(),
|
|
vsl.memptr(), &N, vsr.memptr(), &N,
|
|
work.memptr(), &lwork, bwork.memptr(),
|
|
&info
|
|
);
|
|
|
|
op_strans::apply_mat_inplace(vsl);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(A);
|
|
arma_ignore(B);
|
|
arma_ignore(vsl);
|
|
arma_ignore(vsr);
|
|
arma_ignore(X_expr);
|
|
arma_ignore(Y_expr);
|
|
arma_stop("qz(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
//
|
|
// QZ decomposition of general square complex matrix pair
|
|
|
|
template<typename T, typename T1, typename T2>
|
|
inline
|
|
bool
|
|
auxlib::qz(Mat< std::complex<T> >& A, Mat< std::complex<T> >& B, Mat< std::complex<T> >& vsl, Mat< std::complex<T> >& vsr, const Base< std::complex<T>, T1 >& X_expr, const Base< std::complex<T>, T2 >& Y_expr)
|
|
{
|
|
arma_extra_debug_sigprint();
|
|
|
|
#if (defined(ARMA_USE_LAPACK) && defined(ARMA_CRIPPLED_LAPACK))
|
|
{
|
|
arma_ignore(A);
|
|
arma_ignore(B);
|
|
arma_ignore(vsl);
|
|
arma_ignore(vsr);
|
|
arma_ignore(X_expr);
|
|
arma_ignore(Y_expr);
|
|
arma_stop("qz() for complex matrices not available due to crippled LAPACK");
|
|
return false;
|
|
}
|
|
#elif defined(ARMA_USE_LAPACK)
|
|
{
|
|
typedef typename std::complex<T> eT;
|
|
|
|
A = X_expr.get_ref();
|
|
B = Y_expr.get_ref();
|
|
|
|
arma_debug_check( ((A.is_square() == false) || (B.is_square() == false)), "qz(): given matrices must be square sized" );
|
|
|
|
arma_debug_check( (A.n_rows != B.n_rows), "qz(): given matrices must have the same size" );
|
|
|
|
if(A.is_empty())
|
|
{
|
|
A.reset();
|
|
B.reset();
|
|
vsl.reset();
|
|
vsr.reset();
|
|
return true;
|
|
}
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
vsl.set_size(A.n_rows, A.n_rows);
|
|
vsr.set_size(A.n_rows, A.n_rows);
|
|
|
|
char jobvsl = 'V';
|
|
char jobvsr = 'V';
|
|
char eigsort = 'N';
|
|
void* selctg = 0;
|
|
blas_int N = blas_int(A.n_rows);
|
|
blas_int sdim = 0;
|
|
blas_int lwork = 3 * ((std::max)(blas_int(1),2*N));
|
|
blas_int info = 0;
|
|
|
|
podarray<eT> alpha(A.n_rows);
|
|
podarray<eT> beta(A.n_rows);
|
|
|
|
podarray<eT> work( static_cast<uword>(lwork) );
|
|
podarray< T> rwork( static_cast<uword>(8*N) );
|
|
podarray< T> bwork( static_cast<uword>(N) );
|
|
|
|
arma_extra_debug_print("lapack::cx_gges()");
|
|
|
|
lapack::cx_gges
|
|
(
|
|
&jobvsl, &jobvsr, &eigsort, selctg, &N,
|
|
A.memptr(), &N, B.memptr(), &N, &sdim,
|
|
alpha.memptr(), beta.memptr(),
|
|
vsl.memptr(), &N, vsr.memptr(), &N,
|
|
work.memptr(), &lwork, rwork.memptr(), bwork.memptr(),
|
|
&info
|
|
);
|
|
|
|
op_htrans::apply_mat_inplace(vsl);
|
|
|
|
return (info == 0);
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(A);
|
|
arma_ignore(B);
|
|
arma_ignore(vsl);
|
|
arma_ignore(vsr);
|
|
arma_ignore(X_expr);
|
|
arma_ignore(Y_expr);
|
|
arma_stop("qz(): use of LAPACK must be enabled");
|
|
return false;
|
|
}
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
template<typename T1>
|
|
inline
|
|
typename T1::pod_type
|
|
auxlib::rcond(const Base<typename T1::pod_type,T1>& A_expr)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename T1::elem_type eT;
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A = A_expr.get_ref();
|
|
|
|
arma_debug_check( (A.is_square() == false), "rcond(): matrix must be square sized" );
|
|
|
|
if(A.is_empty()) { return Datum<T>::inf; }
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
char norm_id = '1';
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_rows); // assuming square matrix
|
|
blas_int lda = blas_int(A.n_rows);
|
|
T norm_val = T(0);
|
|
T rcond = T(0);
|
|
blas_int info = blas_int(0);
|
|
|
|
podarray<eT> work(4*A.n_rows);
|
|
podarray<blas_int> iwork(A.n_rows);
|
|
podarray<blas_int> ipiv( (std::min)(A.n_rows, A.n_cols) );
|
|
|
|
norm_val = lapack::lange(&norm_id, &m, &n, A.memptr(), &lda, work.memptr());
|
|
|
|
lapack::getrf(&m, &n, A.memptr(), &lda, ipiv.memptr(), &info);
|
|
|
|
if(info != blas_int(0)) { return T(0); }
|
|
|
|
lapack::gecon(&norm_id, &n, A.memptr(), &lda, &norm_val, &rcond, work.memptr(), iwork.memptr(), &info);
|
|
|
|
if(info != blas_int(0)) { return T(0); }
|
|
|
|
return rcond;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(A_expr);
|
|
arma_stop("rcond(): use of LAPACK must be enabled");
|
|
}
|
|
#endif
|
|
|
|
return T(0);
|
|
}
|
|
|
|
|
|
|
|
template<typename T1>
|
|
inline
|
|
typename T1::pod_type
|
|
auxlib::rcond(const Base<std::complex<typename T1::pod_type>,T1>& A_expr)
|
|
{
|
|
typedef typename T1::pod_type T;
|
|
typedef typename T1::elem_type eT;
|
|
|
|
#if defined(ARMA_USE_LAPACK)
|
|
{
|
|
Mat<eT> A = A_expr.get_ref();
|
|
|
|
arma_debug_check( (A.is_square() == false), "rcond(): matrix must be square sized" );
|
|
|
|
if(A.is_empty()) { return Datum<T>::inf; }
|
|
|
|
arma_debug_assert_blas_size(A);
|
|
|
|
char norm_id = '1';
|
|
blas_int m = blas_int(A.n_rows);
|
|
blas_int n = blas_int(A.n_rows); // assuming square matrix
|
|
blas_int lda = blas_int(A.n_rows);
|
|
T norm_val = T(0);
|
|
T rcond = T(0);
|
|
blas_int info = blas_int(0);
|
|
|
|
podarray< T> junk(1);
|
|
podarray<eT> work(2*A.n_rows);
|
|
podarray< T> rwork(2*A.n_rows);
|
|
podarray<blas_int> iwork(A.n_rows);
|
|
podarray<blas_int> ipiv( (std::min)(A.n_rows, A.n_cols) );
|
|
|
|
norm_val = lapack::lange(&norm_id, &m, &n, A.memptr(), &lda, junk.memptr());
|
|
|
|
lapack::getrf(&m, &n, A.memptr(), &lda, ipiv.memptr(), &info);
|
|
|
|
if(info != blas_int(0)) { return T(0); }
|
|
|
|
lapack::cx_gecon(&norm_id, &n, A.memptr(), &lda, &norm_val, &rcond, work.memptr(), rwork.memptr(), &info);
|
|
|
|
if(info != blas_int(0)) { return T(0); }
|
|
|
|
return rcond;
|
|
}
|
|
#else
|
|
{
|
|
arma_ignore(A_expr);
|
|
arma_stop("rcond(): use of LAPACK must be enabled");
|
|
}
|
|
#endif
|
|
|
|
return T(0);
|
|
}
|
|
|
|
|
|
|
|
//! @}
|