668 lines
24 KiB
C
668 lines
24 KiB
C
// Compile-time assertion that works without C11 _Static_assert: when COND is
// false the typedef'd array gets size -1, which is a compile error.
// MSG must be usable as an identifier suffix; it appears in the typedef name.
#define STATIC_ASSERT(COND, MSG) \
  typedef char static_assertion_##MSG[(COND) ? 1 : -1]
|
||
|
||
// Shorthand for gsl_complex_tostd(); presumably converts a gsl_complex to a
// C99 complex double (the helper is defined outside this file -- confirm).
#define cg2s(x) gsl_complex_tostd(x)
|
||
// Shorthand for gsl_complex_fromstd(); used in this file to pass C99
// complex double values to GSL routines expecting a gsl_complex.
#define cs2g(x) gsl_complex_fromstd(x)
|
||
|
||
#include <complex.h>
|
||
#include <lapacke.h>
|
||
#include <stdio.h>
|
||
#include <stdlib.h>
|
||
#include <math.h>
|
||
#include <time.h>
|
||
#include "qpms_error.h"
|
||
|
||
// Maybe GSL works?
|
||
#include <gsl/gsl_matrix.h>
|
||
#include <gsl/gsl_complex_math.h>
|
||
#include <gsl/gsl_linalg.h>
|
||
#include <gsl/gsl_blas.h>
|
||
#include <gsl/gsl_eigen.h>
|
||
|
||
#include "beyn.h"
|
||
// Square of x. This is a macro, so the argument is evaluated twice:
// do not pass expressions with side effects.
#define SQ(x) ((x) * (x))
|
||
|
||
// GSL matrix/vector buffers are cast to lapack_complex_double * when calling
// LAPACKE in this file, so both complex element types must have equal size.
STATIC_ASSERT((sizeof(lapack_complex_double) == sizeof(gsl_complex)), lapack_and_gsl_complex_must_be_consistent);
|
||
|
||
|
||
typedef struct BeynSolver
|
||
{
|
||
int M; // dimension of matrices
|
||
int L; // number of columns of VHat matrix
|
||
|
||
gsl_vector_complex *eigenvalues, *eigenvalue_errors;
|
||
gsl_matrix_complex *eigenvectors;
|
||
gsl_matrix_complex *A0, *A1, *A0_coarse, *A1_coarse, *MInvVHat;
|
||
gsl_matrix_complex *VHat;
|
||
gsl_vector *Sigma, *residuals;
|
||
} BeynSolver;
|
||
|
||
// constructor, destructor
|
||
BeynSolver *BeynSolver_create(int M, int L);
|
||
void BeynSolver_free(BeynSolver *solver);
|
||
|
||
// reset the random matrix VHat used in Beyn's algorithm
|
||
void BeynSolver_srandom(BeynSolver *solver, unsigned int RandSeed);
|
||
|
||
// Uniformly random number from interval [a, b].
// random() returns integers in [0, 2^31 - 1] (POSIX); that range is unrelated
// to RAND_MAX, which describes rand(), so the scale is spelled out here.
static double randU(double a, double b) {
  const double random_max = 2147483647.; // 2^31 - 1
  return a + (b - a) * random() * (1. / random_max);
}
|
||
|
||
// Random number from normal distribution (via Box-Muller transform, which is enough for our purposes).
|
||
static double randN(double Sigma, double Mu) {
|
||
double u1 = randU(0, 1);
|
||
double u2 = randU(0, 1);
|
||
return Mu + Sigma*sqrt(-2*log(u1))*cos(2.*M_PI*u2);
|
||
}
|
||
|
||
// Complex random number whose real and imaginary parts are both drawn
// from randN(sigma, mu).
static complex double zrandN(double sigma, double mu){
  const double re_part = randN(sigma, mu);
  const double im_part = randN(sigma, mu);
  return re_part + I*im_part;
}
|
||
|
||
// Square of a double.
static inline double dsq(double a) {
  const double squared = a * a;
  return squared;
}
|
||
|
||
static _Bool beyn_contour_ellipse_inside_test(struct beyn_contour_t *c, complex double z) {
|
||
double rRe = c->z_dz[c->n][0];
|
||
double rIm = c->z_dz[c->n][1];
|
||
complex double zn = z - c->centre;
|
||
return dsq(creal(zn)/rRe) + dsq(cimag(zn)/rIm) < 1;
|
||
}
|
||
|
||
beyn_contour_t *beyn_contour_ellipse(complex double centre, double rRe, double rIm, size_t n)
|
||
{
|
||
beyn_contour_t *c;
|
||
QPMS_CRASHING_MALLOC(c, sizeof(beyn_contour_t) + (n+1)*sizeof(c->z_dz[0]));
|
||
c->centre = centre;
|
||
c->n = n;
|
||
for(size_t i = 0; i < n; ++i) {
|
||
double t = i*2*M_PI/n;
|
||
double st = sin(t), ct = cos(t);
|
||
c->z_dz[i][0] = centre + ct*rRe + I*st*rIm;
|
||
c->z_dz[i][1] = (-rRe*st + I*rIm*ct) * (2*M_PI / n);
|
||
}
|
||
// We hide the half-axes metadata after the discretisation points.
|
||
c->z_dz[n][0] = rRe;
|
||
c->z_dz[n][1] = rIm;
|
||
c->inside_test = beyn_contour_ellipse_inside_test;
|
||
return c;
|
||
}
|
||
|
||
|
||
// Sets correct sign to zero for a given branch cut orientation
|
||
static inline complex double
|
||
align_zero(complex double z, beyn_contour_halfellipse_orientation or)
|
||
{
|
||
// Maybe redundant, TODO check the standard.
|
||
const double positive_zero = copysign(0., +1.);
|
||
const double negative_zero = copysign(0., -1.);
|
||
switch(or) { // ensure correct zero signs; CHECKME!!!
|
||
case BEYN_CONTOUR_HALFELLIPSE_RE_PLUS:
|
||
if(creal(z) == 0 && signbit(creal(z)))
|
||
z = positive_zero + I * cimag(z);
|
||
break;
|
||
case BEYN_CONTOUR_HALFELLIPSE_RE_MINUS:
|
||
if(creal(z) == 0 && !signbit(creal(z)))
|
||
z = negative_zero + I * cimag(z);
|
||
break;
|
||
case BEYN_CONTOUR_HALFELLIPSE_IM_PLUS:
|
||
if(cimag(z) == 0 && signbit(cimag(z)))
|
||
z = creal(z) + I * positive_zero;
|
||
break;
|
||
case BEYN_CONTOUR_HALFELLIPSE_IM_MINUS:
|
||
if(cimag(z) == 0 && !signbit(cimag(z)))
|
||
z = creal(z) + I * negative_zero;
|
||
break;
|
||
default: QPMS_WTF;
|
||
}
|
||
return z;
|
||
}
|
||
|
||
|
||
// Creates a half-elliptic integration contour: a half-ellipse arc closed by a
// straight segment through centre. The orientation selects which side of
// centre the arc lies on. n/2 points go to the straight segment, the rest
// to the arc. The returned object is heap-allocated.
beyn_contour_t *beyn_contour_halfellipse(complex double centre, double rRe,
    double rIm, size_t n, beyn_contour_halfellipse_orientation or)
{
  beyn_contour_t *contour;
  // Room for n points, one metadata entry and the orientation tag.
  QPMS_CRASHING_MALLOC(contour, sizeof(beyn_contour_t) + (n+1)*sizeof(contour->z_dz[0])
      + sizeof(beyn_contour_halfellipse_orientation));
  contour->centre = centre;
  contour->n = n;

  const size_t n_straight = n/2;
  const size_t n_arc = n - n_straight;

  // The contour is built in a reference frame (straight part of half-length l
  // along the real axis, arc of height h above it) and then multiplied by
  // rot to get the requested orientation.
  complex double rot;
  double l = rRe, h = rIm;
  switch(or) {
    case BEYN_CONTOUR_HALFELLIPSE_RE_PLUS:
      rot = -I;
      l = rIm; h = rRe;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_RE_MINUS:
      rot = I;
      l = rIm; h = rRe;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_IM_PLUS:
      rot = 1;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_IM_MINUS:
      rot = -1;
      break;
    default: QPMS_WTF;
  }

  // Arc: midpoint rule in the angle over (0, pi).
  for(size_t k = 0; k < n_arc; ++k) {
    const double phi = (k+0.5)*M_PI/n_arc;
    const double sine = sin(phi), cosine = cos(phi);
    contour->z_dz[k][0] = centre + rot*(cosine*l + I*sine*h);
    contour->z_dz[k][1] = rot * (-l*sine + I*h*cosine) * (M_PI / n_arc);
  }

  // Straight part: midpoint rule from -l to +l; the zero component of the
  // points gets the sign matching the orientation.
  for(size_t k = 0; k < n_straight; ++k) {
    const double pos = 0.5 * (1 - (double) n_straight) + k;
    contour->z_dz[n_arc + k][0] = align_zero(centre + rot * pos * 2 * l / n_straight, or);
    contour->z_dz[n_arc + k][1] = rot * 2 * l / n_straight;
  }

  // The half-axes metadata are hidden after the discretisation points ...
  contour->z_dz[n][0] = rRe;
  contour->z_dz[n][1] = rIm;
  // ... followed by the orientation tag (ugly).
  *((beyn_contour_halfellipse_orientation *) &contour->z_dz[n+1][0]) = or;
  contour->inside_test = NULL; // TODO beyn_contour_halfellipse_inside_test;
  return contour;
}
|
||
|
||
// Creates a "kidney" contour: a half-ellipse-like shape whose two corners
// between the straight edge and the big arc are rounded by small arcs.
//
// rounding must lie in [0, 0.5); it gives the distance of the small-arc
// centres from the straight edge as a fraction of the arc height.
// The contour is parametrised by t in [0, tmax) sampled with a uniform step;
// it starts at centre, follows the first half of the straight edge, the first
// small arc, the big arc, the second small arc and the rest of the straight
// edge. Every segment loop is bounded by i < n, so floating-point rounding in
// the segment limits can never make the shared index write past the n
// discretisation slots. The returned object is heap-allocated.
beyn_contour_t *beyn_contour_kidney(complex double centre, double rRe,
    double rIm, const double rounding, const size_t n, beyn_contour_halfellipse_orientation or)
{
  beyn_contour_t *c;
  QPMS_ENSURE(rounding >= 0 && rounding < .5, "rounding must lie in the interval [0, 0.5)");
  QPMS_CRASHING_MALLOC(c, sizeof(beyn_contour_t) + (n+1)*sizeof(c->z_dz[0])
      + sizeof(beyn_contour_halfellipse_orientation));
  c->centre = centre;
  c->n = n;
  // Reference frame: straight edge of half-length l along the real axis,
  // arc of height h; faktor rotates it to the requested orientation.
  complex double faktor;
  double l = rRe, h = rIm;
  switch(or) {
    case BEYN_CONTOUR_HALFELLIPSE_RE_PLUS:
      faktor = -I;
      l = rIm; h = rRe;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_RE_MINUS:
      faktor = I;
      l = rIm; h = rRe;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_IM_PLUS:
      faktor = 1;
      break;
    case BEYN_CONTOUR_HALFELLIPSE_IM_MINUS:
      faktor = -1;
      break;
    default: QPMS_WTF;
  }

  // Small circle centre coordinates.
  const double y = rounding * h; // distance from the cut / straight line
  const double x = sqrt(SQ(h - y) - SQ(y));

  // Angle at which the small arcs touch the big arc.
  const double alpha = asin(y/(h-y));
  const double ar = l/h; // aspect ratio

  // Parameter range (equal to the contour length if ar == 1)
  const double tmax = 2 * (x + (M_PI_2 + alpha) * y + (M_PI_2 - alpha) * h);
  const double dt = tmax / n;

  size_t i = 0; // shared across all segments
  double t;
  // Straight line, first part
  double t_lo = 0, t_hi = x;
  for(; t = i * dt, i < n && t <= t_hi; ++i) {
    c->z_dz[i][0] = align_zero(centre + (t - t_lo) * ar * faktor, or);
    c->z_dz[i][1] = dt * ar * faktor;
  }
  // First small arc
  t_lo = t_hi; t_hi = t_lo + (M_PI_2 + alpha) * y;
  for(; t = i * dt, i < n && t < t_hi; ++i) {
    double phi = (t - t_lo) / y - M_PI_2;
    c->z_dz[i][0] = centre + (ar * (x + y * cos(phi)) + y * (1 + sin(phi)) * I) * faktor;
    c->z_dz[i][1] = dt * (- ar * sin(phi) + cos(phi) * I) * faktor;
  }
  // Big arc
  t_lo = t_hi; t_hi = t_lo + (M_PI - 2 * alpha) * h;
  for(; t = i * dt, i < n && t < t_hi; ++i) {
    double phi = (t - t_lo) / h + alpha;
    c->z_dz[i][0] = centre + (ar * (h * cos(phi)) + h * sin(phi) * I) * faktor;
    c->z_dz[i][1] = dt * (- ar * sin(phi) + cos(phi) * I) * faktor;
  }
  // Second small arc
  t_lo = t_hi; t_hi = t_lo + (M_PI_2 + alpha) * y;
  for(; t = i * dt, i < n && t < t_hi; ++i) {
    double phi = (t - t_lo) / y + M_PI - alpha;
    c->z_dz[i][0] = centre + (ar * (- x + y * cos(phi)) + y * (1 + sin(phi)) * I) * faktor;
    c->z_dz[i][1] = dt * (- ar * sin(phi) + cos(phi) * I) * faktor;
  }
  // Straight line, second part: takes all remaining points.
  t_lo = t_hi;
  for(; t = i * dt, i < n; ++i) {
    c->z_dz[i][0] = align_zero(centre + (t - t_lo - x) * ar * faktor, or);
    c->z_dz[i][1] = dt * ar * faktor;
  }

#if 0 // TODO later
  // We hide the half-axes metadata after the discretisation points.
  c->z_dz[n][0] = rRe;
  c->z_dz[n][1] = rIm;
  // ugly...
  *((beyn_contour_halfellipse_orientation *) &c->z_dz[n+1][0]) = or;
#endif
  c->inside_test = NULL; // TODO beyn_contour_halfellipse_inside_test;
  return c;
}
|
||
|
||
// Releases a GSL-flavoured result together with all vectors and matrices it
// owns. Passing NULL is a no-op.
void beyn_result_gsl_free(beyn_result_gsl_t *r) {
  if(!r)
    return;
  gsl_vector_complex_free(r->eigval);
  gsl_vector_complex_free(r->eigval_err);
  gsl_vector_free(r->residuals);
  gsl_matrix_complex_free(r->eigvec);
  gsl_vector_free(r->ranktest_SV);
  free(r);
}
|
||
|
||
BeynSolver *BeynSolver_create(int M, int L)
|
||
{
|
||
BeynSolver *solver= (BeynSolver *)malloc(sizeof(*solver));
|
||
|
||
solver->M = M;
|
||
solver->L = L;
|
||
QPMS_ENSURE(L <= M, "We expect L <= M, but we got L = %d, M = %d ", L, M);
|
||
|
||
// storage for eigenvalues and eigenvectors
|
||
solver->eigenvalues = gsl_vector_complex_calloc(L);
|
||
solver->eigenvalue_errors = gsl_vector_complex_calloc(L);
|
||
solver->residuals = gsl_vector_calloc(L);
|
||
solver->eigenvectors = gsl_matrix_complex_calloc(M, L);
|
||
|
||
// storage for singular values, random VHat matrix, etc. used in algorithm
|
||
solver->A0 = gsl_matrix_complex_calloc(M,L);
|
||
solver->A1 = gsl_matrix_complex_calloc(M,L);
|
||
solver->A0_coarse = gsl_matrix_complex_calloc(M,L);
|
||
solver->A1_coarse = gsl_matrix_complex_calloc(M,L);
|
||
solver->MInvVHat = gsl_matrix_complex_calloc(M,L);
|
||
solver->VHat = gsl_matrix_complex_calloc(M,L);
|
||
solver->Sigma = gsl_vector_calloc(L);
|
||
// Beyn Step 1: Generate random matrix VHat
|
||
BeynSolver_srandom(solver,(unsigned)time(NULL));
|
||
|
||
return solver;
|
||
|
||
}
|
||
|
||
// Releases the solver and every vector/matrix it holds, including the result
// storage. Passing NULL is a no-op, as with free().
void BeynSolver_free(BeynSolver *solver)
{
  if(!solver)
    return;

  // result storage
  gsl_vector_complex_free(solver->eigenvalues);
  gsl_vector_complex_free(solver->eigenvalue_errors);
  gsl_matrix_complex_free(solver->eigenvectors);

  // working storage
  gsl_matrix_complex_free(solver->A0);
  gsl_matrix_complex_free(solver->A1);
  gsl_matrix_complex_free(solver->A0_coarse);
  gsl_matrix_complex_free(solver->A1_coarse);
  gsl_matrix_complex_free(solver->MInvVHat);
  gsl_vector_free(solver->Sigma);
  gsl_vector_free(solver->residuals);
  gsl_matrix_complex_free(solver->VHat);

  free(solver);
}
|
||
|
||
// Releases the solver object and its working matrices only. The eigenvalues,
// eigenvalue_errors, eigenvectors, residuals and Sigma members are NOT freed,
// so that the caller can keep using them after handing them over elsewhere.
// Passing NULL is a no-op.
void BeynSolver_free_partial(BeynSolver *solver)
{
  if(!solver)
    return;

  gsl_matrix_complex_free(solver->A0);
  gsl_matrix_complex_free(solver->A1);
  gsl_matrix_complex_free(solver->A0_coarse);
  gsl_matrix_complex_free(solver->A1_coarse);
  gsl_matrix_complex_free(solver->MInvVHat);
  gsl_matrix_complex_free(solver->VHat);

  free(solver);
}
|
||
|
||
// Seeds the random generator with RandSeed (or with the current time if
// RandSeed is 0) and refills solver->VHat with complex numbers from zrandN(1, 0).
void BeynSolver_srandom(BeynSolver *solver, unsigned int RandSeed)
{
  if (RandSeed==0)
    RandSeed=time(0);
  srandom(RandSeed);
  gsl_matrix_complex *VHat=solver->VHat;
  // size1/size2 are size_t, so the indices are size_t as well.
  for(size_t nr=0; nr<VHat->size1; nr++)
    for(size_t nc=0; nc<VHat->size2; nc++)
      gsl_matrix_complex_set(VHat,nr,nc,cs2g(zrandN(1, 0)));
}
|
||
|
||
|
||
/*
|
||
* linear-algebra manipulations on the A0 and A1 matrices
|
||
* (obtained via numerical quadrature) to extract eigenvalues
|
||
* and eigenvectors
|
||
*/
|
||
|
||
static int beyn_process_matrices(BeynSolver *solver, beyn_function_M_gsl_t M_function,
|
||
void *Params,
|
||
gsl_matrix_complex *A0, gsl_matrix_complex *A1, double complex z0,
|
||
gsl_vector_complex *eigenvalues, gsl_matrix_complex *eigenvectors, const double rank_tol, size_t rank_sel_min, const double res_tol)
|
||
{
|
||
const size_t m = solver->M;
|
||
const size_t l = solver->L;
|
||
gsl_vector *Sigma = solver->Sigma;
|
||
|
||
int verbose = 1; // TODO
|
||
|
||
// Beyn Step 3: Compute SVD: A0 = V0_full * Sigma * W0T_full
|
||
if(verbose) printf(" Beyn: computing SVD...\n");
|
||
gsl_matrix_complex* V0_full = gsl_matrix_complex_alloc(m,l);
|
||
gsl_matrix_complex_memcpy(V0_full,A0);
|
||
gsl_matrix_complex* W0T_full = gsl_matrix_complex_alloc(l,l);
|
||
QPMS_ENSURE(Sigma->stride == 1, "Sigma vector stride must be 1 for LAPACKE_zgesdd, got %zd.", Sigma->stride);
|
||
QPMS_ENSURE(V0_full->size1 >= V0_full->size2, "m = %zd, l = %zd, what the hell?");
|
||
QPMS_ENSURE_SUCCESS(LAPACKE_zgesdd(LAPACK_ROW_MAJOR, // A = U*Σ*conjg(V')
|
||
'O' /*jobz, 'O' overwrites a with U and saves conjg(V') in vt if m >= n, i.e. if M >= L, which holds*/,
|
||
V0_full->size1 /* m, number of rows */,
|
||
V0_full->size2 /* n, number of columns */,
|
||
(lapack_complex_double *)(V0_full->data) /*a*/,
|
||
V0_full->tda /*lda*/,
|
||
Sigma->data /*s*/,
|
||
NULL /*u; not used*/,
|
||
m /*ldu; should not be really used but lapacke requires it for some obscure reason*/,
|
||
(lapack_complex_double *)W0T_full->data /*vt*/,
|
||
W0T_full->tda /*ldvt*/
|
||
));
|
||
|
||
|
||
// Beyn Step 4: Rank test for Sigma
|
||
// compute effective rank K (number of eigenvalue candidates)
|
||
int K=0;
|
||
for (int k=0; k<Sigma->size /* this is l, actually */; k++) {
|
||
if (verbose) printf("Beyn: SV(%d)=%e\n",k,gsl_vector_get(Sigma, k));
|
||
if (k < rank_sel_min || gsl_vector_get(Sigma, k) > rank_tol)
|
||
K++;
|
||
}
|
||
if (verbose)printf(" Beyn: %d/%zd relevant singular values\n",K,l);
|
||
if (K==0) {
|
||
QPMS_WARN("no singular values found in Beyn eigensolver\n");
|
||
return 0;
|
||
}
|
||
|
||
// Beyn step 5: B = V0' * A1 * W0 * Sigma^-1
|
||
// set V0, W0T = matrices of first K right, left singular vectors
|
||
gsl_matrix_complex *V0 = gsl_matrix_complex_alloc(m,K);
|
||
gsl_matrix_complex *W0T= gsl_matrix_complex_alloc(K,l);
|
||
|
||
for (int k = 0; k < K; ++k) {
|
||
gsl_vector_complex_view tmp;
|
||
tmp = gsl_matrix_complex_column(V0_full, k);
|
||
gsl_matrix_complex_set_col(V0, k, &(tmp.vector));
|
||
tmp = gsl_matrix_complex_row(W0T_full, k);
|
||
gsl_matrix_complex_set_row(W0T, k, &(tmp.vector));
|
||
}
|
||
|
||
gsl_matrix_complex_free(V0_full);
|
||
gsl_matrix_complex_free(W0T_full);
|
||
|
||
gsl_matrix_complex *TM2 = gsl_matrix_complex_calloc(K,l);
|
||
gsl_matrix_complex *B = gsl_matrix_complex_calloc(K,K);
|
||
|
||
if(verbose) printf(" Multiplying V0*A1->TM...\n");
|
||
|
||
const gsl_complex one = gsl_complex_rect(1,0);
|
||
const gsl_complex zero = gsl_complex_rect(0,0);
|
||
gsl_blas_zgemm(CblasConjTrans, CblasNoTrans, one,
|
||
V0, A1, zero, TM2);
|
||
|
||
if(verbose) printf(" Multiplying TM*W0T->B...\n");
|
||
|
||
gsl_blas_zgemm(CblasNoTrans, CblasConjTrans, one,
|
||
TM2, W0T, zero, B);
|
||
|
||
gsl_matrix_complex_free(W0T);
|
||
gsl_matrix_complex_free(TM2);
|
||
|
||
if(verbose) printf(" Scaling B <- B*Sigma^{-1}\n");
|
||
gsl_vector_complex *tmp = gsl_vector_complex_calloc(K);
|
||
for(int i = 0; i < K; i++) {
|
||
gsl_matrix_complex_get_col(tmp, B, i);
|
||
gsl_vector_complex_scale(tmp, gsl_complex_rect(1.0/gsl_vector_get(Sigma,i), 0));
|
||
gsl_matrix_complex_set_col(B,i,tmp);
|
||
}
|
||
gsl_vector_complex_free(tmp);
|
||
|
||
//for(int m=0; m<K; m++) // B <- B * Sigma^{-1}
|
||
|
||
// Beyn step 6.
|
||
// Eigenvalue decomposition B -> S*Lambda*S'
|
||
/* According to Beyn's paper (Algorithm 1), one should check conditioning
|
||
* of the eigenvalues; if they are ill-conditioned, one should perform
|
||
* a procedure involving Schur decomposition and reordering.
|
||
*
|
||
* Beyn refers to MATLAB routines eig, condeig, schur, ordschur.
|
||
* I am not sure about the equivalents in LAPACK, TODO check zgeevx, zgeesx.
|
||
*/
|
||
if(verbose) printf(" Eigensolving (%i,%i)\n",K,K);
|
||
|
||
gsl_vector_complex *Lambda = gsl_vector_complex_alloc(K); // eigenvalues
|
||
gsl_matrix_complex *S = gsl_matrix_complex_alloc(K,K); // eigenvectors
|
||
|
||
QPMS_ENSURE(Sigma->stride == 1, "Sigma vector stride must be 1 for LAPACKE_zgesdd, got %zd.", Sigma->stride);
|
||
QPMS_ENSURE(Lambda->stride == 1, "Lambda vector stride must be 1 for LAPACKE_zgesdd, got %zd.", Sigma->stride);
|
||
QPMS_ENSURE_SUCCESS(LAPACKE_zgeev(
|
||
LAPACK_ROW_MAJOR,
|
||
'N' /* jobvl; don't compute left eigenvectors */,
|
||
'V' /* jobvr; do compute right eigenvectors */,
|
||
K /* n */,
|
||
(lapack_complex_double *)(B->data) /* a */,
|
||
B->tda /* lda */,
|
||
(lapack_complex_double *) Lambda->data /* w */,
|
||
NULL /* vl */,
|
||
m /* ldvl, not used by for some reason needed */,
|
||
(lapack_complex_double *)(S->data)/* vr */,
|
||
S->tda/* ldvr */
|
||
));
|
||
|
||
gsl_matrix_complex_free(B);
|
||
|
||
// V0S <- V0*S
|
||
printf("Multiplying V0*S...\n");
|
||
gsl_matrix_complex *V0S = gsl_matrix_complex_alloc(m, K);
|
||
QPMS_ENSURE_SUCCESS(gsl_blas_zgemm(CblasNoTrans, CblasNoTrans,
|
||
one, V0, S, zero, V0S));
|
||
|
||
gsl_matrix_complex_free(V0);
|
||
|
||
// FIXME!!! make clear relation between KRetained and K in the results!
|
||
// (If they differ, there are possibly some spurious eigenvalues.)
|
||
int KRetained = 0;
|
||
gsl_matrix_complex *Mmat = gsl_matrix_complex_alloc(m, m);
|
||
gsl_vector_complex *MVk = gsl_vector_complex_alloc(m);
|
||
for (int k = 0; k < K; ++k) {
|
||
const gsl_complex zgsl = gsl_complex_add(gsl_complex_rect(creal(z0), cimag(z0)), gsl_vector_complex_get(Lambda, k));
|
||
const complex double z = GSL_REAL(zgsl) + I*GSL_IMAG(zgsl);
|
||
gsl_vector_complex_const_view Vk = gsl_matrix_complex_const_column(V0S, k);
|
||
|
||
double residual = 0;
|
||
if(res_tol > 0) {
|
||
QPMS_ENSURE_SUCCESS(M_function(Mmat, z, Params));
|
||
QPMS_ENSURE_SUCCESS(gsl_blas_zgemv(CblasNoTrans, one, Mmat, &(Vk.vector), zero, MVk));
|
||
residual = gsl_blas_dznrm2(MVk);
|
||
if (verbose) printf("Beyn: Residual(%i)=%e\n",k,residual);
|
||
}
|
||
if (res_tol > 0 && residual > res_tol) continue;
|
||
|
||
gsl_vector_complex_set(eigenvalues, KRetained, zgsl);
|
||
if(eigenvectors) {
|
||
gsl_matrix_complex_set_row(eigenvectors, KRetained, &(Vk.vector));
|
||
gsl_vector_set(solver->residuals, KRetained, residual);
|
||
}
|
||
++KRetained;
|
||
}
|
||
|
||
gsl_matrix_complex_free(V0S);
|
||
gsl_matrix_complex_free(Mmat);
|
||
gsl_vector_complex_free(MVk);
|
||
gsl_matrix_complex_free(S);
|
||
gsl_vector_complex_free(Lambda);
|
||
|
||
return KRetained;
|
||
}
|
||
|
||
|
||
beyn_result_gsl_t *beyn_solve_gsl(const size_t m, const size_t l,
|
||
beyn_function_M_gsl_t M_function, beyn_function_M_inv_Vhat_gsl_t M_inv_Vhat_function,
|
||
void *params, const beyn_contour_t *contour,
|
||
double rank_tol, size_t rank_sel_min, double res_tol)
|
||
{
|
||
BeynSolver *solver = BeynSolver_create(m, l);
|
||
|
||
gsl_matrix_complex *A0 = solver->A0;
|
||
gsl_matrix_complex *A1 = solver->A1;
|
||
gsl_matrix_complex *A0_coarse = solver->A0_coarse;
|
||
gsl_matrix_complex *A1_coarse = solver->A1_coarse;
|
||
gsl_matrix_complex *MInvVHat = solver->MInvVHat;
|
||
gsl_matrix_complex *VHat = solver->VHat;
|
||
|
||
/***************************************************************/
|
||
/* evaluate contour integrals by numerical quadrature to get */
|
||
/* A0 and A1 matrices */
|
||
/***************************************************************/
|
||
|
||
gsl_matrix_complex_set_zero(A0);
|
||
gsl_matrix_complex_set_zero(A1);
|
||
gsl_matrix_complex_set_zero(A0_coarse);
|
||
gsl_matrix_complex_set_zero(A1_coarse);
|
||
const size_t N = contour->n;
|
||
if(N & 1) QPMS_WARN("Contour discretisation point number is odd (%zd),"
|
||
" the error estimates might be a bit off.", N);
|
||
|
||
|
||
// Beyn Step 2: Computa A0, A1
|
||
const complex double z0 = contour->centre;
|
||
for(int n=0; n<N; n++) {
|
||
const complex double z = contour->z_dz[n][0];
|
||
const complex double dz = contour->z_dz[n][1];
|
||
|
||
gsl_matrix_complex_memcpy(MInvVHat, VHat);
|
||
|
||
if(M_inv_Vhat_function) {
|
||
QPMS_ENSURE_SUCCESS(M_inv_Vhat_function(MInvVHat, VHat, z, params));
|
||
} else {
|
||
lapack_int *pivot;
|
||
gsl_matrix_complex *Mmat = gsl_matrix_complex_alloc(m,m);
|
||
QPMS_ENSURE_SUCCESS(M_function(Mmat, z, params));
|
||
QPMS_CRASHING_MALLOC(pivot, sizeof(lapack_int) * m);
|
||
QPMS_ENSURE_SUCCESS(LAPACKE_zgetrf(LAPACK_ROW_MAJOR,
|
||
m /*m*/, m /*n*/,(lapack_complex_double *) Mmat->data /*a*/, Mmat->tda /*lda*/, pivot /*ipiv*/));
|
||
QPMS_ENSURE(MInvVHat->tda == l, "wut?");
|
||
QPMS_ENSURE_SUCCESS(LAPACKE_zgetrs(LAPACK_ROW_MAJOR, 'N' /*trans*/,
|
||
m /*n*/, l/*nrhs*/, (lapack_complex_double *)(Mmat->data) /*a*/, Mmat->tda /*lda*/, pivot/*ipiv*/,
|
||
(lapack_complex_double *)(MInvVHat->data) /*b*/, MInvVHat->tda/*ldb*/));
|
||
|
||
free(pivot);
|
||
gsl_matrix_complex_free(Mmat);
|
||
}
|
||
|
||
gsl_matrix_complex_scale(MInvVHat, cs2g(dz));
|
||
gsl_matrix_complex_add(A0, MInvVHat);
|
||
if((n%2)==0) {
|
||
gsl_matrix_complex_add(A0_coarse, MInvVHat);
|
||
gsl_matrix_complex_add(A0_coarse, MInvVHat);
|
||
}
|
||
|
||
gsl_matrix_complex_scale(MInvVHat, cs2g(z - z0)); // A_1 scaling as in Beyn's Remark 3.2(b) for numerical stability.
|
||
gsl_matrix_complex_add(A1, MInvVHat);
|
||
if((n%2)==0) {
|
||
gsl_matrix_complex_add(A1_coarse, MInvVHat);
|
||
gsl_matrix_complex_add(A1_coarse, MInvVHat);
|
||
}
|
||
}
|
||
|
||
gsl_vector_complex *eigenvalues = solver->eigenvalues;
|
||
gsl_vector_complex *eigenvalue_errors = solver->eigenvalue_errors;
|
||
gsl_matrix_complex *eigenvectors = solver->eigenvectors;
|
||
|
||
// Repeat Steps 3–6 with rougher contour approximation to get an error estimate.
|
||
int K_coarse = beyn_process_matrices(solver, M_function, params, A0_coarse, A1_coarse, z0, eigenvalue_errors, /*eigenvectors_coarse*/ NULL, rank_tol, rank_sel_min, res_tol);
|
||
// Reid did also fabs on the complex and real parts ^^^.
|
||
|
||
// Beyn Steps 3–6
|
||
int K = beyn_process_matrices(solver, M_function, params, A0, A1, z0, eigenvalues, eigenvectors, rank_tol, rank_sel_min, res_tol);
|
||
gsl_blas_zaxpy(gsl_complex_rect(-1,0), eigenvalues, eigenvalue_errors);
|
||
|
||
beyn_result_gsl_t *result;
|
||
QPMS_CRASHING_MALLOC(result, sizeof(beyn_result_gsl_t));
|
||
result->eigval = solver->eigenvalues;
|
||
result->eigval_err = solver->eigenvalue_errors;
|
||
result->residuals = solver->residuals;
|
||
result->eigvec = solver->eigenvectors;
|
||
result->ranktest_SV = solver->Sigma;
|
||
result->neig = K;
|
||
|
||
BeynSolver_free_partial(solver);
|
||
|
||
return result;
|
||
}
|
||
|
||
// Wrapper of pure C array M-matrix function to GSL.
|
||
|
||
struct beyn_function_M_carr2gsl_param {
|
||
beyn_function_M_t M_function;
|
||
beyn_function_M_inv_Vhat_t M_inv_Vhat_function;
|
||
void *param;
|
||
};
|
||
|
||
// GSL-flavoured adapter: evaluates the wrapped plain-array M function
// directly into the data buffer of target_M.
// params must point to a struct beyn_function_M_carr2gsl_param.
// Returns whatever the wrapped function returns.
static int beyn_function_M_carr2gsl(gsl_matrix_complex *target_M, complex double z, void *params)
{
  struct beyn_function_M_carr2gsl_param *wrapped = params;
  // These could rather be asserts.
  QPMS_ENSURE(target_M->size2 == target_M->tda, "Target GSL matrix is not a C-contiguous array. This is a bug, please report!");
  QPMS_ENSURE(target_M->size1 == target_M->size2, "Target is not a square matrix. This is a bug, please report!");
  complex double *const buffer = (complex double *) target_M->data;
  const size_t dim = target_M->size1;
  return wrapped->M_function(buffer, dim, z, wrapped->param);
}
|
||
|
||
// GSL-flavoured adapter: lets the wrapped plain-array function compute
// M(z)^-1 * Vhat directly into the data buffer of target.
// params must point to a struct beyn_function_M_carr2gsl_param.
// Both matrices must be C-contiguous and of the same shape, since the wrapped
// function only receives one pair of dimensions for both buffers.
// Returns whatever the wrapped function returns.
static int beyn_function_M_inv_Vhat_carr2gsl(gsl_matrix_complex *target,
    const gsl_matrix_complex *Vhat, complex double z, void *params)
{
  QPMS_UNTESTED;
  struct beyn_function_M_carr2gsl_param *p = params;
  // These could rather be asserts.
  QPMS_ENSURE(target->size2 == target->tda, "Target GSL matrix is not a C-contiguous array. This is a bug, please report!");
  QPMS_ENSURE(Vhat->size2 == Vhat->tda, "Source GSL matrix is not a C-contiguous array. This is a bug, please report!");
  QPMS_ENSURE(Vhat->size1 == target->size1 && Vhat->size2 == target->size2,
      "Source and target GSL matrices have different shapes. This is a bug, please report!");
  return p->M_inv_Vhat_function((complex double *) target->data, target->size1, target->size2,
      (complex double *) Vhat->data, z, p->param);
}
|
||
|
||
// Plain C array front end of the solver: wraps the array-based callbacks
// into GSL-flavoured ones, runs beyn_solve_gsl() and converts the result.
// M_inv_Vhat may be NULL, in which case no inverse callback is forwarded.
beyn_result_t *beyn_solve(size_t m, size_t l, beyn_function_M_t M, beyn_function_M_inv_Vhat_t M_inv_Vhat,
    void *params, const beyn_contour_t *contour, double rank_tol, size_t rank_sel_min, double res_tol) {
  struct beyn_function_M_carr2gsl_param p = {M, M_inv_Vhat, params};

  beyn_function_M_inv_Vhat_gsl_t inv_adapter = NULL;
  if(p.M_inv_Vhat_function)
    inv_adapter = beyn_function_M_inv_Vhat_carr2gsl;

  beyn_result_gsl_t *gsl_result = beyn_solve_gsl(m, l, beyn_function_M_carr2gsl,
      inv_adapter, (void *) &p, contour, rank_tol, rank_sel_min, res_tol);
  return beyn_result_from_beyn_result_gsl(gsl_result);
}
|
||
|
||
// Wraps a GSL-flavoured result into a plain-array one. No data are copied:
// the returned struct keeps g and exposes raw pointers into its vectors and
// matrices, so g must stay alive as long as the returned result is used.
beyn_result_t *beyn_result_from_beyn_result_gsl(beyn_result_gsl_t *g) {
  struct beyn_result_t *wrapped;
  QPMS_CRASHING_MALLOC(wrapped, sizeof(beyn_result_t));
  wrapped->gsl = g;
  wrapped->neig = g->neig;
  // Eigenvector length is taken from the row length of eigvec.
  wrapped->vlen = g->eigvec->size2;
  wrapped->eigval = (complex double *) g->eigval->data;
  wrapped->eigval_err = (complex double *) g->eigval_err->data;
  wrapped->residuals = g->residuals->data;
  wrapped->eigvec = (complex double *) g->eigvec->data;
  wrapped->ranktest_SV = g->ranktest_SV->data;
  return wrapped;
}
|
||
|
||
// Releases a plain-array result together with the GSL result it wraps.
// Passing NULL is a no-op.
void beyn_result_free(beyn_result_t *result) {
  if(!result)
    return;
  beyn_result_gsl_free(result->gsl);
  free(result);
}
|
||
|