qpms/qpms/ewald.c

#include "ewald.h"
#include <stdlib.h>
#include "indexing.h"
#include "kahansum.h"
#include <assert.h>
#include <string.h>
#include <complex.h>
#include "tiny_inlines.h"
#include <gsl/gsl_integration.h>
#include <gsl/gsl_errno.h>
#include <gsl/gsl_sf_legendre.h>

// parameters for the quadrature of integral in (4.6)
#ifndef INTEGRATION_WORKSPACE_LIMIT
#define INTEGRATION_WORKSPACE_LIMIT 30000
#endif

#ifndef INTEGRATION_EPSABS
#define INTEGRATION_EPSABS 1e-13
#endif

#ifndef INTEGRATION_EPSREL
#define INTEGRATION_EPSREL 1e-13
#endif

#ifndef M_SQRTPI
#define M_SQRTPI 1.7724538509055160272981674833411452
#endif


// sloppy implementation of factorial
static inline double factorial(const int n) {
  assert(n >= 0);
  if (n < 0)
    return 0; // should not happen in the functions below. (Therefore the assert above)
  else if (n <= 20) {
    double fac = 1;
    for (int i = 1; i <= n; ++i)
      fac *= i;
    return fac;
  }
  else 
    return tgamma(n + 1); // hope it's precise and that overflow does not happen
}

static inline complex double csq(complex double x) { return x * x; }
static inline double sq(double x) { return x * x; }


typedef enum {
  EWALD32_CONSTANTS_ORIG, // As in [1, (4,5)], NOT USED right now.
  EWALD32_CONSTANTS_AGNOSTIC /* Not depending on the spherical harmonic sign/normalisation
                              * convention – the $e^{im\alpha_pq}$ term in [1,(4.5)] being
                              * replaced by the respective $Y_n^m(\pi/2,\alpha)$ 
                              * spherical harmonic. See notes/ewald.lyx.
                              */

} ewald32_constants_option;

static const ewald32_constants_option type = EWALD32_CONSTANTS_AGNOSTIC;

qpms_ewald32_constants_t *qpms_ewald32_constants_init(const qpms_l_t lMax /*, const ewald32_constants_option type */,
    const int csphase)
{
  qpms_ewald32_constants_t *c = malloc(sizeof(qpms_ewald32_constants_t));
  //if (c == NULL) return NULL; // Do I really want to do this?
  c->lMax = lMax;
  c->nelem_sc = qpms_lMax2nelem_sc(lMax);
  c->s1_jMaxes = malloc(c->nelem_sc * sizeof(qpms_l_t));
  c->s1_constfacs = malloc(c->nelem_sc * sizeof(complex double *));
  //if (c->s1_jMaxes == NULL) return NULL;

  //determine sizes
  size_t s1_constfacs_sz = 0;
  for (qpms_y_t y = 0; y < c->nelem_sc; ++y) {
    qpms_l_t n; qpms_m_t m; qpms_y2mn_sc_p(y, &m, &n);
    if ((m + n) % 2 == 0) 
      s1_constfacs_sz += 1 + (c->s1_jMaxes[y] = (n-abs(m))/2);
    else
      c->s1_jMaxes[y] = -1;
  }

  c->s1_constfacs_base = malloc(s1_constfacs_sz * sizeof(complex double));
  size_t s1_constfacs_sz_cumsum = 0;
  for (qpms_y_t y = 0; y < c->nelem_sc; ++y) {
    qpms_l_t n; qpms_m_t m; qpms_y2mn_sc_p(y, &m, &n);
    if ((m + n) % 2 == 0) {
      c->s1_constfacs[y] = c->s1_constfacs_base + s1_constfacs_sz_cumsum;
      // and here comes the actual calculation
      for (qpms_l_t j = 0; j <= c->s1_jMaxes[y]; ++j){
        switch(type) {
          case EWALD32_CONSTANTS_ORIG: // NOT USED
            c->s1_constfacs[y][j] = -0.5 * ipow(n+1) * min1pow((n+m)/2) 
              * sqrt((2*n + 1) * factorial(n-m) * factorial(n+m))
              * min1pow(j) * pow(0.5, n-2*j)
              / (factorial(j) * factorial((n-m)/2-j) * factorial((n+m)/2-j))
              * pow(0.5, 2*j-1);
            break;
          case EWALD32_CONSTANTS_AGNOSTIC:
            c->s1_constfacs[y][j] = -2 * ipow(n+1) * M_SQRTPI  
              * factorial((n-m)/2) * factorial((n+m)/2)
              * min1pow(j) 
              / (factorial(j) * factorial((n-m)/2-j) * factorial((n+m)/2-j));
            break;
          default:
            abort();
        }
      }
      s1_constfacs_sz_cumsum += 1 + c->s1_jMaxes[y];
    }
    else
      c->s1_constfacs[y] = NULL;
  }

  c->legendre_csphase = csphase;
  c->legendre0 = malloc(gsl_sf_legendre_array_n(lMax) * sizeof(double));
  // N.B. here I use the GSL_SF_LEGENRE_NONE, in order to be consistent with translations.c
  c->legendre_normconv = GSL_SF_LEGENDRE_NONE;
  // Moreover, using this approach (i.e. gsl) takes about 64kB extra memory
  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, 0, csphase, c->legendre0))
    abort();
  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, +1, csphase, c->legendre_plus1))
    abort();
  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, -1, csphase, c->legendre_minus1))
    abort();
  return c;
}

void qpms_ewald32_constants_free(qpms_ewald32_constants_t *c) {
  free(c->legendre0);
  free(c->s1_constfacs);
  free(c->s1_constfacs_base);
  free(c->s1_jMaxes);
  free(c);
}


int ewald3_sigma0(complex double *result, double *err,
    const qpms_ewald32_constants_t *c,
    const double eta, const double k)
{
  qpms_csf_result gam;
  int retval = complex_gamma_inc_e(-0.5, -sq(k/(2*eta)), &gam);
  gam.val = conj(gam.val); // We take the other branch, cf. [Linton, p. 642 in the middle]
  if (0 != retval)
    abort();
  *result = gam.val * c->legendre0[gsl_sf_legendre_array_index(0,0)] / 2 / M_SQRTPI;
  if(err) 
    *err = gam.err * fabs(c->legendre0[gsl_sf_legendre_array_index(0,0)] / 2 / M_SQRTPI);
  return 0;
}

int ewald32_sigma0(complex double *result, double *err,
    const qpms_ewald32_constants_t *c,
    const double eta, const double k)
{
  return ewald3_sigma0(result, err, c, eta, k);
}


int ewald32_sigma_long_shiftedpoints (
    complex double *target, // must be c->nelem_sc long
    double *err,
    const qpms_ewald32_constants_t *c,
    const double eta, const double k, const double unitcell_area,
    const size_t npoints, const point2d *Kpoints_plus_beta,
    const point2d beta, // not needed
    const point2d particle_shift // target - src
    ) 
{
  const qpms_y_t nelem_sc = c->nelem_sc;
  const qpms_l_t lMax = c->lMax;
  
  // Manual init of the ewald summation targets
  complex double *target_c = calloc(nelem_sc, sizeof(complex double));
  memset(target, 0, nelem_sc * sizeof(complex double));
  double *err_c = NULL;
  if (err) {
    err_c = calloc(nelem_sc, sizeof(double));
    memset(err, 0, nelem_sc * sizeof(double));
  }

  const double commonfac = 1/(k*k*unitcell_area); // used in the very end (CFC)
  assert(commonfac > 0);

  // space for Gamma_pq[j]'s
  qpms_csf_result Gamma_pq[lMax/2+1];

  // CHOOSE POINT BEGIN
  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
    const point2d beta_pq = Kpoints_plus_beta[i];
    const point2d K_pq = {beta_pq.x - beta.x, beta_pq.y - beta.y};
    const double rbeta_pq = cart2norm(beta_pq);
  // CHOOSE POINT END

    const complex double phasefac = cexp(I*cart2_dot(K_pq,particle_shift)); // POINT-DEPENDENT (PFC) // !!!CHECKSIGN!!!
    const double arg_pq = atan2(beta_pq.y, beta_pq.x); // POINT-DEPENDENT

    // R-DEPENDENT BEGIN
    const complex double gamma_pq = lilgamma(rbeta_pq/k);
    const complex double z = csq(gamma_pq*k/(2*eta)); // Když o tom tak přemýšlím, tak tohle je vlastně vždy reálné
    for(qpms_l_t j = 0; j <= lMax/2; ++j) {
      int retval = complex_gamma_inc_e(0.5-j, z, Gamma_pq+j);
      // we take the other branch, cf. [Linton, p. 642 in the middle]: FIXME instead use the C11 CMPLX macros and fill in -O*I part to z in the line above
      if(creal(z) < 0) 
        Gamma_pq[j].val = conj(Gamma_pq[j].val); //FIXME as noted above
      if(!(retval==0 ||retval==GSL_EUNDRFLW)) abort();
    }
    // R-DEPENDENT END
    
    // TODO optimisations: all the j-dependent powers can be done for each j only once, stored in array
    // and just fetched for each n, m pair
    for(qpms_l_t n = 0; n <= lMax; ++n)
      for(qpms_m_t m = -n; m <= n; ++m) {
        if((m+n) % 2 != 0) // odd coefficients are zero.
          continue;
        const qpms_y_t y = qpms_mn2y_sc(m, n);
        const complex double e_imalpha_pq = cexp(I*m*arg_pq);
        complex double jsum, jsum_c; ckahaninit(&jsum, &jsum_c);
        double jsum_err, jsum_err_c; kahaninit(&jsum_err, &jsum_err_c); // TODO do I really need to kahan sum errors?
        assert((n-abs(m))/2 == c->s1_jMaxes[y]);
        for(qpms_l_t j = 0; j <= c->s1_jMaxes[y]/*(n-abs(m))/2*/; ++j) { // FIXME </<= ?
          complex double summand = pow(rbeta_pq/k, n-2*j) 
            * e_imalpha_pq  * c->legendre0[gsl_sf_legendre_array_index(n,abs(m))] * min1pow_m_neg(m) // This line can actually go outside j-loop
            * cpow(gamma_pq, 2*j-1) // * Gamma_pq[j] bellow (GGG) after error computation
            * c->s1_constfacs[y][j];
          if(err) {
            // FIXME include also other errors than Gamma_pq's relative error
             kahanadd(&jsum_err, &jsum_err_c, Gamma_pq[j].err * cabs(summand));
          }
          summand *= Gamma_pq[j].val; // GGG
          ckahanadd(&jsum, &jsum_c, summand);
        }
        jsum *= phasefac; // PFC
        ckahanadd(target + y, target_c + y, jsum);
        if(err) kahanadd(err + y, err_c + y, jsum_err);
      }
  } // END POINT LOOP
 
  free(err_c);
  free(target_c);
  for(qpms_y_t y = 0; y < nelem_sc; ++y) // CFC common factor from above
    target[y] *= commonfac;
  if(err)
    for(qpms_y_t y = 0; y < nelem_sc; ++y)
      err[y] *= commonfac;
  return 0;
}

int ewald32_sigma_long_points_and_shift (
    complex double *target, // must be c->nelem_sc long
    double *err,
    const qpms_ewald32_constants_t *c,
    const double eta, const double k, const double unitcell_area,
    const size_t npoints, const point2d *Kpoints,
    const point2d beta, 
    const point2d particle_shift // target - src
    ) 
{
  const qpms_y_t nelem_sc = c->nelem_sc;
  const qpms_l_t lMax = c->lMax;
  
  // Manual init of the ewald summation targets
  complex double *target_c = calloc(nelem_sc, sizeof(complex double));
  memset(target, 0, nelem_sc * sizeof(complex double));
  double *err_c = NULL;
  if (err) {
    err_c = calloc(nelem_sc, sizeof(double));
    memset(err, 0, nelem_sc * sizeof(double));
  }

  const double commonfac = 1/(k*k*unitcell_area); // used in the very end (CFC)
  assert(commonfac > 0);

  // space for Gamma_pq[j]'s
  qpms_csf_result Gamma_pq[lMax/2+1];

  // CHOOSE POINT BEGIN
  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
    // Only these following two lines differ from ewald32_sigma_long_points_and_shift()!!!  WTFCOMMENT?!
    const point2d K_pq = Kpoints[i]; 
    const point2d beta_pq = {K_pq.x + beta.x, K_pq.y + beta.y};
    const double rbeta_pq = cart2norm(beta_pq);
  // CHOOSE POINT END

    const complex double phasefac = cexp(I*cart2_dot(K_pq,particle_shift)); // POINT-DEPENDENT (PFC) // !!!CHECKSIGN!!!
    const double arg_pq = atan2(beta_pq.y, beta_pq.x); // POINT-DEPENDENT

    // R-DEPENDENT BEGIN
    const complex double gamma_pq = lilgamma(rbeta_pq/k);
    const complex double z = csq(gamma_pq*k/(2*eta)); // Když o tom tak přemýšlím, tak tohle je vlastně vždy reálné
    for(qpms_l_t j = 0; j <= lMax/2; ++j) {
      int retval = complex_gamma_inc_e(0.5-j, z, Gamma_pq+j);
      // we take the other branch, cf. [Linton, p. 642 in the middle]: FIXME instead use the C11 CMPLX macros and fill in -O*I part to z in the line above
      if(creal(z) < 0) 
        Gamma_pq[j].val = conj(Gamma_pq[j].val); //FIXME as noted above
      if(!(retval==0 ||retval==GSL_EUNDRFLW)) abort();
    }
    // R-DEPENDENT END
    
    // TODO optimisations: all the j-dependent powers can be done for each j only once, stored in array
    // and just fetched for each n, m pair
    for(qpms_l_t n = 0; n <= lMax; ++n)
      for(qpms_m_t m = -n; m <= n; ++m) {
        if((m+n) % 2 != 0) // odd coefficients are zero.
          continue;
        const qpms_y_t y = qpms_mn2y_sc(m, n);
        const complex double e_imalpha_pq = cexp(I*m*arg_pq);
        complex double jsum, jsum_c; ckahaninit(&jsum, &jsum_c);
        double jsum_err, jsum_err_c; kahaninit(&jsum_err, &jsum_err_c); // TODO do I really need to kahan sum errors?
        assert((n-abs(m))/2 == c->s1_jMaxes[y]);
        for(qpms_l_t j = 0; j <= c->s1_jMaxes[y]/*(n-abs(m))/2*/; ++j) { // FIXME </<= ?
          complex double summand = pow(rbeta_pq/k, n-2*j) 
            * e_imalpha_pq  * c->legendre0[gsl_sf_legendre_array_index(n,abs(m))] * min1pow_m_neg(m) // This line can actually go outside j-loop
            * cpow(gamma_pq, 2*j-1) // * Gamma_pq[j] bellow (GGG) after error computation
            * c->s1_constfacs[y][j];
          if(err) {
            // FIXME include also other errors than Gamma_pq's relative error
             kahanadd(&jsum_err, &jsum_err_c, Gamma_pq[j].err * cabs(summand));
          }
          summand *= Gamma_pq[j].val; // GGG
          ckahanadd(&jsum, &jsum_c, summand);
        }
        jsum *= phasefac; // PFC
        ckahanadd(target + y, target_c + y, jsum);
        if(err) kahanadd(err + y, err_c + y, jsum_err);
      }
  } // END POINT LOOP
 
  free(err_c);
  free(target_c);
  for(qpms_y_t y = 0; y < nelem_sc; ++y) // CFC common factor from above
    target[y] *= commonfac;
  if(err)
    for(qpms_y_t y = 0; y < nelem_sc; ++y)
      err[y] *= commonfac;
  return 0;
}


struct sigma2_integrand_params {
  int n;
  double k, R;
};

static double sigma2_integrand(double ksi, void *params) {
  struct sigma2_integrand_params *p = (struct sigma2_integrand_params *) params;
  return exp(-sq(p->R * ksi) + sq(p->k / ksi / 2)) * pow(ksi, 2*p->n);
}

static int ewald32_sr_integral(double r, double k, int n, double eta,
    double *result, double *err, gsl_integration_workspace *workspace)
{
  struct sigma2_integrand_params p;


  const double R0 = r; // Maybe could be chosen otherwise, but fuck it for now.
  p.n = n;
  eta *= R0;
  p.k = k * R0;
  p.R = r / R0;  // i.e. p.R = 1

  gsl_function F;
  F.function = sigma2_integrand;
  F.params = &p;

  int retval = gsl_integration_qagiu(&F, eta, INTEGRATION_EPSABS, 
      INTEGRATION_EPSREL, INTEGRATION_WORKSPACE_LIMIT,
      workspace, result, err);
  double normfac = pow(R0, -2*p.n - 1);
  *result *= normfac;
  *err *= normfac;
  return retval;
}

int ewald32_sigma_short_shiftedpoints(
    complex double *target, // must be c->nelem_sc long
    double *err,
    const qpms_ewald32_constants_t *c, // N.B. not too useful here
    const double eta, const double k,
    const size_t npoints, const point2d *Rpoints_plus_particle_shift,
    const point2d beta,
    const point2d particle_shift           // used only in the very end to multiply it by the phase
    )
{
  const qpms_y_t nelem_sc = c->nelem_sc;
  const qpms_l_t lMax = c->lMax;
  gsl_integration_workspace *workspace = 
    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);
  
  // Manual init of the ewald summation targets
  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
  memset(target, 0, nelem_sc * sizeof(complex double));
  double *err_c = NULL;
  if (err) {
    err_c = calloc(nelem_sc, sizeof(double));
    memset(err, 0, nelem_sc * sizeof(double));
  }
  

// CHOOSE POINT BEGIN
  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
    const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
    const double r_pq_shifted = cart2norm(Rpq_shifted);
// CHOOSE POINT END

    const double Rpq_shifted_arg = atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
    const complex double e_beta_Rpq = cexp(I*cart2_dot(beta, Rpq_shifted)); // POINT-DEPENDENT
    
    for(qpms_l_t n = 0; n <= lMax; ++n) {
      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // TODO put outside the R-loop and multiply in the end
      const double R_pq_pown = pow(r_pq_shifted, n);
      // TODO the integral here
      double intres, interr;
      int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
          &intres, &interr, workspace);
      if (retval) abort();
      for (qpms_m_t m = -n; m <= n; ++m){
        if((m+n) % 2 != 0) // odd coefficients are zero.
          continue; // nothing needed, already done by memset
        const complex double e_imf = cexp(I*m*Rpq_shifted_arg);
        const double leg = c->legendre0[gsl_sf_legendre_array_index(n, abs(m))];
        const qpms_y_t y = qpms_mn2y_sc(m,n);
        if(err)
          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
              * interr)); // TODO include also other errors
        ckahanadd(target + y, target_c + y,
            prefacn * R_pq_pown * leg * intres * e_beta_Rpq * e_imf * min1pow_m_neg(m));
      }

    }
  }

  gsl_integration_workspace_free(workspace);
  if(err) free(err_c);
  free(target_c);
  return 0;
}

int ewald32_sigma_short_points_and_shift(
    complex double *target, // must be c->nelem_sc long
    double *err,
    const qpms_ewald32_constants_t *c, // N.B. not too useful here
    const double eta, const double k,
    const size_t npoints, const point2d *Rpoints,
    const point2d beta,
    const point2d particle_shift           // used only in the very end to multiply it by the phase
    )
{
  const qpms_y_t nelem_sc = c->nelem_sc;
  const qpms_l_t lMax = c->lMax;
  gsl_integration_workspace *workspace = 
    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);
  
  // Manual init of the ewald summation targets
  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
  memset(target, 0, nelem_sc * sizeof(complex double));
  double *err_c = NULL;
  if (err) {
    err_c = calloc(nelem_sc, sizeof(double));
    memset(err, 0, nelem_sc * sizeof(double));
  }
  

// CHOOSE POINT BEGIN
  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
    //const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
    const point2d Rpq_shifted = cart2_add(Rpoints[i], cart2_scale(-1,particle_shift)); // CHECKSIGN!!!!
    const double r_pq_shifted = cart2norm(Rpq_shifted);
// CHOOSE POINT END

    const double Rpq_shifted_arg = atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
    const complex double e_beta_Rpq = cexp(I*cart2_dot(beta, Rpq_shifted)); // POINT-DEPENDENT
    
    for(qpms_l_t n = 0; n <= lMax; ++n) {
      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // TODO put outside the R-loop and multiply in the end
      const double R_pq_pown = pow(r_pq_shifted, n);
      // TODO the integral here
      double intres, interr;
      int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
          &intres, &interr, workspace);
      if (retval) abort();
      for (qpms_m_t m = -n; m <= n; ++m){
        if((m+n) % 2 != 0) // odd coefficients are zero.
          continue; // nothing needed, already done by memset
        const complex double e_imf = cexp(I*m*Rpq_shifted_arg);
        const double leg = c->legendre0[gsl_sf_legendre_array_index(n, abs(m))];
        const qpms_y_t y = qpms_mn2y_sc(m,n);
        if(err)
          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
              * interr)); // TODO include also other errors
        ckahanadd(target + y, target_c + y,
            prefacn * R_pq_pown * leg * intres * e_beta_Rpq * e_imf * min1pow_m_neg(m));
      }

    }
  }

  gsl_integration_workspace_free(workspace);
  if(err) free(err_c);
  free(target_c);
  return 0;
}

int ewald3_sigma_short( 
                complex double *target, // must be c->nelem_sc long
                double *err, // must be c->nelem_sc long or NULL
                const qpms_ewald32_constants_t *c,
                const double eta, const double k,
                const LatticeDimensionality latdim, // apart from asserts and possible optimisations ignored, as the SR formula stays the same
                PGenSph *pgen_R, const bool pgen_generates_shifted_points
                /* If false, the behaviour corresponds to the old ewald32_sigma_short_points_and_shift,
                 * so the function assumes that the generated points correspond to the unshifted Bravais lattice,
                 * and adds particle_shift to the generated points before calculations.
                 * If true, it assumes that they are already shifted (if calculating interaction between
                 * different particles in the unit cell).
                 */,
                const cart3_t beta,
                const cart3_t particle_shift
                )
{
  const qpms_y_t nelem_sc = c->nelem_sc;
  const qpms_l_t lMax = c->lMax;
  gsl_integration_workspace *workspace = 
    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);

  double legendre_buf[gsl_sf_legendre_array_n(c->lMax)]; // work space for the legendre polynomials (used only in the general case)
  
  // Manual init of the ewald summation targets
  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
  memset(target, 0, nelem_sc * sizeof(complex double));
  double *err_c = NULL;
  if (err) {
    err_c = calloc(nelem_sc, sizeof(double));
    memset(err, 0, nelem_sc * sizeof(double));
  }
  

  PGenSphReturnData pgen_retdata;
#ifndef NDEBUG
  double r_pq_shifted_prev;
#endif
  // recyclable variables if r_pq_shifted stays the same:
  double intres[lMax+1], interr[lMax+1];

// CHOOSE POINT BEGIN
  while ((pgen_retdata = PGenSph_next(pgen_R)).flags & PGEN_NOTDONE) { // BEGIN POINT LOOP
// CHOOSE POINT END
    cart3_t Rpq_shifted_cart; // I will need both sph and cart representations anyway...
    sph_t Rpq_shifted_sph;
    if (pgen_generates_shifted_points) {
      Rpq_shifted_sph = pgen_retdata.point_sph;
      Rpq_shifted_cart = sph2cart(Rpq_shifted_sph);
    } else { // as in the old _points_and_shift functions
      //const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
      const sph_t bravais_point_sph = pgen_retdata.point_sph;
      const cart3_t bravais_point_cart = sph2cart(bravais_point_sph);
      Rpq_shifted_cart = cart3_add(bravais_point_cart, cart3_scale(-1, particle_shift)); // CHECKSIGN!!!
      Rpq_shifted_sph = cart2sph(Rpq_shifted_cart);
    }

    // TODO eliminate and use the Rpq_shifted_sph members directly (but in compiler optimizations we trust)
    const double Rpq_shifted_arg = Rpq_shifted_sph.phi; //atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
    const double Rpq_shifted_theta = Rpq_shifted_sph.theta; // POINT-DEPENDENT
    const double r_pq_shifted = Rpq_shifted_sph.r;

    // if the radius is the same as in previous cycle, most of the calculations can be recycled
    const bool new_r_pq_shifted = (!pgen_generates_shifted_points) || (pgen_retdata.flags & PGEN_NEWR);
    if (!new_r_pq_shifted) assert(r_pq_shifted_prev == r_pq_shifted);

    const complex double e_beta_Rpq = cexp(I*cart3_dot(beta, Rpq_shifted_cart)); // POINT-DEPENDENT
    LatticeDimensionality speedup_regime = 0;
    if ((latdim & LAT_2D_IN_3D_XYONLY) == LAT_2D_IN_3D_XYONLY) speedup_regime = LAT_2D_IN_3D_XYONLY;
    if ((latdim & LAT_1D_IN_3D_ZONLY)  == LAT_1D_IN_3D_ZONLY)  speedup_regime = LAT_1D_IN_3D_ZONLY;

    const double * legendre_array;

    switch(speedup_regime) {
      // speedup checks for special geometries and Legendre polynomials
      case LAT_1D_IN_3D_ZONLY:
        assert((pgen_retdata.flags & PGEN_AT_Z) == PGEN_AT_Z);
        assert(Rpq_shifted_theta == M_PI || Rpq_shifted_theta == 0);
        legendre_array = (Rpq_shifted_theta == 0) ? c->legendre_plus1 : c->legendre_minus1; // CHECKSIGN
        break;
      case LAT_2D_IN_3D_XYONLY:
        assert((pgen_retdata.flags &PGEN_AT_XY) == PGEN_AT_XY);
        assert(Rpq_shifted_theta == M_PI_2);
        legendre_array = c->legendre0;
        break;
      default:
        if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, cos(Rpq_shifted_theta), c->legendre_csphase, legendre_buf))
        abort();
        legendre_array = legendre_buf;
        break;
    }
    
    for(qpms_l_t n = 0; n <= lMax; ++n) {
      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // profiling TODO put outside the R-loop and multiply in the end?
      const double R_pq_pown = pow(r_pq_shifted, n); // profiling TODO: maybe put this into the new_r_pq_shifted condition as well?
      if (new_r_pq_shifted) {
        int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
            intres + n, interr + n, workspace);
        if (retval) abort();
      } // otherwise recycle the integrals
      for (qpms_m_t m = -n; m <= n; ++m){
        complex double e_imf;
        // SPEEDUPS for some special geometries
        if(speedup_regime == LAT_2D_IN_3D_XYONLY) { //2D lattice inside the xy plane
          if((m+n) % 2 != 0) // odd coefficients are zero.
            continue; // nothing needed, already done by memset
          e_imf = cexp(I*m*Rpq_shifted_arg); // profiling TODO: calculate outside the n-loop?
        } else if (speedup_regime == LAT_1D_IN_3D_ZONLY) { // 1D lattice along the z axis
          if (m != 0) // m-non-zero coefficients are zero
            continue; // nothing needed, already done by memset
          e_imf = 1;
        } else { // general 1D/2D/3D lattice in 3D space
          e_imf = cexp(I*m*Rpq_shifted_arg);
        }

        const double leg = legendre_array[gsl_sf_legendre_array_index(n, abs(m))];

        const qpms_y_t y = qpms_mn2y_sc(m,n);
        if(err)
          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
              * interr[n])); // TODO include also other errors
        ckahanadd(target + y, target_c + y,
            prefacn * R_pq_pown * leg * intres[n] * e_beta_Rpq * e_imf * min1pow_m_neg(m));
      }

    }
#ifndef NDEBUG
    r_pq_shifted_prev = r_pq_shifted;
#endif
  }

  gsl_integration_workspace_free(workspace);
  if(err) free(err_c);
  free(target_c);
  return 0;
}


#if 0

int ewald32_sigma_long_shiftedpoints_rordered(
    complex double *target_sigmalr_y, // must be c->nelem_sc long
    const qpms_ewald32_constants_t *c,
    double eta, double k, double unitcell_area,
    const points2d_rordered_t *Kpoints_plus_beta_rordered,
    point2d particle_shift
    );
int ewald32_sigma_short_points_rordered(
    complex double *target_sigmasr_y, // must be c->nelem_sc long
    const qpms_ewald32_constants_t *c, // N.B. not too useful here
    double eta, double k,
    const points2d_rordered_t *Rpoints_plus_particle_shift_rordered,
    point2d particle_shift    // used only in the very end to multiply it by the phase
    );

#endif
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								#include "ewald.h"
 								#include <stdlib.h>
 								#include "indexing.h"
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								#include "kahansum.h"
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								#include <assert.h>
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								#include <string.h>
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
+								#include <complex.h>
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								#include "tiny_inlines.h"
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								#include <gsl/gsl_integration.h>
 								#include <gsl/gsl_errno.h>
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
+								#include <gsl/gsl_sf_legendre.h>
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
 								// parameters for the quadrature of integral in (4.6)
 								#ifndef INTEGRATION_WORKSPACE_LIMIT
 								#define INTEGRATION_WORKSPACE_LIMIT 30000
 								#endif
 								#ifndef INTEGRATION_EPSABS
-												More test params etc. (still wrong results)


Former-commit-id: 589f4a643ac318f384554b83318355289fdf827d
											
										
										
											2018-09-05 22:45:28 +03:00
+								#define INTEGRATION_EPSABS 1e-13
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								#endif
 								#ifndef INTEGRATION_EPSREL
 								#define INTEGRATION_EPSREL 1e-13
 								#endif
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								#ifndef M_SQRTPI
 								#define M_SQRTPI 1.7724538509055160272981674833411452
 								#endif
-												Sigma0 ready, it's time for writing some tests.


Former-commit-id: 956254dcd4c337374d945465ff228fc40595fc3e
											
										
										
											2018-09-05 14:09:22 +03:00
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								// sloppy implementation of factorial
 								static inline double factorial(const int n) {
 								  assert(n >= 0);
 								  if (n < 0)
 								    return 0; // should not happen in the functions below. (Therefore the assert above)
 								  else if (n <= 20) {
 								    double fac = 1;
 								    for (int i = 1; i <= n; ++i)
 								      fac *= i;
 								    return fac;
 								  }
 								  else
 								    return tgamma(n + 1); // hope it's precise and that overflow does not happen
 								}
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								static inline complex double csq(complex double x) { return x * x; }
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								static inline double sq(double x) { return x * x; }
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
 								typedef enum {
 								  EWALD32_CONSTANTS_ORIG, // As in [1, (4,5)], NOT USED right now.
 								  EWALD32_CONSTANTS_AGNOSTIC /* Not depending on the spherical harmonic sign/normalisation
 								                              * convention – the $e^{im\alpha_pq}$ term in [1,(4.5)] being
 								                              * replaced by the respective $Y_n^m(\pi/2,\alpha)$
 								                              * spherical harmonic. See notes/ewald.lyx.
 								                              */
 								} ewald32_constants_option;
 								static const ewald32_constants_option type = EWALD32_CONSTANTS_AGNOSTIC;
 								qpms_ewald32_constants_t *qpms_ewald32_constants_init(const qpms_l_t lMax /*, const ewald32_constants_option type */,
 								    const int csphase)
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								{
 								  qpms_ewald32_constants_t *c = malloc(sizeof(qpms_ewald32_constants_t));
 								  //if (c == NULL) return NULL; // Do I really want to do this?
 								  c->lMax = lMax;
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  c->nelem_sc = qpms_lMax2nelem_sc(lMax);
 								  c->s1_jMaxes = malloc(c->nelem_sc * sizeof(qpms_l_t));
 								  c->s1_constfacs = malloc(c->nelem_sc * sizeof(complex double *));
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								  //if (c->s1_jMaxes == NULL) return NULL;
 								  //determine sizes
 								  size_t s1_constfacs_sz = 0;
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  for (qpms_y_t y = 0; y < c->nelem_sc; ++y) {
 								    qpms_l_t n; qpms_m_t m; qpms_y2mn_sc_p(y, &m, &n);
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								    if ((m + n) % 2 == 0)
 								      s1_constfacs_sz += 1 + (c->s1_jMaxes[y] = (n-abs(m))/2);
 								    else
 								      c->s1_jMaxes[y] = -1;
 								  }
-												[ewald.c] Fix malloc size


Former-commit-id: a2da5e820d4835e1cf91ab308a63f0aedd431789
											
										
										
											2018-09-07 15:39:52 +03:00
+								  c->s1_constfacs_base = malloc(s1_constfacs_sz * sizeof(complex double));
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								  size_t s1_constfacs_sz_cumsum = 0;
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  for (qpms_y_t y = 0; y < c->nelem_sc; ++y) {
 								    qpms_l_t n; qpms_m_t m; qpms_y2mn_sc_p(y, &m, &n);
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								    if ((m + n) % 2 == 0) {
 								      c->s1_constfacs[y] = c->s1_constfacs_base + s1_constfacs_sz_cumsum;
 								      // and here comes the actual calculation
 								      for (qpms_l_t j = 0; j <= c->s1_jMaxes[y]; ++j){
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								        switch(type) {
 								          case EWALD32_CONSTANTS_ORIG: // NOT USED
 								            c->s1_constfacs[y][j] = -0.5 * ipow(n+1) * min1pow((n+m)/2)
 								              * sqrt((2*n + 1) * factorial(n-m) * factorial(n+m))
 								              * min1pow(j) * pow(0.5, n-2*j)
 								              / (factorial(j) * factorial((n-m)/2-j) * factorial((n+m)/2-j))
 								              * pow(0.5, 2*j-1);
 								            break;
 								          case EWALD32_CONSTANTS_AGNOSTIC:
-												[ewald.c] Fix malloc size


Former-commit-id: a2da5e820d4835e1cf91ab308a63f0aedd431789
											
										
										
											2018-09-07 15:39:52 +03:00
+								            c->s1_constfacs[y][j] = -2 * ipow(n+1) * M_SQRTPI
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								              * factorial((n-m)/2) * factorial((n+m)/2)
 								              * min1pow(j)
 								              / (factorial(j) * factorial((n-m)/2-j) * factorial((n+m)/2-j));
 								            break;
 								          default:
 								            abort();
 								        }
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								      }
 								      s1_constfacs_sz_cumsum += 1 + c->s1_jMaxes[y];
 								    }
 								    else
 								      c->s1_constfacs[y] = NULL;
 								  }
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								  c->legendre_csphase = csphase;
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
+								  c->legendre0 = malloc(gsl_sf_legendre_array_n(lMax) * sizeof(double));
 								  // N.B. here I use the GSL_SF_LEGENRE_NONE, in order to be consistent with translations.c
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								  c->legendre_normconv = GSL_SF_LEGENDRE_NONE;
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
+								  // Moreover, using this approach (i.e. gsl) takes about 64kB extra memory
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, 0, csphase, c->legendre0))
 								    abort();
 								  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, +1, csphase, c->legendre_plus1))
 								    abort();
 								  if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, -1, csphase, c->legendre_minus1))
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								    abort();
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								  return c;
 								}
 								void qpms_ewald32_constants_free(qpms_ewald32_constants_t *c) {
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								  free(c->legendre0);
-												Lattice sum constants fators


Former-commit-id: 0337b5e459ad57ca81c4c903f1bc4446ec7e5566
											
										
										
											2018-08-21 18:13:42 +03:00
+								  free(c->s1_constfacs);
 								  free(c->s1_constfacs_base);
 								  free(c->s1_jMaxes);
 								  free(c);
 								}
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								int ewald3_sigma0(complex double *result, double *err,
-												Sigma0 ready, it's time for writing some tests.


Former-commit-id: 956254dcd4c337374d945465ff228fc40595fc3e
											
										
										
											2018-09-05 14:09:22 +03:00
+								    const qpms_ewald32_constants_t *c,
 								    const double eta, const double k)
 								{
 								  qpms_csf_result gam;
-												Fix ewald32_sigma0()


Former-commit-id: 969764c516c0e0e8cc928e18447eb5327791d5bc
											
										
										
											2018-09-06 11:52:54 +03:00
+								  int retval = complex_gamma_inc_e(-0.5, -sq(k/(2*eta)), &gam);
-												Fix branch selection in long-range ewald sum.

Now everything is consistent except for sigma0


Former-commit-id: 86132a0db0604ed8c56f725eb95c5b22a103b804
											
										
										
											2018-09-13 01:16:13 +03:00
+								  gam.val = conj(gam.val); // We take the other branch, cf. [Linton, p. 642 in the middle]
-												Sigma0 ready, it's time for writing some tests.


Former-commit-id: 956254dcd4c337374d945465ff228fc40595fc3e
											
										
										
											2018-09-05 14:09:22 +03:00
+								  if (0 != retval)
 								    abort();
 								  *result = gam.val * c->legendre0[gsl_sf_legendre_array_index(0,0)] / 2 / M_SQRTPI;
 								  if(err)
-												Fix ewalds.c test output;  n.b. the current long-range parts.


Former-commit-id: f51675842d53a2ba0c6c2821180c11fe60445257
											
										
										
											2018-09-06 15:00:38 +03:00
+								    *err = gam.err * fabs(c->legendre0[gsl_sf_legendre_array_index(0,0)] / 2 / M_SQRTPI);
-												Sigma0 ready, it's time for writing some tests.


Former-commit-id: 956254dcd4c337374d945465ff228fc40595fc3e
											
										
										
											2018-09-05 14:09:22 +03:00
+								  return 0;
 								}
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								int ewald32_sigma0(complex double *result, double *err,
 								    const qpms_ewald32_constants_t *c,
 								    const double eta, const double k)
 								{
 								  return ewald3_sigma0(result, err, c, eta, k);
 								}
-												Sigma0 ready, it's time for writing some tests.


Former-commit-id: 956254dcd4c337374d945465ff228fc40595fc3e
											
										
										
											2018-09-05 14:09:22 +03:00
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								int ewald32_sigma_long_shiftedpoints (
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    complex double *target, // must be c->nelem_sc long
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    double *err,
 								    const qpms_ewald32_constants_t *c,
 								    const double eta, const double k, const double unitcell_area,
 								    const size_t npoints, const point2d *Kpoints_plus_beta,
-												Shifted lattices now consistent, TODO check overall shift sign and fix LR declarations


Former-commit-id: ff8a3a0b93447566a605bc7fe6ddbfe34dec3cd2
											
										
										
											2018-09-15 00:10:10 +03:00
+								    const point2d beta, // not needed
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    const point2d particle_shift // target - src
 								    )
 								{
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  const qpms_y_t nelem_sc = c->nelem_sc;
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								  const qpms_l_t lMax = c->lMax;
 								  // Manual init of the ewald summation targets
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  complex double *target_c = calloc(nelem_sc, sizeof(complex double));
 								  memset(target, 0, nelem_sc * sizeof(complex double));
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								  double *err_c = NULL;
 								  if (err) {
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    err_c = calloc(nelem_sc, sizeof(double));
 								    memset(err, 0, nelem_sc * sizeof(double));
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								  }
 								  const double commonfac = 1/(k*k*unitcell_area); // used in the very end (CFC)
 								  assert(commonfac > 0);
 								  // space for Gamma_pq[j]'s
-												Catch underflows; fix some off-by-one errors. Some test values pass now.


Former-commit-id: 3add9f21ad6fee5d443fafc3a6b2c02f2f8b6524
											
										
										
											2018-09-07 20:46:07 +03:00
+								  qpms_csf_result Gamma_pq[lMax/2+1];
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
 								  // CHOOSE POINT BEGIN
 								  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
-												ewald.c: type qualifiers


Former-commit-id: d1436642545f21bf3bf4a74f4365ece45b3a5c7d
											
										
										
											2018-09-15 21:32:49 +03:00
+								    const point2d beta_pq = Kpoints_plus_beta[i];
 								    const point2d K_pq = {beta_pq.x - beta.x, beta_pq.y - beta.y};
 								    const double rbeta_pq = cart2norm(beta_pq);
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								  // CHOOSE POINT END
-												ewald.c: type qualifiers


Former-commit-id: d1436642545f21bf3bf4a74f4365ece45b3a5c7d
											
										
										
											2018-09-15 21:32:49 +03:00
+								    const complex double phasefac = cexp(I*cart2_dot(K_pq,particle_shift)); // POINT-DEPENDENT (PFC) // !!!CHECKSIGN!!!
 								    const double arg_pq = atan2(beta_pq.y, beta_pq.x); // POINT-DEPENDENT
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
 								    // R-DEPENDENT BEGIN
-												ewald.c: type qualifiers


Former-commit-id: d1436642545f21bf3bf4a74f4365ece45b3a5c7d
											
										
										
											2018-09-15 21:32:49 +03:00
+								    const complex double gamma_pq = lilgamma(rbeta_pq/k);
 								    const complex double z = csq(gamma_pq*k/(2*eta)); // Když o tom tak přemýšlím, tak tohle je vlastně vždy reálné
-												Catch underflows; fix some off-by-one errors. Some test values pass now.


Former-commit-id: 3add9f21ad6fee5d443fafc3a6b2c02f2f8b6524
											
										
										
											2018-09-07 20:46:07 +03:00
+								    for(qpms_l_t j = 0; j <= lMax/2; ++j) {
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								      int retval = complex_gamma_inc_e(0.5-j, z, Gamma_pq+j);
-												Fix branch selection in long-range ewald sum.

Now everything is consistent except for sigma0


Former-commit-id: 86132a0db0604ed8c56f725eb95c5b22a103b804
											
										
										
											2018-09-13 01:16:13 +03:00
+								      // we take the other branch, cf. [Linton, p. 642 in the middle]: FIXME instead use the C11 CMPLX macros and fill in -O*I part to z in the line above
 								      if(creal(z) < 0)
 								        Gamma_pq[j].val = conj(Gamma_pq[j].val); //FIXME as noted above
-												Catch underflows; fix some off-by-one errors. Some test values pass now.


Former-commit-id: 3add9f21ad6fee5d443fafc3a6b2c02f2f8b6524
											
										
										
											2018-09-07 20:46:07 +03:00
+								      if(!(retval==0 ||retval==GSL_EUNDRFLW)) abort();
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    }
 								    // R-DEPENDENT END
 								    // TODO optimisations: all the j-dependent powers can be done for each j only once, stored in array
 								    // and just fetched for each n, m pair
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    for(qpms_l_t n = 0; n <= lMax; ++n)
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								      for(qpms_m_t m = -n; m <= n; ++m) {
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								        if((m+n) % 2 != 0) // odd coefficients are zero.
 								          continue;
-												ewald.c: type qualifiers


Former-commit-id: d1436642545f21bf3bf4a74f4365ece45b3a5c7d
											
										
										
											2018-09-15 21:32:49 +03:00
+								        const qpms_y_t y = qpms_mn2y_sc(m, n);
 								        const complex double e_imalpha_pq = cexp(I*m*arg_pq);
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								        complex double jsum, jsum_c; ckahaninit(&jsum, &jsum_c);
 								        double jsum_err, jsum_err_c; kahaninit(&jsum_err, &jsum_err_c); // TODO do I really need to kahan sum errors?
-												Catch underflows; fix some off-by-one errors. Some test values pass now.


Former-commit-id: 3add9f21ad6fee5d443fafc3a6b2c02f2f8b6524
											
										
										
											2018-09-07 20:46:07 +03:00
+								        assert((n-abs(m))/2 == c->s1_jMaxes[y]);
 								        for(qpms_l_t j = 0; j <= c->s1_jMaxes[y]/*(n-abs(m))/2*/; ++j) { // FIXME </<= ?
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								          complex double summand = pow(rbeta_pq/k, n-2*j)
-												Fix spherical harmonics for negative m in ewald.c.


Former-commit-id: 960dd721a009e2b2f82c986677c3faa65d36394c
											
										
										
											2018-09-10 15:28:41 +03:00
+								            * e_imalpha_pq  * c->legendre0[gsl_sf_legendre_array_index(n,abs(m))] * min1pow_m_neg(m) // This line can actually go outside j-loop
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								            * cpow(gamma_pq, 2*j-1) // * Gamma_pq[j] bellow (GGG) after error computation
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								            * c->s1_constfacs[y][j];
 								          if(err) {
 								            // FIXME include also other errors than Gamma_pq's relative error
 								             kahanadd(&jsum_err, &jsum_err_c, Gamma_pq[j].err * cabs(summand));
 								          }
 								          summand *= Gamma_pq[j].val; // GGG
 								          ckahanadd(&jsum, &jsum_c, summand);
 								        }
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								        jsum *= phasefac; // PFC
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								        ckahanadd(target + y, target_c + y, jsum);
 								        if(err) kahanadd(err + y, err_c + y, jsum_err);
 								      }
 								  } // END POINT LOOP
 								  free(err_c);
 								  free(target_c);
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  for(qpms_y_t y = 0; y < nelem_sc; ++y) // CFC common factor from above
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    target[y] *= commonfac;
 								  if(err)
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    for(qpms_y_t y = 0; y < nelem_sc; ++y)
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								      err[y] *= commonfac;
 								  return 0;
 								}
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
-												Ewald summation – stupid implementation of alternative lattice sums


Former-commit-id: de2830e9e5b65fd679fcf5fd1e8ec3e13dba116a
											
										
										
											2018-09-18 13:37:07 +03:00
+								int ewald32_sigma_long_points_and_shift (
 								    complex double *target, // must be c->nelem_sc long
 								    double *err,
 								    const qpms_ewald32_constants_t *c,
 								    const double eta, const double k, const double unitcell_area,
 								    const size_t npoints, const point2d *Kpoints,
-												dudom


Former-commit-id: 9584e40968c45c3acc25e90b51d28a1bb28b8f0c
											
										
										
											2018-11-14 18:36:15 +02:00
+								    const point2d beta,
-												Ewald summation – stupid implementation of alternative lattice sums


Former-commit-id: de2830e9e5b65fd679fcf5fd1e8ec3e13dba116a
											
										
										
											2018-09-18 13:37:07 +03:00
+								    const point2d particle_shift // target - src
 								    )
 								{
 								  const qpms_y_t nelem_sc = c->nelem_sc;
 								  const qpms_l_t lMax = c->lMax;
 								  // Manual init of the ewald summation targets
 								  complex double *target_c = calloc(nelem_sc, sizeof(complex double));
 								  memset(target, 0, nelem_sc * sizeof(complex double));
 								  double *err_c = NULL;
 								  if (err) {
 								    err_c = calloc(nelem_sc, sizeof(double));
 								    memset(err, 0, nelem_sc * sizeof(double));
 								  }
 								  const double commonfac = 1/(k*k*unitcell_area); // used in the very end (CFC)
 								  assert(commonfac > 0);
 								  // space for Gamma_pq[j]'s
 								  qpms_csf_result Gamma_pq[lMax/2+1];
 								  // CHOOSE POINT BEGIN
 								  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
-												dudom


Former-commit-id: 9584e40968c45c3acc25e90b51d28a1bb28b8f0c
											
										
										
											2018-11-14 18:36:15 +02:00
+								    // Only these following two lines differ from ewald32_sigma_long_points_and_shift()!!!  WTFCOMMENT?!
-												Ewald summation – stupid implementation of alternative lattice sums


Former-commit-id: de2830e9e5b65fd679fcf5fd1e8ec3e13dba116a
											
										
										
											2018-09-18 13:37:07 +03:00
+								    const point2d K_pq = Kpoints[i];
 								    const point2d beta_pq = {K_pq.x + beta.x, K_pq.y + beta.y};
 								    const double rbeta_pq = cart2norm(beta_pq);
 								  // CHOOSE POINT END
 								    const complex double phasefac = cexp(I*cart2_dot(K_pq,particle_shift)); // POINT-DEPENDENT (PFC) // !!!CHECKSIGN!!!
 								    const double arg_pq = atan2(beta_pq.y, beta_pq.x); // POINT-DEPENDENT
 								    // R-DEPENDENT BEGIN
 								    const complex double gamma_pq = lilgamma(rbeta_pq/k);
 								    const complex double z = csq(gamma_pq*k/(2*eta)); // Když o tom tak přemýšlím, tak tohle je vlastně vždy reálné
 								    for(qpms_l_t j = 0; j <= lMax/2; ++j) {
 								      int retval = complex_gamma_inc_e(0.5-j, z, Gamma_pq+j);
 								      // we take the other branch, cf. [Linton, p. 642 in the middle]: FIXME instead use the C11 CMPLX macros and fill in -O*I part to z in the line above
 								      if(creal(z) < 0)
 								        Gamma_pq[j].val = conj(Gamma_pq[j].val); //FIXME as noted above
 								      if(!(retval==0 ||retval==GSL_EUNDRFLW)) abort();
 								    }
 								    // R-DEPENDENT END
 								    // TODO optimisations: all the j-dependent powers can be done for each j only once, stored in array
 								    // and just fetched for each n, m pair
 								    for(qpms_l_t n = 0; n <= lMax; ++n)
 								      for(qpms_m_t m = -n; m <= n; ++m) {
 								        if((m+n) % 2 != 0) // odd coefficients are zero.
 								          continue;
 								        const qpms_y_t y = qpms_mn2y_sc(m, n);
 								        const complex double e_imalpha_pq = cexp(I*m*arg_pq);
 								        complex double jsum, jsum_c; ckahaninit(&jsum, &jsum_c);
 								        double jsum_err, jsum_err_c; kahaninit(&jsum_err, &jsum_err_c); // TODO do I really need to kahan sum errors?
 								        assert((n-abs(m))/2 == c->s1_jMaxes[y]);
 								        for(qpms_l_t j = 0; j <= c->s1_jMaxes[y]/*(n-abs(m))/2*/; ++j) { // FIXME </<= ?
 								          complex double summand = pow(rbeta_pq/k, n-2*j)
 								            * e_imalpha_pq  * c->legendre0[gsl_sf_legendre_array_index(n,abs(m))] * min1pow_m_neg(m) // This line can actually go outside j-loop
 								            * cpow(gamma_pq, 2*j-1) // * Gamma_pq[j] bellow (GGG) after error computation
 								            * c->s1_constfacs[y][j];
 								          if(err) {
 								            // FIXME include also other errors than Gamma_pq's relative error
 								             kahanadd(&jsum_err, &jsum_err_c, Gamma_pq[j].err * cabs(summand));
 								          }
 								          summand *= Gamma_pq[j].val; // GGG
 								          ckahanadd(&jsum, &jsum_c, summand);
 								        }
 								        jsum *= phasefac; // PFC
 								        ckahanadd(target + y, target_c + y, jsum);
 								        if(err) kahanadd(err + y, err_c + y, jsum_err);
 								      }
 								  } // END POINT LOOP
 								  free(err_c);
 								  free(target_c);
 								  for(qpms_y_t y = 0; y < nelem_sc; ++y) // CFC common factor from above
 								    target[y] *= commonfac;
 								  if(err)
 								    for(qpms_y_t y = 0; y < nelem_sc; ++y)
 								      err[y] *= commonfac;
 								  return 0;
 								}
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
 								struct sigma2_integrand_params {
 								  int n;
 								  double k, R;
 								};
 								static double sigma2_integrand(double ksi, void *params) {
 								  struct sigma2_integrand_params *p = (struct sigma2_integrand_params *) params;
 								  return exp(-sq(p->R * ksi) + sq(p->k / ksi / 2)) * pow(ksi, 2*p->n);
 								}
 								static int ewald32_sr_integral(double r, double k, int n, double eta,
 								    double *result, double *err, gsl_integration_workspace *workspace)
 								{
 								  struct sigma2_integrand_params p;
 								  const double R0 = r; // Maybe could be chosen otherwise, but fuck it for now.
 								  p.n = n;
 								  eta *= R0;
 								  p.k = k * R0;
 								  p.R = r / R0;  // i.e. p.R = 1
 								  gsl_function F;
 								  F.function = sigma2_integrand;
 								  F.params = &p;
 								  int retval = gsl_integration_qagiu(&F, eta, INTEGRATION_EPSABS,
 								      INTEGRATION_EPSREL, INTEGRATION_WORKSPACE_LIMIT,
 								      workspace, result, err);
 								  double normfac = pow(R0, -2*p.n - 1);
 								  *result *= normfac;
 								  *err *= normfac;
 								  return retval;
 								}
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								int ewald32_sigma_short_shiftedpoints(
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    complex double *target, // must be c->nelem_sc long
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								    double *err,
 								    const qpms_ewald32_constants_t *c, // N.B. not too useful here
 								    const double eta, const double k,
 								    const size_t npoints, const point2d *Rpoints_plus_particle_shift,
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								    const point2d beta,
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								    const point2d particle_shift           // used only in the very end to multiply it by the phase
 								    )
 								{
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  const qpms_y_t nelem_sc = c->nelem_sc;
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								  const qpms_l_t lMax = c->lMax;
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								  gsl_integration_workspace *workspace =
 								    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
 								  // Manual init of the ewald summation targets
-												konstantisace; dudopráce


Former-commit-id: a146fe83f9dbf17044cc723c325ba70230969e44
											
										
										
											2018-09-10 08:10:13 +03:00
+								  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								  memset(target, 0, nelem_sc * sizeof(complex double));
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								  double *err_c = NULL;
 								  if (err) {
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    err_c = calloc(nelem_sc, sizeof(double));
 								    memset(err, 0, nelem_sc * sizeof(double));
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								  }
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								// CHOOSE POINT BEGIN
 								  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
-												konstantisace; dudopráce


Former-commit-id: a146fe83f9dbf17044cc723c325ba70230969e44
											
										
										
											2018-09-10 08:10:13 +03:00
+								    const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
 								    const double r_pq_shifted = cart2norm(Rpq_shifted);
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								// CHOOSE POINT END
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
-												konstantisace; dudopráce


Former-commit-id: a146fe83f9dbf17044cc723c325ba70230969e44
											
										
										
											2018-09-10 08:10:13 +03:00
+								    const double Rpq_shifted_arg = atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
 								    const complex double e_beta_Rpq = cexp(I*cart2_dot(beta, Rpq_shifted)); // POINT-DEPENDENT
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    for(qpms_l_t n = 0; n <= lMax; ++n) {
-												konstantisace; dudopráce


Former-commit-id: a146fe83f9dbf17044cc723c325ba70230969e44
											
										
										
											2018-09-10 08:10:13 +03:00
+								      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // TODO put outside the R-loop and multiply in the end
 								      const double R_pq_pown = pow(r_pq_shifted, n);
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								      // TODO the integral here
 								      double intres, interr;
 								      int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
 								          &intres, &interr, workspace);
 								      if (retval) abort();
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								      for (qpms_m_t m = -n; m <= n; ++m){
 								        if((m+n) % 2 != 0) // odd coefficients are zero.
 								          continue; // nothing needed, already done by memset
-												konstantisace; dudopráce


Former-commit-id: a146fe83f9dbf17044cc723c325ba70230969e44
											
										
										
											2018-09-10 08:10:13 +03:00
+								        const complex double e_imf = cexp(I*m*Rpq_shifted_arg);
 								        const double leg = c->legendre0[gsl_sf_legendre_array_index(n, abs(m))];
 								        const qpms_y_t y = qpms_mn2y_sc(m,n);
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								        if(err)
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
+								          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								              * interr)); // TODO include also other errors
 								        ckahanadd(target + y, target_c + y,
-												Fix spherical harmonics for negative m in ewald.c.


Former-commit-id: 960dd721a009e2b2f82c986677c3faa65d36394c
											
										
										
											2018-09-10 15:28:41 +03:00
+								            prefacn * R_pq_pown * leg * intres * e_beta_Rpq * e_imf * min1pow_m_neg(m));
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								      }
-												ewald.c compiles


Former-commit-id: 7bcd240f3d9b5aba233550e4242736e700f96c35
											
										
										
											2018-09-05 10:58:13 +03:00
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								    }
 								  }
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
-												SR ewald sum in progress


Former-commit-id: 927486c4e73f5d60dd1f3c94ff5b4878506a5e17
											
										
										
											2018-08-27 14:39:29 +03:00
+								  gsl_integration_workspace_free(workspace);
-												Ewald short-range part etc.


Former-commit-id: 181d2da97f80dfcbe942d27819d831895a2df263
											
										
										
											2018-09-05 09:07:03 +03:00
+								  if(err) free(err_c);
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
+								  free(target_c);
 								  return 0;
 								}
-												Ewald summation – stupid implementation of alternative lattice sums


Former-commit-id: de2830e9e5b65fd679fcf5fd1e8ec3e13dba116a
											
										
										
											2018-09-18 13:37:07 +03:00
+								int ewald32_sigma_short_points_and_shift(
 								    complex double *target, // must be c->nelem_sc long
 								    double *err,
 								    const qpms_ewald32_constants_t *c, // N.B. not too useful here
 								    const double eta, const double k,
 								    const size_t npoints, const point2d *Rpoints,
 								    const point2d beta,
 								    const point2d particle_shift           // used only in the very end to multiply it by the phase
 								    )
 								{
 								  const qpms_y_t nelem_sc = c->nelem_sc;
 								  const qpms_l_t lMax = c->lMax;
 								  gsl_integration_workspace *workspace =
 								    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);
 								  // Manual init of the ewald summation targets
 								  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
 								  memset(target, 0, nelem_sc * sizeof(complex double));
 								  double *err_c = NULL;
 								  if (err) {
 								    err_c = calloc(nelem_sc, sizeof(double));
 								    memset(err, 0, nelem_sc * sizeof(double));
 								  }
 								// CHOOSE POINT BEGIN
 								  for (size_t i = 0; i < npoints; ++i) { // BEGIN POINT LOOP
 								    //const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
 								    const point2d Rpq_shifted = cart2_add(Rpoints[i], cart2_scale(-1,particle_shift)); // CHECKSIGN!!!!
 								    const double r_pq_shifted = cart2norm(Rpq_shifted);
 								// CHOOSE POINT END
 								    const double Rpq_shifted_arg = atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
 								    const complex double e_beta_Rpq = cexp(I*cart2_dot(beta, Rpq_shifted)); // POINT-DEPENDENT
 								    for(qpms_l_t n = 0; n <= lMax; ++n) {
 								      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // TODO put outside the R-loop and multiply in the end
 								      const double R_pq_pown = pow(r_pq_shifted, n);
 								      // TODO the integral here
 								      double intres, interr;
 								      int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
 								          &intres, &interr, workspace);
 								      if (retval) abort();
 								      for (qpms_m_t m = -n; m <= n; ++m){
 								        if((m+n) % 2 != 0) // odd coefficients are zero.
 								          continue; // nothing needed, already done by memset
 								        const complex double e_imf = cexp(I*m*Rpq_shifted_arg);
 								        const double leg = c->legendre0[gsl_sf_legendre_array_index(n, abs(m))];
 								        const qpms_y_t y = qpms_mn2y_sc(m,n);
 								        if(err)
 								          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
 								              * interr)); // TODO include also other errors
 								        ckahanadd(target + y, target_c + y,
 								            prefacn * R_pq_pown * leg * intres * e_beta_Rpq * e_imf * min1pow_m_neg(m));
 								      }
 								    }
 								  }
 								  gsl_integration_workspace_free(workspace);
 								  if(err) free(err_c);
 								  free(target_c);
 								  return 0;
 								}
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								int ewald3_sigma_short(
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								                complex double *target, // must be c->nelem_sc long
 								                double *err, // must be c->nelem_sc long or NULL
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								                const qpms_ewald32_constants_t *c,
 								                const double eta, const double k,
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								                const LatticeDimensionality latdim, // apart from asserts and possible optimisations ignored, as the SR formula stays the same
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								                PGenSph *pgen_R, const bool pgen_generates_shifted_points
 								                /* If false, the behaviour corresponds to the old ewald32_sigma_short_points_and_shift,
 								                 * so the function assumes that the generated points correspond to the unshifted Bravais lattice,
 								                 * and adds particle_shift to the generated points before calculations.
 								                 * If true, it assumes that they are already shifted (if calculating interaction between
 								                 * different particles in the unit cell).
 								                 */,
 								                const cart3_t beta,
 								                const cart3_t particle_shift
 								                )
 								{
 								  const qpms_y_t nelem_sc = c->nelem_sc;
 								  const qpms_l_t lMax = c->lMax;
 								  gsl_integration_workspace *workspace =
 								    gsl_integration_workspace_alloc(INTEGRATION_WORKSPACE_LIMIT);
 								  double legendre_buf[gsl_sf_legendre_array_n(c->lMax)]; // work space for the legendre polynomials (used only in the general case)
 								  // Manual init of the ewald summation targets
 								  complex double * const target_c = calloc(nelem_sc, sizeof(complex double));
 								  memset(target, 0, nelem_sc * sizeof(complex double));
 								  double *err_c = NULL;
 								  if (err) {
 								    err_c = calloc(nelem_sc, sizeof(double));
 								    memset(err, 0, nelem_sc * sizeof(double));
 								  }
 								  PGenSphReturnData pgen_retdata;
 								#ifndef NDEBUG
 								  double r_pq_shifted_prev;
 								#endif
 								  // recyclable variables if r_pq_shifted stays the same:
 								  double intres[lMax+1], interr[lMax+1];
 								// CHOOSE POINT BEGIN
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								  while ((pgen_retdata = PGenSph_next(pgen_R)).flags & PGEN_NOTDONE) { // BEGIN POINT LOOP
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								// CHOOSE POINT END
 								    cart3_t Rpq_shifted_cart; // I will need both sph and cart representations anyway...
 								    sph_t Rpq_shifted_sph;
 								    if (pgen_generates_shifted_points) {
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								      Rpq_shifted_sph = pgen_retdata.point_sph;
 								      Rpq_shifted_cart = sph2cart(Rpq_shifted_sph);
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								    } else { // as in the old _points_and_shift functions
 								      //const point2d Rpq_shifted = Rpoints_plus_particle_shift[i];
 								      const sph_t bravais_point_sph = pgen_retdata.point_sph;
 								      const cart3_t bravais_point_cart = sph2cart(bravais_point_sph);
 								      Rpq_shifted_cart = cart3_add(bravais_point_cart, cart3_scale(-1, particle_shift)); // CHECKSIGN!!!
 								      Rpq_shifted_sph = cart2sph(Rpq_shifted_cart);
 								    }
 								    // TODO eliminate and use the Rpq_shifted_sph members directly (but in compiler optimizations we trust)
 								    const double Rpq_shifted_arg = Rpq_shifted_sph.phi; //atan2(Rpq_shifted.y, Rpq_shifted.x); // POINT-DEPENDENT
 								    const double Rpq_shifted_theta = Rpq_shifted_sph.theta; // POINT-DEPENDENT
 								    const double r_pq_shifted = Rpq_shifted_sph.r;
 								    // if the radius is the same as in previous cycle, most of the calculations can be recycled
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								    const bool new_r_pq_shifted = (!pgen_generates_shifted_points) || (pgen_retdata.flags & PGEN_NEWR);
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								    if (!new_r_pq_shifted) assert(r_pq_shifted_prev == r_pq_shifted);
 								    const complex double e_beta_Rpq = cexp(I*cart3_dot(beta, Rpq_shifted_cart)); // POINT-DEPENDENT
 								    LatticeDimensionality speedup_regime = 0;
 								    if ((latdim & LAT_2D_IN_3D_XYONLY) == LAT_2D_IN_3D_XYONLY) speedup_regime = LAT_2D_IN_3D_XYONLY;
 								    if ((latdim & LAT_1D_IN_3D_ZONLY)  == LAT_1D_IN_3D_ZONLY)  speedup_regime = LAT_1D_IN_3D_ZONLY;
 								    const double * legendre_array;
 								    switch(speedup_regime) {
 								      // speedup checks for special geometries and Legendre polynomials
 								      case LAT_1D_IN_3D_ZONLY:
 								        assert((pgen_retdata.flags & PGEN_AT_Z) == PGEN_AT_Z);
 								        assert(Rpq_shifted_theta == M_PI || Rpq_shifted_theta == 0);
 								        legendre_array = (Rpq_shifted_theta == 0) ? c->legendre_plus1 : c->legendre_minus1; // CHECKSIGN
 								        break;
 								      case LAT_2D_IN_3D_XYONLY:
 								        assert((pgen_retdata.flags &PGEN_AT_XY) == PGEN_AT_XY);
 								        assert(Rpq_shifted_theta == M_PI_2);
 								        legendre_array = c->legendre0;
 								        break;
 								      default:
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								        if(GSL_SUCCESS != gsl_sf_legendre_array_e(c->legendre_normconv, lMax, cos(Rpq_shifted_theta), c->legendre_csphase, legendre_buf))
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								        abort();
 								        legendre_array = legendre_buf;
 								        break;
 								    }
 								    for(qpms_l_t n = 0; n <= lMax; ++n) {
 								      const double complex prefacn = - I * pow(2./k, n+1) * M_2_SQRTPI / 2; // profiling TODO put outside the R-loop and multiply in the end?
 								      const double R_pq_pown = pow(r_pq_shifted, n); // profiling TODO: maybe put this into the new_r_pq_shifted condition as well?
 								      if (new_r_pq_shifted) {
 								        int retval = ewald32_sr_integral(r_pq_shifted, k, n, eta,
 								            intres + n, interr + n, workspace);
 								        if (retval) abort();
 								      } // otherwise recycle the integrals
 								      for (qpms_m_t m = -n; m <= n; ++m){
 								        complex double e_imf;
 								        // SPEEDUPS for some special geometries
 								        if(speedup_regime == LAT_2D_IN_3D_XYONLY) { //2D lattice inside the xy plane
 								          if((m+n) % 2 != 0) // odd coefficients are zero.
 								            continue; // nothing needed, already done by memset
 								          e_imf = cexp(I*m*Rpq_shifted_arg); // profiling TODO: calculate outside the n-loop?
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								        } else if (speedup_regime == LAT_1D_IN_3D_ZONLY) { // 1D lattice along the z axis
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								          if (m != 0) // m-non-zero coefficients are zero
 								            continue; // nothing needed, already done by memset
 								          e_imf = 1;
 								        } else { // general 1D/2D/3D lattice in 3D space
 								          e_imf = cexp(I*m*Rpq_shifted_arg);
 								        }
 								        const double leg = legendre_array[gsl_sf_legendre_array_index(n, abs(m))];
 								        const qpms_y_t y = qpms_mn2y_sc(m,n);
 								        if(err)
 								          kahanadd(err + y, err_c + y, cabs(leg * (prefacn / I) * R_pq_pown
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								              * interr[n])); // TODO include also other errors
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								        ckahanadd(target + y, target_c + y,
-												General 3D Ewald short-range part now compiles.
Unchecked, untested.


Former-commit-id: 40c10a0eef6575cd29e95be5a0908e28c24ded1d
											
										
										
											2018-11-21 21:41:20 +02:00
+								            prefacn * R_pq_pown * leg * intres[n] * e_beta_Rpq * e_imf * min1pow_m_neg(m));
-												Half-implemented the general short-range part of ewald sum in 3D,
unchecked, untested, dudom.


Former-commit-id: b3551114b8c7136e378feb6dc78cb575a5bfc162
											
										
										
											2018-11-21 19:49:07 +02:00
+								      }
 								    }
 								#ifndef NDEBUG
 								    r_pq_shifted_prev = r_pq_shifted;
 								#endif
 								  }
 								  gsl_integration_workspace_free(workspace);
 								  if(err) free(err_c);
 								  free(target_c);
 								  return 0;
 								}
-												Ewald summation – stupid implementation of alternative lattice sums


Former-commit-id: de2830e9e5b65fd679fcf5fd1e8ec3e13dba116a
											
										
										
											2018-09-18 13:37:07 +03:00
-												Jdunakonferenci


Former-commit-id: e734bb63665d03b986a98e45f937979eacab58c4
											
										
										
											2018-08-27 10:28:34 +03:00
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								#if 0
 								int ewald32_sigma_long_shiftedpoints_rordered(
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    complex double *target_sigmalr_y, // must be c->nelem_sc long
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    const qpms_ewald32_constants_t *c,
 								    double eta, double k, double unitcell_area,
 								    const points2d_rordered_t *Kpoints_plus_beta_rordered,
 								    point2d particle_shift
 								    );
 								int ewald32_sigma_short_points_rordered(
-												Scalar m,n indexing to allow n = 0.


Former-commit-id: 4b6f2f3611a00e2019b54bfe73c407baafdd8355
											
										
										
											2018-09-05 15:39:02 +03:00
+								    complex double *target_sigmasr_y, // must be c->nelem_sc long
-												Ewald summation LR part, stupid.


Former-commit-id: 9795ad00b41e83c30feb027853a13959d8b506ea
											
										
										
											2018-08-27 09:45:11 +03:00
+								    const qpms_ewald32_constants_t *c, // N.B. not too useful here
 								    double eta, double k,
 								    const points2d_rordered_t *Rpoints_plus_particle_shift_rordered,
 								    point2d particle_shift    // used only in the very end to multiply it by the phase
 								    );
 								#endif