Handling of zero packed orbit sizes.
Former-commit-id: 75ff318b4c91477a22f0fcee30fcb8812de1faba
This commit is contained in:
parent
f30c5a88d9
commit
297995690a
|
@ -807,6 +807,8 @@ complex double *qpms_scatsys_irrep_pack_matrix(complex double *target_packed,
|
||||||
const complex double *orig_full, const qpms_scatsys_t *ss,
|
const complex double *orig_full, const qpms_scatsys_t *ss,
|
||||||
qpms_iri_t iri){
|
qpms_iri_t iri){
|
||||||
const size_t packedlen = ss->saecv_sizes[iri];
|
const size_t packedlen = ss->saecv_sizes[iri];
|
||||||
|
if (!packedlen) // THIS IS A BIT PROBLEMATIC, TODO how to deal with empty irreps?
|
||||||
|
return target_packed;
|
||||||
const size_t full_len = ss->fecv_size;
|
const size_t full_len = ss->fecv_size;
|
||||||
if (target_packed == NULL)
|
if (target_packed == NULL)
|
||||||
target_packed = malloc(SQ(packedlen)*sizeof(complex double));
|
target_packed = malloc(SQ(packedlen)*sizeof(complex double));
|
||||||
|
@ -837,6 +839,7 @@ complex double *qpms_scatsys_irrep_pack_matrix(complex double *target_packed,
|
||||||
const complex double *omR = otR->irbases + otR->irbase_offsets[iri];
|
const complex double *omR = otR->irbases + otR->irbase_offsets[iri];
|
||||||
|
|
||||||
size_t fullvec_offsetC = 0;
|
size_t fullvec_offsetC = 0;
|
||||||
|
if(orbit_packedsizeR) { // avoid zgemm crash on empty irrep
|
||||||
for(qpms_ss_pi_t piC = 0; piC < ss->p_count; ++piC) { //Column loop
|
for(qpms_ss_pi_t piC = 0; piC < ss->p_count; ++piC) { //Column loop
|
||||||
const qpms_ss_oti_t otiC = ss->p_orbitinfo[piC].t;
|
const qpms_ss_oti_t otiC = ss->p_orbitinfo[piC].t;
|
||||||
const qpms_ss_orbit_type_t *const otC = ss->orbit_types + otiC;
|
const qpms_ss_orbit_type_t *const otC = ss->orbit_types + otiC;
|
||||||
|
@ -853,6 +856,7 @@ complex double *qpms_scatsys_irrep_pack_matrix(complex double *target_packed,
|
||||||
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
||||||
const complex double *omC = otC->irbases + otC->irbase_offsets[iri];
|
const complex double *omC = otC->irbases + otC->irbase_offsets[iri];
|
||||||
|
|
||||||
|
if(orbit_packedsizeC) { // avoid zgemm crash on empty irrep
|
||||||
// tmp[oiR|piR,piC] = ∑_K M[piR,K] U*[K,piC]
|
// tmp[oiR|piR,piC] = ∑_K M[piR,K] U*[K,piC]
|
||||||
cblas_zgemm(CblasRowMajor, CblasNoTrans, CblasConjTrans,
|
cblas_zgemm(CblasRowMajor, CblasNoTrans, CblasConjTrans,
|
||||||
particle_fullsizeR /*M*/, orbit_packedsizeC /*N*/, particle_fullsizeC /*K*/,
|
particle_fullsizeR /*M*/, orbit_packedsizeC /*N*/, particle_fullsizeC /*K*/,
|
||||||
|
@ -870,12 +874,12 @@ complex double *qpms_scatsys_irrep_pack_matrix(complex double *target_packed,
|
||||||
tmp /*B*/, orbit_packedsizeC /*ldB*/, &one /*beta*/,
|
tmp /*B*/, orbit_packedsizeC /*ldB*/, &one /*beta*/,
|
||||||
target_packed + packedlen*packed_orbit_offsetR + packed_orbit_offsetC /*C*/,
|
target_packed + packedlen*packed_orbit_offsetR + packed_orbit_offsetC /*C*/,
|
||||||
packedlen /*ldC*/);
|
packedlen /*ldC*/);
|
||||||
|
}
|
||||||
fullvec_offsetC += otC->bspecn;
|
fullvec_offsetC += otC->bspecn;
|
||||||
}
|
}
|
||||||
fullvec_offsetR += otR->bspecn;
|
fullvec_offsetR += otR->bspecn;
|
||||||
}
|
}
|
||||||
|
}
|
||||||
free(tmp);
|
free(tmp);
|
||||||
return target_packed;
|
return target_packed;
|
||||||
}
|
}
|
||||||
|
@ -892,6 +896,8 @@ complex double *qpms_scatsys_irrep_unpack_matrix(complex double *target_full,
|
||||||
if (target_full == NULL) abort();
|
if (target_full == NULL) abort();
|
||||||
if(!add) memset(target_full, 0, SQ(full_len)*sizeof(complex double));
|
if(!add) memset(target_full, 0, SQ(full_len)*sizeof(complex double));
|
||||||
|
|
||||||
|
if(!packedlen) return target_full; // Empty irrep, do nothing.
|
||||||
|
|
||||||
// Workspace for the intermediate particle-orbit matrix result
|
// Workspace for the intermediate particle-orbit matrix result
|
||||||
complex double *tmp = malloc(sizeof(complex double) * SQ(ss->max_bspecn)
|
complex double *tmp = malloc(sizeof(complex double) * SQ(ss->max_bspecn)
|
||||||
* ss->sym->order); if (!tmp) abort();
|
* ss->sym->order); if (!tmp) abort();
|
||||||
|
@ -916,6 +922,7 @@ complex double *qpms_scatsys_irrep_unpack_matrix(complex double *target_full,
|
||||||
const complex double *omR = otR->irbases + otR->irbase_offsets[iri];
|
const complex double *omR = otR->irbases + otR->irbase_offsets[iri];
|
||||||
|
|
||||||
size_t fullvec_offsetC = 0;
|
size_t fullvec_offsetC = 0;
|
||||||
|
if (orbit_packedsizeR) // avoid crash on empty irrep
|
||||||
for(qpms_ss_pi_t piC = 0; piC < ss->p_count; ++piC) { //Column loop
|
for(qpms_ss_pi_t piC = 0; piC < ss->p_count; ++piC) { //Column loop
|
||||||
const qpms_ss_oti_t otiC = ss->p_orbitinfo[piC].t;
|
const qpms_ss_oti_t otiC = ss->p_orbitinfo[piC].t;
|
||||||
const qpms_ss_orbit_type_t *const otC = ss->orbit_types + otiC;
|
const qpms_ss_orbit_type_t *const otC = ss->orbit_types + otiC;
|
||||||
|
@ -931,6 +938,7 @@ complex double *qpms_scatsys_irrep_unpack_matrix(complex double *target_full,
|
||||||
const size_t orbit_packedsizeC = otC->irbase_sizes[iri];
|
const size_t orbit_packedsizeC = otC->irbase_sizes[iri];
|
||||||
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
||||||
const complex double *omC = otC->irbases + otC->irbase_offsets[iri];
|
const complex double *omC = otC->irbases + otC->irbase_offsets[iri];
|
||||||
|
if (orbit_packedsizeC) { // avoid crash on empty irrep
|
||||||
// tmp = P U
|
// tmp = P U
|
||||||
// tmp[oiR|piR,piC] = ∑_K M[piR,K] U[K,piC]
|
// tmp[oiR|piR,piC] = ∑_K M[piR,K] U[K,piC]
|
||||||
cblas_zgemm(CblasRowMajor, CblasNoTrans, CblasNoTrans,
|
cblas_zgemm(CblasRowMajor, CblasNoTrans, CblasNoTrans,
|
||||||
|
@ -949,7 +957,7 @@ complex double *qpms_scatsys_irrep_unpack_matrix(complex double *target_full,
|
||||||
tmp /*B*/, particle_fullsizeC /*ldB*/, &one /*beta*/,
|
tmp /*B*/, particle_fullsizeC /*ldB*/, &one /*beta*/,
|
||||||
target_full + full_len*fullvec_offsetR + fullvec_offsetC /*C*/,
|
target_full + full_len*fullvec_offsetR + fullvec_offsetC /*C*/,
|
||||||
full_len /*ldC*/);
|
full_len /*ldC*/);
|
||||||
|
}
|
||||||
fullvec_offsetC += otC->bspecn;
|
fullvec_offsetC += otC->bspecn;
|
||||||
}
|
}
|
||||||
fullvec_offsetR += otR->bspecn;
|
fullvec_offsetR += otR->bspecn;
|
||||||
|
@ -965,6 +973,7 @@ complex double *qpms_scatsys_irrep_pack_vector(complex double *target_packed,
|
||||||
const complex double *orig_full, const qpms_scatsys_t *ss,
|
const complex double *orig_full, const qpms_scatsys_t *ss,
|
||||||
const qpms_iri_t iri) {
|
const qpms_iri_t iri) {
|
||||||
const size_t packedlen = ss->saecv_sizes[iri];
|
const size_t packedlen = ss->saecv_sizes[iri];
|
||||||
|
if (!packedlen) return target_packed; // Empty irrep
|
||||||
if (target_packed == NULL)
|
if (target_packed == NULL)
|
||||||
target_packed = malloc(packedlen*sizeof(complex double));
|
target_packed = malloc(packedlen*sizeof(complex double));
|
||||||
if (target_packed == NULL) abort();
|
if (target_packed == NULL) abort();
|
||||||
|
@ -988,13 +997,12 @@ complex double *qpms_scatsys_irrep_pack_vector(complex double *target_packed,
|
||||||
const size_t orbit_packedsize = ot->irbase_sizes[iri];
|
const size_t orbit_packedsize = ot->irbase_sizes[iri];
|
||||||
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
||||||
const complex double *om = ot->irbases + ot->irbase_offsets[iri];
|
const complex double *om = ot->irbases + ot->irbase_offsets[iri];
|
||||||
|
if (orbit_packedsize) // avoid crash on empty irrep
|
||||||
cblas_zgemv(CblasRowMajor/*order*/, CblasNoTrans/*transA*/,
|
cblas_zgemv(CblasRowMajor/*order*/, CblasNoTrans/*transA*/,
|
||||||
orbit_packedsize/*M*/, particle_fullsize/*N*/, &one/*alpha*/,
|
orbit_packedsize/*M*/, particle_fullsize/*N*/, &one/*alpha*/,
|
||||||
om + opi*particle_fullsize/*A*/, orbit_fullsize/*lda*/,
|
om + opi*particle_fullsize/*A*/, orbit_fullsize/*lda*/,
|
||||||
orig_full+fullvec_offset/*X*/, 1/*incX*/,
|
orig_full+fullvec_offset/*X*/, 1/*incX*/,
|
||||||
&one/*beta*/, target_packed+packed_orbit_offset/*Y*/, 1/*incY*/);
|
&one/*beta*/, target_packed+packed_orbit_offset/*Y*/, 1/*incY*/);
|
||||||
|
|
||||||
fullvec_offset += ot->bspecn;
|
fullvec_offset += ot->bspecn;
|
||||||
}
|
}
|
||||||
return target_packed;
|
return target_packed;
|
||||||
|
@ -1013,6 +1021,7 @@ complex double *qpms_scatsys_irrep_unpack_vector(complex double *target_full,
|
||||||
|
|
||||||
const complex double one = 1;
|
const complex double one = 1;
|
||||||
const size_t packedlen = ss->saecv_sizes[iri];
|
const size_t packedlen = ss->saecv_sizes[iri];
|
||||||
|
if (!packedlen) return target_full; // Completely empty irrep
|
||||||
|
|
||||||
size_t fullvec_offset = 0;
|
size_t fullvec_offset = 0;
|
||||||
for(qpms_ss_pi_t pi = 0; pi < ss->p_count; ++pi) {
|
for(qpms_ss_pi_t pi = 0; pi < ss->p_count; ++pi) {
|
||||||
|
@ -1030,6 +1039,7 @@ complex double *qpms_scatsys_irrep_unpack_vector(complex double *target_full,
|
||||||
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
// This is the orbit-level matrix projecting the whole orbit onto the irrep.
|
||||||
const complex double *om = ot->irbases + ot->irbase_offsets[iri];
|
const complex double *om = ot->irbases + ot->irbase_offsets[iri];
|
||||||
|
|
||||||
|
if (orbit_packedsize) // empty irrep, avoid zgemv crashing.
|
||||||
cblas_zgemv(CblasRowMajor/*order*/, CblasConjTrans/*transA*/,
|
cblas_zgemv(CblasRowMajor/*order*/, CblasConjTrans/*transA*/,
|
||||||
orbit_packedsize/*M*/, particle_fullsize/*N*/, &one/*alpha*/, om + opi*particle_fullsize/*A*/,
|
orbit_packedsize/*M*/, particle_fullsize/*N*/, &one/*alpha*/, om + opi*particle_fullsize/*A*/,
|
||||||
orbit_fullsize/*lda*/, orig_packed+packed_orbit_offset /*X*/, 1/*incX*/, &one/*beta*/,
|
orbit_fullsize/*lda*/, orig_packed+packed_orbit_offset /*X*/, 1/*incX*/, &one/*beta*/,
|
||||||
|
|
Loading…
Reference in New Issue