ewald.cpp
No OneTemporary
Actions

Subscribers

None

File Metadata

Created: Sun, Jul 6, 03:40

ewald.cpp
View Options

	/* ----------------------------------------------------------------------
	LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
	http://lammps.sandia.gov, Sandia National Laboratories
	Steve Plimpton, sjplimp@sandia.gov

	Copyright (2003) Sandia Corporation. Under the terms of Contract
	DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
	certain rights in this software. This software is distributed under
	the GNU General Public License.

	See the README file in the top-level LAMMPS directory.
	------------------------------------------------------------------------- */

	/* ----------------------------------------------------------------------
	Contributing authors: Roy Pollock (LLNL), Paul Crozier (SNL)
	per-atom energy/virial added by German Samolyuk (ORNL), Stan Moore (BYU)
	------------------------------------------------------------------------- */

	#include "mpi.h"
	#include "stdlib.h"
	#include "stdio.h"
	#include "string.h"
	#include "math.h"
	#include "ewald.h"
	#include "atom.h"
	#include "comm.h"
	#include "force.h"
	#include "pair.h"
	#include "domain.h"
	#include "math_const.h"
	#include "memory.h"
	#include "error.h"

	using namespace LAMMPS_NS;
	using namespace MathConst;

	#define SMALL 0.00001

	/* ---------------------------------------------------------------------- */

	Ewald::Ewald(LAMMPS lmp, int narg, char *arg) : KSpace(lmp, narg, arg)
	{
	if (narg != 1) error->all(FLERR,"Illegal kspace_style ewald command");

	precision = atof(arg[0]);

	kmax = 0;
	kxvecs = kyvecs = kzvecs = NULL;
	ug = NULL;
	eg = vg = NULL;
	sfacrl = sfacim = sfacrl_all = sfacim_all = NULL;

	nmax = 0;
	ek = NULL;
	cs = sn = NULL;

	kcount = 0;
	}

	/* ----------------------------------------------------------------------
	free all memory
	------------------------------------------------------------------------- */

	Ewald::~Ewald()
	{
	deallocate();
	memory->destroy(ek);
	memory->destroy3d_offset(cs,-kmax_created);
	memory->destroy3d_offset(sn,-kmax_created);
	}

	/* ---------------------------------------------------------------------- */

	void Ewald::init()
	{
	if (comm->me == 0) {
	if (screen) fprintf(screen,"Ewald initialization ...\n");
	if (logfile) fprintf(logfile,"Ewald initialization ...\n");
	}

	// error check

	if (domain->triclinic)
	error->all(FLERR,"Cannot use Ewald with triclinic box");
	if (domain->dimension == 2)
	error->all(FLERR,"Cannot use Ewald with 2d simulation");

	if (!atom->q_flag) error->all(FLERR,"Kspace style requires atom attribute q");

	if (slabflag == 0 && domain->nonperiodic > 0)
	error->all(FLERR,"Cannot use nonperiodic boundaries with Ewald");
	if (slabflag == 1) {
	if (domain->xperiodic != 1 \|\| domain->yperiodic != 1 \|\|
	domain->boundary[2][0] != 1 \|\| domain->boundary[2][1] != 1)
	error->all(FLERR,"Incorrect boundaries with slab Ewald");
	}

	// extract short-range Coulombic cutoff from pair style

	scale = 1.0;

	if (force->pair == NULL)
	error->all(FLERR,"KSpace style is incompatible with Pair style");
	int itmp;
	double p_cutoff = (double ) force->pair->extract("cut_coul",itmp);
	if (p_cutoff == NULL)
	error->all(FLERR,"KSpace style is incompatible with Pair style");
	double cutoff = *p_cutoff;

	qsum = qsqsum = 0.0;
	for (int i = 0; i < atom->nlocal; i++) {
	qsum += atom->q[i];
	qsqsum += atom->q[i]*atom->q[i];
	}

	double tmp;
	MPI_Allreduce(&qsum,&tmp,1,MPI_DOUBLE,MPI_SUM,world);
	qsum = tmp;
	MPI_Allreduce(&qsqsum,&tmp,1,MPI_DOUBLE,MPI_SUM,world);
	qsqsum = tmp;

	if (qsqsum == 0.0)
	error->all(FLERR,"Cannot use kspace solver on system with no charge");
	if (fabs(qsum) > SMALL && comm->me == 0) {
	char str[128];
	sprintf(str,"System is not charge neutral, net charge = %g",qsum);
	error->warning(FLERR,str);
	}

	// setup K-space resolution

	if (!gewaldflag) g_ewald = (1.35 - 0.15*log(precision))/cutoff;
	gsqmx = -4.0g_ewaldg_ewald*log(precision);

	if (comm->me == 0) {
	if (screen) fprintf(screen," G vector (1/distance) = %g\n",g_ewald);
	if (logfile) fprintf(logfile," G vector (1/distnace) = %g\n",g_ewald);
	}

	// setup Ewald coefficients so can print stats

	setup();

	if (comm->me == 0) {
	if (screen) fprintf(screen," vectors: actual 1d max = %d %d %d\n",
	kcount,kmax,kmax3d);
	if (logfile) fprintf(logfile," vectors: actual 1d max = %d %d %d\n",
	kcount,kmax,kmax3d);
	}
	}

	/* ----------------------------------------------------------------------
	adjust Ewald coeffs, called initially and whenever volume has changed
	------------------------------------------------------------------------- */

	void Ewald::setup()
	{
	// volume-dependent factors

	double xprd = domain->xprd;
	double yprd = domain->yprd;
	double zprd = domain->zprd;

	// adjustment of z dimension for 2d slab Ewald
	// 3d Ewald just uses zprd since slab_volfactor = 1.0

	double zprd_slab = zprd*slab_volfactor;
	volume = xprd * yprd * zprd_slab;

	unitk[0] = 2.0*MY_PI/xprd;
	unitk[1] = 2.0*MY_PI/yprd;
	unitk[2] = 2.0*MY_PI/zprd_slab;

	// determine kmax
	// function of current box size, precision, G_ewald (short-range cutoff)

	int nkxmx = static_cast<int> ((g_ewaldxprd/MY_PI) sqrt(-log(precision)));
	int nkymx = static_cast<int> ((g_ewaldyprd/MY_PI) sqrt(-log(precision)));
	int nkzmx =
	static_cast<int> ((g_ewaldzprd_slab/MY_PI) sqrt(-log(precision)));

	int kmax_old = kmax;
	kmax = MAX(nkxmx,nkymx);
	kmax = MAX(kmax,nkzmx);
	kmax3d = 4kmaxkmaxkmax + 6kmaxkmax + 3kmax;

	// if size has grown, reallocate k-dependent and nlocal-dependent arrays

	if (kmax > kmax_old) {
	deallocate();
	allocate();

	memory->destroy(ek);
	memory->destroy3d_offset(cs,-kmax_created);
	memory->destroy3d_offset(sn,-kmax_created);
	nmax = atom->nmax;
	memory->create(ek,nmax,3,"ewald:ek");
	memory->create3d_offset(cs,-kmax,kmax,3,nmax,"ewald:cs");
	memory->create3d_offset(sn,-kmax,kmax,3,nmax,"ewald:sn");
	kmax_created = kmax;
	}

	// pre-compute Ewald coefficients

	coeffs();
	}

	/* ----------------------------------------------------------------------
	compute the Ewald long-range force, energy, virial
	------------------------------------------------------------------------- */

	void Ewald::compute(int eflag, int vflag)
	{
	int i,j,k;

	// set energy/virial flags

	if (eflag \|\| vflag) ev_setup(eflag,vflag);
	else evflag = evflag_atom = eflag_global = vflag_global =
	eflag_atom = vflag_atom = 0;

	// extend size of per-atom arrays if necessary

	if (atom->nlocal > nmax) {
	memory->destroy(ek);
	memory->destroy3d_offset(cs,-kmax_created);
	memory->destroy3d_offset(sn,-kmax_created);
	nmax = atom->nmax;
	memory->create(ek,nmax,3,"ewald:ek");
	memory->create3d_offset(cs,-kmax,kmax,3,nmax,"ewald:cs");
	memory->create3d_offset(sn,-kmax,kmax,3,nmax,"ewald:sn");
	kmax_created = kmax;
	}

	// partial structure factors on each processor
	// total structure factor by summing over procs

	eik_dot_r();
	MPI_Allreduce(sfacrl,sfacrl_all,kcount,MPI_DOUBLE,MPI_SUM,world);
	MPI_Allreduce(sfacim,sfacim_all,kcount,MPI_DOUBLE,MPI_SUM,world);

	// K-space portion of electric field
	// double loop over K-vectors and local atoms
	// perform per-atom calculations if needed

	double **f = atom->f;
	double *q = atom->q;
	int nlocal = atom->nlocal;

	int kx,ky,kz;
	double cypz,sypz,exprl,expim,partial,partial_peratom;

	for (i = 0; i < nlocal; i++) {
	ek[i][0] = 0.0;
	ek[i][1] = 0.0;
	ek[i][2] = 0.0;
	}

	for (k = 0; k < kcount; k++) {
	kx = kxvecs[k];
	ky = kyvecs[k];
	kz = kzvecs[k];

	for (i = 0; i < nlocal; i++) {
	cypz = cs[ky][1][i]cs[kz][2][i] - sn[ky][1][i]sn[kz][2][i];
	sypz = sn[ky][1][i]cs[kz][2][i] + cs[ky][1][i]sn[kz][2][i];
	exprl = cs[kx][0][i]cypz - sn[kx][0][i]sypz;
	expim = sn[kx][0][i]cypz + cs[kx][0][i]sypz;
	partial = expimsfacrl_all[k] - exprlsfacim_all[k];
	ek[i][0] += partial*eg[k][0];
	ek[i][1] += partial*eg[k][1];
	ek[i][2] += partial*eg[k][2];

	if (evflag_atom) {
	partial_peratom = exprlsfacrl_all[k] + expimsfacim_all[k];
	if (eflag_atom) eatom[i] += q[i]ug[k]partial_peratom;
	if (vflag_atom)
	for (j = 0; j < 6; j++)
	vatom[i][j] += ug[k]vg[k][j]partial_peratom;
	}
	}
	}

	// convert E-field to force

	const double qscale = force->qqrd2e * scale;

	for (i = 0; i < nlocal; i++) {
	f[i][0] += qscale * q[i]*ek[i][0];
	f[i][1] += qscale * q[i]*ek[i][1];
	f[i][2] += qscale * q[i]*ek[i][2];
	}

	// global energy

	if (eflag_global) {
	for (k = 0; k < kcount; k++)
	energy += ug[k] * (sfacrl_all[k]*sfacrl_all[k] +
	sfacim_all[k]*sfacim_all[k]);
	energy -= g_ewald*qsqsum/MY_PIS +
	MY_PI2qsumqsum / (g_ewaldg_ewaldvolume);
	energy *= qscale;
	}

	// global virial

	if (vflag_global) {
	double uk;
	for (k = 0; k < kcount; k++) {
	uk = ug[k] * (sfacrl_all[k]sfacrl_all[k] + sfacim_all[k]sfacim_all[k]);
	for (j = 0; j < 6; j++) virial[j] += uk*vg[k][j];
	}
	for (j = 0; j < 6; j++) virial[j] *= qscale;
	}

	// per-atom energy/virial
	// energy includes self-energy correction

	if (evflag_atom) {
	if (eflag_atom) {
	for (i = 0; i < nlocal; i++) {
	eatom[i] -= g_ewaldq[i]q[i]/MY_PIS + MY_PI2q[i]qsum /
	(g_ewaldg_ewaldvolume);
	eatom[i] *= qscale;
	}
	}

	if (vflag_atom)
	for (i = 0; i < nlocal; i++)
	for (j = 0; j < 6; j++) vatom[i][j] = q[i]qscale;
	}

	// 2d slab correction

	if (slabflag) slabcorr();
	}

	/* ---------------------------------------------------------------------- */

	void Ewald::eik_dot_r()
	{
	int i,k,l,m,n,ic;
	double cstr1,sstr1,cstr2,sstr2,cstr3,sstr3,cstr4,sstr4;
	double sqk,clpm,slpm;

	double **x = atom->x;
	double *q = atom->q;
	int nlocal = atom->nlocal;

	n = 0;

	// (k,0,0), (0,l,0), (0,0,m)

	for (ic = 0; ic < 3; ic++) {
	sqk = unitk[ic]*unitk[ic];
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	for (i = 0; i < nlocal; i++) {
	cs[0][ic][i] = 1.0;
	sn[0][ic][i] = 0.0;
	cs[1][ic][i] = cos(unitk[ic]*x[i][ic]);
	sn[1][ic][i] = sin(unitk[ic]*x[i][ic]);
	cs[-1][ic][i] = cs[1][ic][i];
	sn[-1][ic][i] = -sn[1][ic][i];
	cstr1 += q[i]*cs[1][ic][i];
	sstr1 += q[i]*sn[1][ic][i];
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	}
	}

	for (m = 2; m <= kmax; m++) {
	for (ic = 0; ic < 3; ic++) {
	sqk = munitk[ic] m*unitk[ic];
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	for (i = 0; i < nlocal; i++) {
	cs[m][ic][i] = cs[m-1][ic][i]*cs[1][ic][i] -
	sn[m-1][ic][i]*sn[1][ic][i];
	sn[m][ic][i] = sn[m-1][ic][i]*cs[1][ic][i] +
	cs[m-1][ic][i]*sn[1][ic][i];
	cs[-m][ic][i] = cs[m][ic][i];
	sn[-m][ic][i] = -sn[m][ic][i];
	cstr1 += q[i]*cs[m][ic][i];
	sstr1 += q[i]*sn[m][ic][i];
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	}
	}
	}

	// 1 = (k,l,0), 2 = (k,-l,0)

	for (k = 1; k <= kmax; k++) {
	for (l = 1; l <= kmax; l++) {
	sqk = (kunitk[0] kunitk[0]) + (lunitk[1] * l*unitk[1]);
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	cstr2 = 0.0;
	sstr2 = 0.0;
	for (i = 0; i < nlocal; i++) {
	cstr1 += q[i](cs[k][0][i]cs[l][1][i] - sn[k][0][i]*sn[l][1][i]);
	sstr1 += q[i](sn[k][0][i]cs[l][1][i] + cs[k][0][i]*sn[l][1][i]);
	cstr2 += q[i](cs[k][0][i]cs[l][1][i] + sn[k][0][i]*sn[l][1][i]);
	sstr2 += q[i](sn[k][0][i]cs[l][1][i] - cs[k][0][i]*sn[l][1][i]);
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	sfacrl[n] = cstr2;
	sfacim[n++] = sstr2;
	}
	}
	}

	// 1 = (0,l,m), 2 = (0,l,-m)

	for (l = 1; l <= kmax; l++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (lunitk[1] lunitk[1]) + (munitk[2] * m*unitk[2]);
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	cstr2 = 0.0;
	sstr2 = 0.0;
	for (i = 0; i < nlocal; i++) {
	cstr1 += q[i](cs[l][1][i]cs[m][2][i] - sn[l][1][i]*sn[m][2][i]);
	sstr1 += q[i](sn[l][1][i]cs[m][2][i] + cs[l][1][i]*sn[m][2][i]);
	cstr2 += q[i](cs[l][1][i]cs[m][2][i] + sn[l][1][i]*sn[m][2][i]);
	sstr2 += q[i](sn[l][1][i]cs[m][2][i] - cs[l][1][i]*sn[m][2][i]);
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	sfacrl[n] = cstr2;
	sfacim[n++] = sstr2;
	}
	}
	}

	// 1 = (k,0,m), 2 = (k,0,-m)

	for (k = 1; k <= kmax; k++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (kunitk[0] kunitk[0]) + (munitk[2] * m*unitk[2]);
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	cstr2 = 0.0;
	sstr2 = 0.0;
	for (i = 0; i < nlocal; i++) {
	cstr1 += q[i](cs[k][0][i]cs[m][2][i] - sn[k][0][i]*sn[m][2][i]);
	sstr1 += q[i](sn[k][0][i]cs[m][2][i] + cs[k][0][i]*sn[m][2][i]);
	cstr2 += q[i](cs[k][0][i]cs[m][2][i] + sn[k][0][i]*sn[m][2][i]);
	sstr2 += q[i](sn[k][0][i]cs[m][2][i] - cs[k][0][i]*sn[m][2][i]);
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	sfacrl[n] = cstr2;
	sfacim[n++] = sstr2;
	}
	}
	}

	// 1 = (k,l,m), 2 = (k,-l,m), 3 = (k,l,-m), 4 = (k,-l,-m)

	for (k = 1; k <= kmax; k++) {
	for (l = 1; l <= kmax; l++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (kunitk[0] kunitk[0]) + (lunitk[1] * l*unitk[1]) +
	(munitk[2] m*unitk[2]);
	if (sqk <= gsqmx) {
	cstr1 = 0.0;
	sstr1 = 0.0;
	cstr2 = 0.0;
	sstr2 = 0.0;
	cstr3 = 0.0;
	sstr3 = 0.0;
	cstr4 = 0.0;
	sstr4 = 0.0;
	for (i = 0; i < nlocal; i++) {
	clpm = cs[l][1][i]cs[m][2][i] - sn[l][1][i]sn[m][2][i];
	slpm = sn[l][1][i]cs[m][2][i] + cs[l][1][i]sn[m][2][i];
	cstr1 += q[i](cs[k][0][i]clpm - sn[k][0][i]*slpm);
	sstr1 += q[i](sn[k][0][i]clpm + cs[k][0][i]*slpm);

	clpm = cs[l][1][i]cs[m][2][i] + sn[l][1][i]sn[m][2][i];
	slpm = -sn[l][1][i]cs[m][2][i] + cs[l][1][i]sn[m][2][i];
	cstr2 += q[i](cs[k][0][i]clpm - sn[k][0][i]*slpm);
	sstr2 += q[i](sn[k][0][i]clpm + cs[k][0][i]*slpm);

	clpm = cs[l][1][i]cs[m][2][i] + sn[l][1][i]sn[m][2][i];
	slpm = sn[l][1][i]cs[m][2][i] - cs[l][1][i]sn[m][2][i];
	cstr3 += q[i](cs[k][0][i]clpm - sn[k][0][i]*slpm);
	sstr3 += q[i](sn[k][0][i]clpm + cs[k][0][i]*slpm);

	clpm = cs[l][1][i]cs[m][2][i] - sn[l][1][i]sn[m][2][i];
	slpm = -sn[l][1][i]cs[m][2][i] - cs[l][1][i]sn[m][2][i];
	cstr4 += q[i](cs[k][0][i]clpm - sn[k][0][i]*slpm);
	sstr4 += q[i](sn[k][0][i]clpm + cs[k][0][i]*slpm);
	}
	sfacrl[n] = cstr1;
	sfacim[n++] = sstr1;
	sfacrl[n] = cstr2;
	sfacim[n++] = sstr2;
	sfacrl[n] = cstr3;
	sfacim[n++] = sstr3;
	sfacrl[n] = cstr4;
	sfacim[n++] = sstr4;
	}
	}
	}
	}
	}

	/* ----------------------------------------------------------------------
	pre-compute coefficients for each Ewald K-vector
	------------------------------------------------------------------------- */

	void Ewald::coeffs()
	{
	int k,l,m;
	double sqk,vterm;

	double unitkx = unitk[0];
	double unitky = unitk[1];
	double unitkz = unitk[2];
	double g_ewald_sq_inv = 1.0 / (g_ewald*g_ewald);
	double preu = 4.0*MY_PI/volume;

	kcount = 0;

	// (k,0,0), (0,l,0), (0,0,m)

	for (m = 1; m <= kmax; m++) {
	sqk = (munitkx) (m*unitkx);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = m;
	kyvecs[kcount] = 0;
	kzvecs[kcount] = 0;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxm*ug[kcount];
	eg[kcount][1] = 0.0;
	eg[kcount][2] = 0.0;
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0 + vterm(unitkxm)(unitkxm);
	vg[kcount][1] = 1.0;
	vg[kcount][2] = 1.0;
	vg[kcount][3] = 0.0;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = 0.0;
	kcount++;
	}
	sqk = (munitky) (m*unitky);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = 0;
	kyvecs[kcount] = m;
	kzvecs[kcount] = 0;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 0.0;
	eg[kcount][1] = 2.0unitkym*ug[kcount];
	eg[kcount][2] = 0.0;
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0;
	vg[kcount][1] = 1.0 + vterm(unitkym)(unitkym);
	vg[kcount][2] = 1.0;
	vg[kcount][3] = 0.0;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = 0.0;
	kcount++;
	}
	sqk = (munitkz) (m*unitkz);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = 0;
	kyvecs[kcount] = 0;
	kzvecs[kcount] = m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 0.0;
	eg[kcount][1] = 0.0;
	eg[kcount][2] = 2.0unitkzm*ug[kcount];
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0;
	vg[kcount][1] = 1.0;
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = 0.0;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = 0.0;
	kcount++;
	}
	}

	// 1 = (k,l,0), 2 = (k,-l,0)

	for (k = 1; k <= kmax; k++) {
	for (l = 1; l <= kmax; l++) {
	sqk = (unitkxk) (unitkxk) + (unitkyl) * (unitky*l);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = k;
	kyvecs[kcount] = l;
	kzvecs[kcount] = 0;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = 2.0unitkyl*ug[kcount];
	eg[kcount][2] = 0.0;
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0;
	vg[kcount][3] = vtermunitkxkunitkyl;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = 0.0;
	kcount++;

	kxvecs[kcount] = k;
	kyvecs[kcount] = -l;
	kzvecs[kcount] = 0;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = -2.0unitkyl*ug[kcount];
	eg[kcount][2] = 0.0;
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0;
	vg[kcount][3] = -vtermunitkxkunitkyl;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = 0.0;
	kcount++;;
	}
	}
	}

	// 1 = (0,l,m), 2 = (0,l,-m)

	for (l = 1; l <= kmax; l++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (unitkyl) (unitkyl) + (unitkzm) * (unitkz*m);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = 0;
	kyvecs[kcount] = l;
	kzvecs[kcount] = m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 0.0;
	eg[kcount][1] = 2.0unitkyl*ug[kcount];
	eg[kcount][2] = 2.0unitkzm*ug[kcount];
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0;
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = 0.0;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = vtermunitkylunitkzm;
	kcount++;

	kxvecs[kcount] = 0;
	kyvecs[kcount] = l;
	kzvecs[kcount] = -m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 0.0;
	eg[kcount][1] = 2.0unitkyl*ug[kcount];
	eg[kcount][2] = -2.0unitkzm*ug[kcount];
	vg[kcount][0] = 1.0;
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = 0.0;
	vg[kcount][4] = 0.0;
	vg[kcount][5] = -vtermunitkylunitkzm;
	kcount++;
	}
	}
	}

	// 1 = (k,0,m), 2 = (k,0,-m)

	for (k = 1; k <= kmax; k++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (unitkxk) (unitkxk) + (unitkzm) * (unitkz*m);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = k;
	kyvecs[kcount] = 0;
	kzvecs[kcount] = m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = 0.0;
	eg[kcount][2] = 2.0unitkzm*ug[kcount];
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0;
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = 0.0;
	vg[kcount][4] = vtermunitkxkunitkzm;
	vg[kcount][5] = 0.0;
	kcount++;

	kxvecs[kcount] = k;
	kyvecs[kcount] = 0;
	kzvecs[kcount] = -m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = 0.0;
	eg[kcount][2] = -2.0unitkzm*ug[kcount];
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0;
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = 0.0;
	vg[kcount][4] = -vtermunitkxkunitkzm;
	vg[kcount][5] = 0.0;
	kcount++;
	}
	}
	}

	// 1 = (k,l,m), 2 = (k,-l,m), 3 = (k,l,-m), 4 = (k,-l,-m)

	for (k = 1; k <= kmax; k++) {
	for (l = 1; l <= kmax; l++) {
	for (m = 1; m <= kmax; m++) {
	sqk = (unitkxk) (unitkxk) + (unitkyl) * (unitky*l) +
	(unitkzm) (unitkz*m);
	if (sqk <= gsqmx) {
	kxvecs[kcount] = k;
	kyvecs[kcount] = l;
	kzvecs[kcount] = m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = 2.0unitkyl*ug[kcount];
	eg[kcount][2] = 2.0unitkzm*ug[kcount];
	vterm = -2.0(1.0/sqk + 0.25g_ewald_sq_inv);
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = vtermunitkxkunitkyl;
	vg[kcount][4] = vtermunitkxkunitkzm;
	vg[kcount][5] = vtermunitkylunitkzm;
	kcount++;

	kxvecs[kcount] = k;
	kyvecs[kcount] = -l;
	kzvecs[kcount] = m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = -2.0unitkyl*ug[kcount];
	eg[kcount][2] = 2.0unitkzm*ug[kcount];
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = -vtermunitkxkunitkyl;
	vg[kcount][4] = vtermunitkxkunitkzm;
	vg[kcount][5] = -vtermunitkylunitkzm;
	kcount++;

	kxvecs[kcount] = k;
	kyvecs[kcount] = l;
	kzvecs[kcount] = -m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = 2.0unitkyl*ug[kcount];
	eg[kcount][2] = -2.0unitkzm*ug[kcount];
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = vtermunitkxkunitkyl;
	vg[kcount][4] = -vtermunitkxkunitkzm;
	vg[kcount][5] = -vtermunitkylunitkzm;
	kcount++;

	kxvecs[kcount] = k;
	kyvecs[kcount] = -l;
	kzvecs[kcount] = -m;
	ug[kcount] = preuexp(-0.25sqk*g_ewald_sq_inv)/sqk;
	eg[kcount][0] = 2.0unitkxk*ug[kcount];
	eg[kcount][1] = -2.0unitkyl*ug[kcount];
	eg[kcount][2] = -2.0unitkzm*ug[kcount];
	vg[kcount][0] = 1.0 + vterm(unitkxk)(unitkxk);
	vg[kcount][1] = 1.0 + vterm(unitkyl)(unitkyl);
	vg[kcount][2] = 1.0 + vterm(unitkzm)(unitkzm);
	vg[kcount][3] = -vtermunitkxkunitkyl;
	vg[kcount][4] = -vtermunitkxkunitkzm;
	vg[kcount][5] = vtermunitkylunitkzm;
	kcount++;;
	}
	}
	}
	}
	}

	/* ----------------------------------------------------------------------
	allocate memory that depends on # of K-vectors
	------------------------------------------------------------------------- */

	void Ewald::allocate()
	{
	kxvecs = new int[kmax3d];
	kyvecs = new int[kmax3d];
	kzvecs = new int[kmax3d];

	ug = new double[kmax3d];
	memory->create(eg,kmax3d,3,"ewald:eg");
	memory->create(vg,kmax3d,6,"ewald:vg");

	sfacrl = new double[kmax3d];
	sfacim = new double[kmax3d];
	sfacrl_all = new double[kmax3d];
	sfacim_all = new double[kmax3d];
	}

	/* ----------------------------------------------------------------------
	deallocate memory that depends on # of K-vectors
	------------------------------------------------------------------------- */

	void Ewald::deallocate()
	{
	delete [] kxvecs;
	delete [] kyvecs;
	delete [] kzvecs;

	delete [] ug;
	memory->destroy(eg);
	memory->destroy(vg);

	delete [] sfacrl;
	delete [] sfacim;
	delete [] sfacrl_all;
	delete [] sfacim_all;
	}

	/* ----------------------------------------------------------------------
	Slab-geometry correction term to dampen inter-slab interactions between
	periodically repeating slabs. Yields good approximation to 2-D Ewald if
	adequate empty space is left between repeating slabs (J. Chem. Phys.
	111, 3155). Slabs defined here to be parallel to the xy plane.
	------------------------------------------------------------------------- */

	void Ewald::slabcorr()
	{
	// compute local contribution to global dipole moment

	double *q = atom->q;
	double **x = atom->x;
	int nlocal = atom->nlocal;

	double dipole = 0.0;
	for (int i = 0; i < nlocal; i++) dipole += q[i]*x[i][2];

	// sum local contributions to get global dipole moment

	double dipole_all;
	MPI_Allreduce(&dipole,&dipole_all,1,MPI_DOUBLE,MPI_SUM,world);

	// compute corrections

	const double e_slabcorr = 2.0MY_PIdipole_all*dipole_all/volume;
	const double qscale = force->qqrd2e * scale;

	if (eflag_global) energy += qscale * e_slabcorr;

	// per-atom energy

	if (eflag_atom) {
	double efact = 2.0MY_PIdipole_all/volume;
	for (int i = 0; i < nlocal; i++) eatom[i] += qscale * q[i]x[i][2]efact;
	}

	// add on force corrections

	double ffact = -4.0MY_PIdipole_all/volume;
	double **f = atom->f;

	for (int i = 0; i < nlocal; i++) f[i][2] += qscale * q[i]*ffact;
	}

	/* ----------------------------------------------------------------------
	memory usage of local arrays
	------------------------------------------------------------------------- */

	double Ewald::memory_usage()
	{
	double bytes = 3 * kmax3d * sizeof(int);
	bytes += (1 + 3 + 6) * kmax3d * sizeof(double);
	bytes += 4 * kmax3d * sizeof(double);
	bytes += nmax3 sizeof(double);
	bytes += 2 * (2kmax+1)3nmax sizeof(double);
	return bytes;
	}

ewald.cppNo OneTemporaryActions

File Metadata

ewald.cppView Options

Event Timeline

ewald.cpp
No OneTemporary
Actions

ewald.cpp
View Options