Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F91408485
pair_buck_coul_cut_kokkos.cpp
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Sun, Nov 10, 20:08
Size
12 KB
Mime Type
text/x-c
Expires
Tue, Nov 12, 20:08 (2 d)
Engine
blob
Format
Raw Data
Handle
22258899
Attached To
rLAMMPS lammps
pair_buck_coul_cut_kokkos.cpp
View Options
/* ----------------------------------------------------------------------
LAMMPS - Large-scale Atomic/Molecular Massively Parallel Simulator
http://lammps.sandia.gov, Sandia National Laboratories
Steve Plimpton, sjplimp@sandia.gov
Copyright (2003) Sandia Corporation. Under the terms of Contract
DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains
certain rights in this software. This software is distributed under
the GNU General Public License.
See the README file in the top-level LAMMPS directory.
------------------------------------------------------------------------- */
/* ----------------------------------------------------------------------
Contributing author: Ray Shan (SNL)
------------------------------------------------------------------------- */
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "pair_buck_coul_cut_kokkos.h"
#include "kokkos.h"
#include "atom_kokkos.h"
#include "comm.h"
#include "force.h"
#include "neighbor.h"
#include "neigh_list.h"
#include "neigh_request.h"
#include "update.h"
#include "integrate.h"
#include "respa.h"
#include "math_const.h"
#include "memory.h"
#include "error.h"
#include "atom_masks.h"
using
namespace
LAMMPS_NS
;
using
namespace
MathConst
;
#define KOKKOS_CUDA_MAX_THREADS 256
#define KOKKOS_CUDA_MIN_BLOCKS 8
/* ---------------------------------------------------------------------- */
template
<
class
DeviceType
>
PairBuckCoulCutKokkos
<
DeviceType
>::
PairBuckCoulCutKokkos
(
LAMMPS
*
lmp
)
:
PairBuckCoulCut
(
lmp
)
{
respa_enable
=
0
;
atomKK
=
(
AtomKokkos
*
)
atom
;
execution_space
=
ExecutionSpaceFromDevice
<
DeviceType
>::
space
;
datamask_read
=
X_MASK
|
F_MASK
|
TYPE_MASK
|
Q_MASK
|
ENERGY_MASK
|
VIRIAL_MASK
;
datamask_modify
=
F_MASK
|
ENERGY_MASK
|
VIRIAL_MASK
;
cutsq
=
NULL
;
cut_ljsq
=
NULL
;
cut_coulsq
=
NULL
;
}
/* ---------------------------------------------------------------------- */
template
<
class
DeviceType
>
PairBuckCoulCutKokkos
<
DeviceType
>::~
PairBuckCoulCutKokkos
()
{
if
(
!
copymode
)
{
memory
->
destroy_kokkos
(
k_eatom
,
eatom
);
memory
->
destroy_kokkos
(
k_vatom
,
vatom
);
k_cutsq
=
DAT
::
tdual_ffloat_2d
();
k_cut_ljsq
=
DAT
::
tdual_ffloat_2d
();
k_cut_coulsq
=
DAT
::
tdual_ffloat_2d
();
memory
->
sfree
(
cutsq
);
memory
->
sfree
(
cut_ljsq
);
memory
->
sfree
(
cut_coulsq
);
eatom
=
NULL
;
vatom
=
NULL
;
cutsq
=
NULL
;
cut_ljsq
=
NULL
;
cut_coulsq
=
NULL
;
}
}
/* ---------------------------------------------------------------------- */
template
<
class
DeviceType
>
void
PairBuckCoulCutKokkos
<
DeviceType
>::
compute
(
int
eflag_in
,
int
vflag_in
)
{
eflag
=
eflag_in
;
vflag
=
vflag_in
;
if
(
neighflag
==
FULL
||
neighflag
==
FULLCLUSTER
)
no_virial_fdotr_compute
=
1
;
if
(
eflag
||
vflag
)
ev_setup
(
eflag
,
vflag
);
else
evflag
=
vflag_fdotr
=
0
;
// reallocate per-atom arrays if necessary
if
(
eflag_atom
)
{
memory
->
destroy_kokkos
(
k_eatom
,
eatom
);
memory
->
create_kokkos
(
k_eatom
,
eatom
,
maxeatom
,
"pair:eatom"
);
d_eatom
=
k_eatom
.
view
<
DeviceType
>
();
}
if
(
vflag_atom
)
{
memory
->
destroy_kokkos
(
k_vatom
,
vatom
);
memory
->
create_kokkos
(
k_vatom
,
vatom
,
maxvatom
,
6
,
"pair:vatom"
);
d_vatom
=
k_vatom
.
view
<
DeviceType
>
();
}
atomKK
->
sync
(
execution_space
,
datamask_read
);
k_cutsq
.
template
sync
<
DeviceType
>
();
k_cut_ljsq
.
template
sync
<
DeviceType
>
();
k_cut_coulsq
.
template
sync
<
DeviceType
>
();
k_params
.
template
sync
<
DeviceType
>
();
if
(
eflag
||
vflag
)
atomKK
->
modified
(
execution_space
,
datamask_modify
);
else
atomKK
->
modified
(
execution_space
,
F_MASK
);
x
=
atomKK
->
k_x
.
view
<
DeviceType
>
();
c_x
=
atomKK
->
k_x
.
view
<
DeviceType
>
();
f
=
atomKK
->
k_f
.
view
<
DeviceType
>
();
q
=
atomKK
->
k_q
.
view
<
DeviceType
>
();
type
=
atomKK
->
k_type
.
view
<
DeviceType
>
();
nlocal
=
atom
->
nlocal
;
nall
=
atom
->
nlocal
+
atom
->
nghost
;
qqrd2e
=
force
->
qqrd2e
;
newton_pair
=
force
->
newton_pair
;
special_lj
[
0
]
=
force
->
special_lj
[
0
];
special_lj
[
1
]
=
force
->
special_lj
[
1
];
special_lj
[
2
]
=
force
->
special_lj
[
2
];
special_lj
[
3
]
=
force
->
special_lj
[
3
];
special_coul
[
0
]
=
force
->
special_coul
[
0
];
special_coul
[
1
]
=
force
->
special_coul
[
1
];
special_coul
[
2
]
=
force
->
special_coul
[
2
];
special_coul
[
3
]
=
force
->
special_coul
[
3
];
// loop over neighbors of my atoms
copymode
=
1
;
EV_FLOAT
ev
=
pair_compute
<
PairBuckCoulCutKokkos
<
DeviceType
>
,
void
>
(
this
,(
NeighListKokkos
<
DeviceType
>*
)
list
);
DeviceType
::
fence
();
if
(
eflag
)
{
eng_vdwl
+=
ev
.
evdwl
;
eng_coul
+=
ev
.
ecoul
;
}
if
(
vflag_global
)
{
virial
[
0
]
+=
ev
.
v
[
0
];
virial
[
1
]
+=
ev
.
v
[
1
];
virial
[
2
]
+=
ev
.
v
[
2
];
virial
[
3
]
+=
ev
.
v
[
3
];
virial
[
4
]
+=
ev
.
v
[
4
];
virial
[
5
]
+=
ev
.
v
[
5
];
}
if
(
vflag_fdotr
)
virial_fdotr_compute
();
if
(
eflag_atom
)
{
k_eatom
.
template
modify
<
DeviceType
>
();
k_eatom
.
template
sync
<
LMPHostType
>
();
}
if
(
vflag_atom
)
{
k_vatom
.
template
modify
<
DeviceType
>
();
k_vatom
.
template
sync
<
LMPHostType
>
();
}
copymode
=
0
;
}
/* ----------------------------------------------------------------------
compute Buckingham pair force between atoms i and j
---------------------------------------------------------------------- */
template
<
class
DeviceType
>
template
<
bool
STACKPARAMS
,
class
Specialisation
>
KOKKOS_INLINE_FUNCTION
F_FLOAT
PairBuckCoulCutKokkos
<
DeviceType
>::
compute_fpair
(
const
F_FLOAT
&
rsq
,
const
int
&
i
,
const
int
&
j
,
const
int
&
itype
,
const
int
&
jtype
)
const
{
const
F_FLOAT
r2inv
=
1.0
/
rsq
;
const
F_FLOAT
r6inv
=
r2inv
*
r2inv
*
r2inv
;
const
F_FLOAT
r
=
sqrt
(
rsq
);
const
F_FLOAT
rexp
=
exp
(
-
r
*
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
rhoinv:
params
(
itype
,
jtype
).
rhoinv
));
const
F_FLOAT
forcebuck
=
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
buck1:
params
(
itype
,
jtype
).
buck1
)
*
r
*
rexp
-
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
buck2:
params
(
itype
,
jtype
).
buck2
)
*
r6inv
;
return
forcebuck
*
r2inv
;
}
/* ----------------------------------------------------------------------
compute Buckingham pair potential energy between atoms i and j
---------------------------------------------------------------------- */
template
<
class
DeviceType
>
template
<
bool
STACKPARAMS
,
class
Specialisation
>
KOKKOS_INLINE_FUNCTION
F_FLOAT
PairBuckCoulCutKokkos
<
DeviceType
>::
compute_evdwl
(
const
F_FLOAT
&
rsq
,
const
int
&
i
,
const
int
&
j
,
const
int
&
itype
,
const
int
&
jtype
)
const
{
const
F_FLOAT
r2inv
=
1.0
/
rsq
;
const
F_FLOAT
r6inv
=
r2inv
*
r2inv
*
r2inv
;
const
F_FLOAT
r
=
sqrt
(
rsq
);
const
F_FLOAT
rexp
=
exp
(
-
r
*
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
rhoinv:
params
(
itype
,
jtype
).
rhoinv
));
return
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
a:
params
(
itype
,
jtype
).
a
)
*
rexp
-
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
c:
params
(
itype
,
jtype
).
c
)
*
r6inv
-
(
STACKPARAMS
?
m_params
[
itype
][
jtype
].
offset:
params
(
itype
,
jtype
).
offset
);
}
/* ----------------------------------------------------------------------
compute coulomb pair force between atoms i and j
---------------------------------------------------------------------- */
template
<
class
DeviceType
>
template
<
bool
STACKPARAMS
,
class
Specialisation
>
KOKKOS_INLINE_FUNCTION
F_FLOAT
PairBuckCoulCutKokkos
<
DeviceType
>::
compute_fcoul
(
const
F_FLOAT
&
rsq
,
const
int
&
i
,
const
int
&
j
,
const
int
&
itype
,
const
int
&
jtype
,
const
F_FLOAT
&
factor_coul
,
const
F_FLOAT
&
qtmp
)
const
{
const
F_FLOAT
r2inv
=
1.0
/
rsq
;
const
F_FLOAT
rinv
=
sqrt
(
r2inv
);
F_FLOAT
forcecoul
;
forcecoul
=
qqrd2e
*
qtmp
*
q
(
j
)
*
rinv
;
return
factor_coul
*
forcecoul
*
r2inv
;
}
/* ----------------------------------------------------------------------
compute coulomb pair potential energy between atoms i and j
---------------------------------------------------------------------- */
template
<
class
DeviceType
>
template
<
bool
STACKPARAMS
,
class
Specialisation
>
KOKKOS_INLINE_FUNCTION
F_FLOAT
PairBuckCoulCutKokkos
<
DeviceType
>::
compute_ecoul
(
const
F_FLOAT
&
rsq
,
const
int
&
i
,
const
int
&
j
,
const
int
&
itype
,
const
int
&
jtype
,
const
F_FLOAT
&
factor_coul
,
const
F_FLOAT
&
qtmp
)
const
{
const
F_FLOAT
r2inv
=
1.0
/
rsq
;
const
F_FLOAT
rinv
=
sqrt
(
r2inv
);
return
factor_coul
*
qqrd2e
*
qtmp
*
q
(
j
)
*
rinv
;
}
/* ----------------------------------------------------------------------
allocate all arrays
------------------------------------------------------------------------- */
template
<
class
DeviceType
>
void
PairBuckCoulCutKokkos
<
DeviceType
>::
allocate
()
{
PairBuckCoulCut
::
allocate
();
int
n
=
atom
->
ntypes
;
memory
->
destroy
(
cutsq
);
memory
->
create_kokkos
(
k_cutsq
,
cutsq
,
n
+
1
,
n
+
1
,
"pair:cutsq"
);
d_cutsq
=
k_cutsq
.
template
view
<
DeviceType
>
();
memory
->
destroy
(
cut_ljsq
);
memory
->
create_kokkos
(
k_cut_ljsq
,
cut_ljsq
,
n
+
1
,
n
+
1
,
"pair:cut_ljsq"
);
d_cut_ljsq
=
k_cut_ljsq
.
template
view
<
DeviceType
>
();
memory
->
destroy
(
cut_coulsq
);
memory
->
create_kokkos
(
k_cut_coulsq
,
cut_coulsq
,
n
+
1
,
n
+
1
,
"pair:cut_coulsq"
);
d_cut_coulsq
=
k_cut_coulsq
.
template
view
<
DeviceType
>
();
k_params
=
Kokkos
::
DualView
<
params_buck_coul
**
,
Kokkos
::
LayoutRight
,
DeviceType
>
(
"PairBuckCoulCut::params"
,
n
+
1
,
n
+
1
);
params
=
k_params
.
d_view
;
}
/* ----------------------------------------------------------------------
global settings
------------------------------------------------------------------------- */
template
<
class
DeviceType
>
void
PairBuckCoulCutKokkos
<
DeviceType
>::
settings
(
int
narg
,
char
**
arg
)
{
if
(
narg
>
2
)
error
->
all
(
FLERR
,
"Illegal pair_style command"
);
PairBuckCoulCut
::
settings
(
1
,
arg
);
}
/* ----------------------------------------------------------------------
init specific to this pair style
------------------------------------------------------------------------- */
template
<
class
DeviceType
>
void
PairBuckCoulCutKokkos
<
DeviceType
>::
init_style
()
{
PairBuckCoulCut
::
init_style
();
// error if rRESPA with inner levels
if
(
update
->
whichflag
==
1
&&
strstr
(
update
->
integrate_style
,
"respa"
))
{
int
respa
=
0
;
if
(((
Respa
*
)
update
->
integrate
)
->
level_inner
>=
0
)
respa
=
1
;
if
(((
Respa
*
)
update
->
integrate
)
->
level_middle
>=
0
)
respa
=
2
;
if
(
respa
)
error
->
all
(
FLERR
,
"Cannot use Kokkos pair style with rRESPA inner/middle"
);
}
// irequest = neigh request made by parent class
neighflag
=
lmp
->
kokkos
->
neighflag
;
int
irequest
=
neighbor
->
nrequest
-
1
;
neighbor
->
requests
[
irequest
]
->
kokkos_host
=
Kokkos
::
Impl
::
is_same
<
DeviceType
,
LMPHostType
>::
value
&&
!
Kokkos
::
Impl
::
is_same
<
DeviceType
,
LMPDeviceType
>::
value
;
neighbor
->
requests
[
irequest
]
->
kokkos_device
=
Kokkos
::
Impl
::
is_same
<
DeviceType
,
LMPDeviceType
>::
value
;
if
(
neighflag
==
FULL
)
{
neighbor
->
requests
[
irequest
]
->
full
=
1
;
neighbor
->
requests
[
irequest
]
->
half
=
0
;
neighbor
->
requests
[
irequest
]
->
full_cluster
=
0
;
}
else
if
(
neighflag
==
HALF
||
neighflag
==
HALFTHREAD
)
{
neighbor
->
requests
[
irequest
]
->
full
=
0
;
neighbor
->
requests
[
irequest
]
->
half
=
1
;
neighbor
->
requests
[
irequest
]
->
full_cluster
=
0
;
}
else
if
(
neighflag
==
N2
)
{
neighbor
->
requests
[
irequest
]
->
full_cluster
=
0
;
neighbor
->
requests
[
irequest
]
->
full
=
0
;
neighbor
->
requests
[
irequest
]
->
half
=
0
;
}
else
if
(
neighflag
==
FULLCLUSTER
)
{
neighbor
->
requests
[
irequest
]
->
full
=
1
;
neighbor
->
requests
[
irequest
]
->
half
=
0
;
neighbor
->
requests
[
irequest
]
->
full_cluster
=
1
;
}
else
{
error
->
all
(
FLERR
,
"Cannot use chosen neighbor list style with buck/coul/cut/kk"
);
}
}
/* ----------------------------------------------------------------------
init for one type pair i,j and corresponding j,i
------------------------------------------------------------------------- */
template
<
class
DeviceType
>
double
PairBuckCoulCutKokkos
<
DeviceType
>::
init_one
(
int
i
,
int
j
)
{
double
cutone
=
PairBuckCoulCut
::
init_one
(
i
,
j
);
double
cut_ljsqm
=
cut_ljsq
[
i
][
j
];
double
cut_coulsqm
=
cut_coulsq
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
a
=
a
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
c
=
c
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
rhoinv
=
rhoinv
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
buck1
=
buck1
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
buck2
=
buck2
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
offset
=
offset
[
i
][
j
];
k_params
.
h_view
(
i
,
j
).
cut_ljsq
=
cut_ljsqm
;
k_params
.
h_view
(
i
,
j
).
cut_coulsq
=
cut_coulsqm
;
k_params
.
h_view
(
j
,
i
)
=
k_params
.
h_view
(
i
,
j
);
if
(
i
<
MAX_TYPES_STACKPARAMS
+
1
&&
j
<
MAX_TYPES_STACKPARAMS
+
1
)
{
m_params
[
i
][
j
]
=
m_params
[
j
][
i
]
=
k_params
.
h_view
(
i
,
j
);
m_cutsq
[
j
][
i
]
=
m_cutsq
[
i
][
j
]
=
cutone
*
cutone
;
m_cut_ljsq
[
j
][
i
]
=
m_cut_ljsq
[
i
][
j
]
=
cut_ljsqm
;
m_cut_coulsq
[
j
][
i
]
=
m_cut_coulsq
[
i
][
j
]
=
cut_coulsqm
;
}
k_cutsq
.
h_view
(
i
,
j
)
=
cutone
*
cutone
;
k_cutsq
.
template
modify
<
LMPHostType
>
();
k_cut_ljsq
.
h_view
(
i
,
j
)
=
cut_ljsqm
;
k_cut_ljsq
.
template
modify
<
LMPHostType
>
();
k_cut_coulsq
.
h_view
(
i
,
j
)
=
cut_coulsqm
;
k_cut_coulsq
.
template
modify
<
LMPHostType
>
();
k_params
.
template
modify
<
LMPHostType
>
();
return
cutone
;
}
template
class
PairBuckCoulCutKokkos
<
LMPDeviceType
>
;
#ifdef KOKKOS_HAVE_CUDA
template
class
PairBuckCoulCutKokkos
<
LMPHostType
>
;
#endif
Event Timeline
Log In to Comment