LAMMPS 23Jun22 with GPU support (Intel MPI)
ウェブページ
バージョン
23Jun22 Update 2
ビルド環境
- GCC 11.2.1 (gcc-toolset-11)
- Intel MKL 2023.1.0
- Intel MPI 2021.9.0
- CUDA 11.6
ビルドに必要なファイル
- lammps-stable.tar.gz
- (一部ファイルは以下スクリプト中で取得)
ビルド手順
#!/bin/sh
VERSION=23Jun22
NAME=lammps-23Jun2022
INSTALL_PREFIX=/apl/lammps/2022-Jun23-impi-CUDA
BASEDIR=/home/users/${USER}/Software/LAMMPS/${VERSION}
LAMMPS_TARBALL=${BASEDIR}/lammps-stable.tar.gz
WORKDIR=/gwork/users/${USER}/lammps-23Sep2022-cuda
LAMMPS_WORKDIR=${WORKDIR}/${NAME}
GPU_ARCH=sm_80
VMD_MOLFILE_INC=/home/users/${USER}/Software/VMD/1.9.4/vmd-1.9.4a57/plugins/include
PARALLEL=12
#------------------------------------------------------------------
umask 0022
export LANG=C
ulimit -s unlimited
module -s purge
module -s load gcc-toolset/11
module -s load intelmpi/2021.9.0
module -s load mkl/2023.1.0
module -s load cuda/11.6
export CC=mpicc
export CXX=mpicxx
export FC=mpif90
export MPICC=mpicc
export MPICXX=mpicxx
export MPIFC=mpif90
PYTHONEXE=/usr/bin/python3.6m
PYTHONINC=/usr/include/python3.6m
cd ${WORKDIR}
if [ -d ${NAME} ]; then
mv ${NAME} lammps_erase
rm -rf lammps_erase &
fi
tar zxf ${LAMMPS_TARBALL}
cd ${NAME}
mkdir build && cd build
# Disabled PKGs:
# FFMPEG, ADIOS, MDI, VTK: noavail
# MSCG: gsl too old
# MESSAGE: ZeroMQ support not enabled
# QUIP: failed to build
# ML-HDNNP: failed to build
# MK-IAP: failed to build
# KIM: CDDL is imcompatible with GPL
# LATTE: technical problem of cmake? (LAPACK and BLAS)
# MPIIO: not maintained?
cmake ../cmake \
-DLAMMPS_MACHINE=rccs-cuda \
-DENABLE_TESTING=on \
-DCMAKE_INSTALL_PREFIX=${INSTALL_PREFIX} \
-DCMAKE_C_COMPILER=mpicc \
-DCMAKE_CXX_COMPILER=mpicxx \
-DCMAKE_Fortran_COMPILER=mpif90 \
-DCMAKE_MPI_C_COMPILER=mpicc \
-DCMAKE_MPI_CXX_COMPILER=mpicxx \
-DCMAKE_MPI_Fortran_COMPILER=mpif90 \
-DPython_EXECUTABLE=${PYTHONEXE} \
-DPython_INCLUDE_DIR=${PYTHONINC} \
-DLAMMPS_EXCEPTIONS=on \
-DBUILD_SHARED_LIBS=on \
-DBUILD_TOOLS=on \
-DBUILD_MPI=on \
-DBUILD_OMP=on \
-DFFT=MKL \
-DFFT_SINGLE=on \
-DFFT_MKL_THREADS=on \
-DWITH_JPEG=yes \
-DWITH_PNG=yes \
-DWITH_GZIP=yes \
-DPKG_ASPHERE=on \
-DPKG_ATC=on \
-DPKG_AWPMD=on \
-DPKG_BOCS=on \
-DPKG_BODY=on \
-DPKG_BROWNIAN=on \
-DPKG_CG-DNA=on \
-DPKG_CG-SDK=on \
-DPKG_CLASS2=on \
-DPKG_COLLOID=on \
-DPKG_COLVARS=on \
-DPKG_COMPRESS=on \
-DPKG_CORESHELL=on \
-DPKG_DIELECTRIC=on \
-DPKG_DIFFRACTION=on \
-DPKG_DIPOLE=on \
-DPKG_DPD-BASIC=on \
-DPKG_DPD-MESO=on \
-DPKG_DPD-REACT=on \
-DPKG_DPD-SMOOTH=on \
-DPKG_DRUDE=on \
-DPKG_EFF=on \
-DPKG_EXTRA-COMPUTE=on \
-DPKG_EXTRA-DUMP=on \
-DPKG_EXTRA-FIX=on \
-DPKG_EXTRA-MOLECULE=on \
-DPKG_EXTRA-PAIR=on \
-DPKG_FEP=on \
-DPKG_GPU=on \
-DGPU_API=cuda \
-DGPU_ARCH=${GPU_ARCH} \
-DPKG_GRANULAR=on \
-DPKG_H5MD=on \
-DPKG_INTEL=on \
-DPKG_INTERLAYER=on \
-DPKG_KIM=off \
-DDOWNLOAD_KIM=no \
-DPKG_KOKKOS=on \
-DKokkos_ARCH_ZEN3=yes \
-DKokkos_ENABLE_OPENMP=yes \
-DPKG_KSPACE=on \
-DPKG_LATBOLTZ=on \
-DPKG_MACHDYN=on \
-DDOWNLOAD_EIGEN3=on \
-DPKG_MANIFOLD=on \
-DPKG_MANYBODY=on \
-DPKG_MC=on \
-DPKG_MDI=off \
-DPKG_MEAM=on \
-DPKG_MESONT=on \
-DPKG_MESSAGE=on \
-DPKG_MGPT=on \
-DPKG_MISC=on \
-DPKG_ML-HDNNP=off \
-DDOWNLOAD_N2P2=no \
-DPKG_ML-IAP=off \
-DPKG_ML-PACE=on \
-DPKG_ML-QUIP=off \
-DDOWNLOAD_QUIP=no \
-DPKG_ML-RANN=on \
-DPKG_ML-SNAP=on \
-DPKG_MOFFF=on \
-DPKG_MOLECULE=on \
-DPKG_MOLFILE=on \
-DMOLFILE_INCLUDE_DIR=${VMD_MOLFILE_INC} \
-DPKG_MPIIO=off \
-DPKG_MSCG=off \
-DPKG_NETCDF=on \
-DPKG_OPENMP=on \
-DPKG_OPT=on \
-DPKG_ORIENT=on \
-DPKG_PERI=on \
-DPKG_PHONON=on \
-DPKG_PLUGIN=on \
-DPKG_PLUMED=on \
-DDOWNLOAD_PLUMED=yes \
-DPKG_POEMS=on \
-DPKG_PTM=on \
-DPKG_PYTHON=on \
-DPKG_QEQ=on \
-DPKG_QMMM=on \
-DPKG_QTB=on \
-DPKG_REACTION=on \
-DPKG_REAXFF=on \
-DPKG_REPLICA=on \
-DPKG_RIGID=on \
-DPKG_SCAFACOS=on \
-DDOWNLOAD_SCAFACOS=yes \
-DPKG_SHOCK=on \
-DPKG_SMTBQ=on \
-DPKG_SPH=on \
-DPKG_SPIN=on \
-DPKG_SRD=on \
-DPKG_TALLY=on \
-DPKG_UEF=on \
-DPKG_VORONOI=on \
-DDOWNLOAD_VORO=yes \
-DPKG_VTK=off \
-DPKG_YAFF=on \
-DBLAS_LIBRARIES="-Wl,--no-as-needed -lmkl_intel_lp64 -lmkl_gnu_thread -lmkl_core -lgomp -lpthread -lm -ldl" \
-DCMAKE_BUILD_TYPE=Release
make VERBOSE=1 -j ${PARALLEL}
make install
cp -a ../examples ${INSTALL_PREFIX}
cd ${INSTALL_PREFIX}
for f in etc/profile.d/*; do
ln -s $f .
done
cd lib64
if [ -f liblammps_rccs-cuda.so ]; then
ln -s liblammps_rccs-cuda.so liblammps.so
fi
if [ -f liblammps_rccs-cuda.so.0 ]; then
ln -s liblammps_rccs-cuda.so.0 liblammps.so.0
fi
テスト
以下のジョブで実行#!/bin/sh
#PBS -l select=1:ncpus=16:mpiprocs=8:ompthreads=2:ngpus=2
#PBS -l walltime=24:00:00
NAME=lammps-23Jun2022
WORKDIR=/gwork/users/${USER}/lammps-23Sep2022-cuda
LAMMPS_WORKDIR=${WORKDIR}/${NAME}
#------------------------------------------------------------------
umask 0022
export LANG=C
ulimit -s unlimited
module -s purge
module -s load gcc-toolset/11
module -s load intelmpi/2021.9.0
module -s load mkl/2023.1.0
module -s load cuda/11.6
export CC=mpicc
export CXX=mpicxx
export FC=mpif90
export MPICC=mpicc
export MPICXX=mpicxx
export MPIFC=mpif90
cd ${LAMMPS_WORKDIR}
cd build
make test # may errors will occur...
テスト結果
失敗したテストのリストThe following tests FAILED:
35 - SimpleCommands (SEGFAULT)
43 - ComputeGlobal (Failed)
68 - MolPairStyle:beck (SEGFAULT)
69 - MolPairStyle:born (SEGFAULT)
74 - MolPairStyle:born_coul_table_cs (SEGFAULT)
76 - MolPairStyle:born_coul_wolf_cs (SEGFAULT)
77 - MolPairStyle:buck (SEGFAULT)
78 - MolPairStyle:buck_coul_cut (SEGFAULT)
79 - MolPairStyle:buck_coul_long (SEGFAULT)
81 - MolPairStyle:buck_coul_table (SEGFAULT)
84 - MolPairStyle:buck_long_coul_off (SEGFAULT)
86 - MolPairStyle:buck_mdf (SEGFAULT)
88 - MolPairStyle:buck_table_coul_off (SEGFAULT)
89 - MolPairStyle:buck_table_coul_table (SEGFAULT)
95 - MolPairStyle:coul_diel (SEGFAULT)
96 - MolPairStyle:coul_dsf (SEGFAULT)
99 - MolPairStyle:coul_long_cs (SEGFAULT)
100 - MolPairStyle:coul_long_soft (SEGFAULT)
103 - MolPairStyle:coul_slater_long (Failed)
105 - MolPairStyle:coul_streitz_wolf (SEGFAULT)
106 - MolPairStyle:coul_table (SEGFAULT)
119 - MolPairStyle:hybrid_multiple (SEGFAULT)
122 - MolPairStyle:lj_charmm_coul_charmm (SEGFAULT)
124 - MolPairStyle:lj_charmm_coul_long (SEGFAULT)
125 - MolPairStyle:lj_charmm_coul_long_soft (SEGFAULT)
126 - MolPairStyle:lj_charmm_coul_table (SEGFAULT)
127 - MolPairStyle:lj_charmmfsw_coul_charmmfsw (SEGFAULT)
135 - MolPairStyle:lj_class2_coul_long_soft (SEGFAULT)
136 - MolPairStyle:lj_class2_coul_table (SEGFAULT)
139 - MolPairStyle:lj_cubic (SEGFAULT)
140 - MolPairStyle:lj_cut (SEGFAULT)
142 - MolPairStyle:lj_cut_coul_cut_soft (SEGFAULT)
145 - MolPairStyle:lj_cut_coul_long (SEGFAULT)
147 - MolPairStyle:lj_cut_coul_long_soft (SEGFAULT)
148 - MolPairStyle:lj_cut_coul_table (SEGFAULT)
150 - MolPairStyle:lj_cut_coul_wolf (SEGFAULT)
153 - MolPairStyle:lj_cut_soft (SEGFAULT)
154 - MolPairStyle:lj_cut_tip4p_cut (SEGFAULT)
157 - MolPairStyle:lj_cut_tip4p_table (SEGFAULT)
166 - MolPairStyle:lj_long_cut_dipole_long (SEGFAULT)
167 - MolPairStyle:lj_long_cut_tip4p_long (SEGFAULT)
168 - MolPairStyle:lj_long_dipole_long (SEGFAULT)
170 - MolPairStyle:lj_mdf (SEGFAULT)
173 - MolPairStyle:lj_sdk_coul_table (SEGFAULT)
175 - MolPairStyle:lj_smooth (SEGFAULT)
181 - MolPairStyle:lj_table_coul_table (SEGFAULT)
182 - MolPairStyle:lj_table_tip4p_long (SEGFAULT)
183 - MolPairStyle:lj_table_tip4p_table (SEGFAULT)
184 - MolPairStyle:mie_cut (SEGFAULT)
185 - MolPairStyle:mm3_switch3_coulgauss_long (SEGFAULT)
187 - MolPairStyle:morse (SEGFAULT)
190 - MolPairStyle:nm_cut (SEGFAULT)
191 - MolPairStyle:nm_cut_coul_cut (SEGFAULT)
192 - MolPairStyle:nm_cut_coul_long (SEGFAULT)
193 - MolPairStyle:nm_cut_coul_table (SEGFAULT)
197 - MolPairStyle:soft (SEGFAULT)
204 - MolPairStyle:wf_cut (SEGFAULT)
206 - MolPairStyle:zbl (SEGFAULT)
211 - AtomicPairStyle:born (SEGFAULT)
212 - AtomicPairStyle:buck_coul_cut_qeq_point (Failed)
213 - AtomicPairStyle:buck_coul_cut_qeq_shielded (Failed)
214 - AtomicPairStyle:colloid (SEGFAULT)
216 - AtomicPairStyle:colloid_multi_tri (SEGFAULT)
218 - AtomicPairStyle:colloid_tiled_tri (SEGFAULT)
225 - AtomicPairStyle:eam_fs (SEGFAULT)
227 - AtomicPairStyle:eam_he (SEGFAULT)
228 - AtomicPairStyle:eam_he_real (SEGFAULT)
230 - AtomicPairStyle:edip (SEGFAULT)
231 - AtomicPairStyle:eim (SEGFAULT)
232 - AtomicPairStyle:gauss (SEGFAULT)
233 - AtomicPairStyle:hybrid-eam (SEGFAULT)
234 - AtomicPairStyle:hybrid-eam_fs (SEGFAULT)
235 - AtomicPairStyle:kim_lj (SEGFAULT)
237 - AtomicPairStyle:meam (SEGFAULT)
238 - AtomicPairStyle:meam_spline (Failed)
239 - AtomicPairStyle:meam_sw_spline (SEGFAULT)
242 - AtomicPairStyle:reaxff-acks2 (SEGFAULT)
243 - AtomicPairStyle:reaxff-acks2_efield (Failed)
244 - AtomicPairStyle:reaxff (Failed)
245 - AtomicPairStyle:reaxff_lgvdw (Failed)
246 - AtomicPairStyle:reaxff_noqeq (Failed)
247 - AtomicPairStyle:reaxff_tabulate (Failed)
248 - AtomicPairStyle:reaxff_tabulate_flag (Failed)
254 - AtomicPairStyle:table_linear (SEGFAULT)
260 - ManybodyPairStyle:airebo_00 (SEGFAULT)
266 - ManybodyPairStyle:comb3 (SEGFAULT)
268 - ManybodyPairStyle:drip_real (SEGFAULT)
273 - ManybodyPairStyle:ilp-graphene-hbn (Failed)
274 - ManybodyPairStyle:ilp-graphene-hbn_notaper (SEGFAULT)
275 - ManybodyPairStyle:kolmogorov_crespi_full (SEGFAULT)
279 - ManybodyPairStyle:lebedeva_z (SEGFAULT)
281 - ManybodyPairStyle:mliap_nn (SEGFAULT)
288 - ManybodyPairStyle:pace_recursive (SEGFAULT)
289 - ManybodyPairStyle:polymorphic_sw (SEGFAULT)
290 - ManybodyPairStyle:polymorphic_tersoff (SEGFAULT)
291 - ManybodyPairStyle:quip-sw (SEGFAULT)
297 - ManybodyPairStyle:sw-mod-multi (SEGFAULT)
298 - ManybodyPairStyle:sw-multi (SEGFAULT)
301 - ManybodyPairStyle:tersoff_mod (SEGFAULT)
306 - ManybodyPairStyle:tersoff_table (SEGFAULT)
309 - ManybodyPairStyle:vashishta (SEGFAULT)
310 - ManybodyPairStyle:vashishta_table (SEGFAULT)
349 - KSpaceStyle:ewald (SEGFAULT)
350 - KSpaceStyle:ewald_conp_charge (SEGFAULT)
352 - KSpaceStyle:ewald_disp (SEGFAULT)
356 - KSpaceStyle:ewald_slab (SEGFAULT)
357 - KSpaceStyle:ewald_tilted (SEGFAULT)
360 - KSpaceStyle:pppm_ad (SEGFAULT)
361 - KSpaceStyle:pppm_cg (SEGFAULT)
362 - KSpaceStyle:pppm_cg_ad (Failed)
363 - KSpaceStyle:pppm_cg_tiled (Failed)
365 - KSpaceStyle:pppm_dipole (SEGFAULT)
370 - KSpaceStyle:pppm_disp_tip4p (Failed)
372 - KSpaceStyle:pppm_nozforce (SEGFAULT)
373 - KSpaceStyle:pppm_slab (SEGFAULT)
374 - KSpaceStyle:pppm_stagger (SEGFAULT)
375 - KSpaceStyle:pppm_stagger_tiled (SEGFAULT)
378 - KSpaceStyle:pppm_tip4p (SEGFAULT)
379 - KSpaceStyle:pppm_tip4p_ad (SEGFAULT)
381 - KSpaceStyle:pppm_tip4p_slab (SEGFAULT)
383 - KSpaceStyle:scafacos_direct (Failed)
384 - KSpaceStyle:scafacos_ewald (Failed)
385 - KSpaceStyle:scafacos_fmm (Failed)
386 - KSpaceStyle:scafacos_fmm_tuned (Failed)
387 - KSpaceStyle:scafacos_p2nfft (Failed)
388 - FixTimestep:adapt_coul (Failed)
393 - FixTimestep:addtorque_const (Failed)
459 - FixTimestep:spring_rg (Failed)
466 - FixTimestep:wall_harmonic_const (Failed)
482 - DihedralStyle:quadratic (Failed)
484 - DihedralStyle:table_cut_linear (Failed)
486 - DihedralStyle:table_linear (Failed)
487 - DihedralStyle:table_spline (Failed)
メモ
- CPU版の情報も参照ください。
- GPU 版でインテルコンパイラを使うと LJ 系で明確なスローダウンを確認。GCC+OpenMPIでも同様の問題有り。GCC+IntelMPI の組み合わせではなぜか問題無し。