diff --git a/doc/src/compute_sna_atom.txt b/doc/src/compute_sna_atom.txt index 1c3787e696638191373d0b563f461c37d42dddad..268e23ac2808d82f8750b95bd652cd4d50f6b9d2 100644 --- a/doc/src/compute_sna_atom.txt +++ b/doc/src/compute_sna_atom.txt @@ -161,9 +161,9 @@ function. The keyword {bzeroflag} determines whether or not {B0}, the bispectrum components of an atom with no neighbors, are subtracted from -the calculated bispectrum components. This optional keyword is only -available for compute {sna/atom}, as {snad/atom} and {snav/atom} -are unaffected by the removal of constant terms. +the calculated bispectrum components. This optional keyword +normally only affects compute {sna/atom}. However, when +{quadraticflag} is on, it also affects {snad/atom} and {snav/atom}. The keyword {quadraticflag} determines whether or not the quadratic analogs to the bispectrum quantities are generated. @@ -230,13 +230,18 @@ are 30, 90, and 180, respectively. With {quadratic} value=1, the numbers of columns are 930, 2790, and 5580, respectively. If the {quadratic} keyword value is set to 1, then additional -columns are appended to each per-atom array, corresponding to +columns are generated, corresponding to the products of all distinct pairs of bispectrum components. If the number of bispectrum components is {K}, then the number of distinct pairs -is {K}({K}+1)/2. These are output in subblocks of {K}({K}+1)/2 columns, using the same -ordering of sub-blocks as was used for the bispectrum -components. Within each sub-block, the ordering is upper-triangular, -(1,1),(1,2)...(1,{K}),(2,1)...({K}-1,{K}-1),({K}-1,{K}),({K},{K}) +is {K}({K}+1)/2. +For compute {sna/atom} these columns are appended to existing {K} columns. +The ordering of quadratic terms is upper-triangular, +(1,1),(1,2)...(1,{K}),(2,1)...({K}-1,{K}-1),({K}-1,{K}),({K},{K}). +For computes {snad/atom} and {snav/atom} each set of {K}({K}+1)/2 +additional columns is inserted directly after each of sub-block +of linear terms i.e. linear and quadratic terms are contiguous. +So the nesting order from inside to outside is bispectrum component, +linear then quadratic, vector/tensor component, type. These values can be accessed by any command that uses per-atom values from a compute as input. See "Section diff --git a/examples/snap/log.20Apr18.snap.Mo_Chen.g++.1 b/examples/snap/log.20Apr18.snap.Mo_Chen.g++.1 new file mode 100644 index 0000000000000000000000000000000000000000..c5e0f6abab7b7eb657e529096265fa9d3a9bfcff --- /dev/null +++ b/examples/snap/log.20Apr18.snap.Mo_Chen.g++.1 @@ -0,0 +1,127 @@ +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task +# Demonstrate SNAP Ta potential + +# Initialize simulation + +variable nsteps index 100 +variable nrep equal 4 +variable a equal 3.160 +units metal + +# generate the box and atom positions using a BCC lattice + +variable nx equal ${nrep} +variable nx equal 4 +variable ny equal ${nrep} +variable ny equal 4 +variable nz equal ${nrep} +variable nz equal 4 + +boundary p p p + +lattice bcc $a +lattice bcc 3.16 +Lattice spacing in x,y,z = 3.16 3.16 3.16 +region box block 0 ${nx} 0 ${ny} 0 ${nz} +region box block 0 4 0 ${ny} 0 ${nz} +region box block 0 4 0 4 0 ${nz} +region box block 0 4 0 4 0 4 +create_box 1 box +Created orthogonal box = (0 0 0) to (12.64 12.64 12.64) + 1 by 1 by 1 MPI processor grid +create_atoms 1 box +Created 128 atoms + Time spent = 0.000223637 secs + +mass 1 183.84 + +# choose potential + +include Mo_Chen_PRM2017.snap + +# DATE: 2017-09-18 CONTRIBUTOR: Chi Chen <chc273@eng.ucsd.edu> CITATION: C. Chen, Z. Deng, R. Tran, H. Tang, I.-H. Chu, S. P. Ong, "Accurate force field for molybdenum by machine learning large materials data" Physical Review Materials 1, 04 3603 (2017) +# Generated by Materials Virtual Lab +# Definition of SNAP potential. +pair_style snap +pair_coeff * * Mo_Chen_PRM2017.snapcoeff Mo Mo_Chen_PRM2017.snapparam Mo +Reading potential file Mo_Chen_PRM2017.snapcoeff with DATE: 2017-09-18 +SNAP Element = Mo, Radius 0.5, Weight 1 +Reading potential file Mo_Chen_PRM2017.snapparam with DATE: 2017-09-18 +SNAP keyword rcutfac 4.615858 +SNAP keyword twojmax 6 + + +# Setup output + +thermo 10 +thermo_modify norm yes + +# Set up NVE run + +timestep 0.5e-3 +neighbor 1.0 bin +neigh_modify once no every 1 delay 0 check yes + +# Run MD + +velocity all create 300.0 4928459 +fix 1 all nve +run ${nsteps} +run 100 +Neighbor list info ... + update every 1 steps, delay 0 steps, check yes + max neighbors/atom: 2000, page size: 100000 + master list distance cutoff = 5.61586 + ghost atom cutoff = 5.61586 + binsize = 2.80793, bins = 5 5 5 + 1 neighbor lists, perpetual/occasional/extra = 1 0 0 + (1) pair snap, perpetual + attributes: full, newton on + pair build: full/bin/atomonly + stencil: full/bin/3d + bin: standard +Per MPI rank memory allocation (min/avg/max) = 3.507 | 3.507 | 3.507 Mbytes +Step Temp E_pair E_mol TotEng Press + 0 300 -22.405975 0 -22.3675 2575.7657 + 10 294.77555 -22.405305 0 -22.3675 2756.6894 + 20 279.53011 -22.40335 0 -22.3675 3285.8272 + 30 255.52174 -22.40027 0 -22.3675 4122.8933 + 40 224.7299 -22.396321 0 -22.367499 5204.3499 + 50 189.67529 -22.391825 0 -22.367499 6449.1308 + 60 153.18862 -22.387145 0 -22.367499 7765.911 + 70 118.14998 -22.382652 0 -22.367499 9061.1616 + 80 87.224916 -22.378685 0 -22.367499 10247.68 + 90 62.623892 -22.37553 0 -22.367498 11250.067 + 100 45.9103 -22.373386 0 -22.367498 12011.726 +Loop time of 3.3917 on 1 procs for 100 steps with 128 atoms + +Performance: 1.274 ns/day, 18.843 hours/ns, 29.484 timesteps/s +99.7% CPU use with 1 MPI tasks x 1 OpenMP threads + +MPI task timing breakdown: +Section | min time | avg time | max time |%varavg| %total +--------------------------------------------------------------- +Pair | 3.3906 | 3.3906 | 3.3906 | 0.0 | 99.97 +Neigh | 0 | 0 | 0 | 0.0 | 0.00 +Comm | 0.00039721 | 0.00039721 | 0.00039721 | 0.0 | 0.01 +Output | 0.00023007 | 0.00023007 | 0.00023007 | 0.0 | 0.01 +Modify | 0.00021887 | 0.00021887 | 0.00021887 | 0.0 | 0.01 +Other | | 0.0002868 | | | 0.01 + +Nlocal: 128 ave 128 max 128 min +Histogram: 1 0 0 0 0 0 0 0 0 0 +Nghost: 727 ave 727 max 727 min +Histogram: 1 0 0 0 0 0 0 0 0 0 +Neighs: 0 ave 0 max 0 min +Histogram: 1 0 0 0 0 0 0 0 0 0 +FullNghs: 7424 ave 7424 max 7424 min +Histogram: 1 0 0 0 0 0 0 0 0 0 + +Total # of neighbors = 7424 +Ave neighs/atom = 58 +Neighbor list builds = 0 +Dangerous builds = 0 + +Total wall time: 0:00:03 diff --git a/examples/snap/log.20Apr18.snap.Mo_Chen.g++.4 b/examples/snap/log.20Apr18.snap.Mo_Chen.g++.4 new file mode 100644 index 0000000000000000000000000000000000000000..c25f1f5530856ab7dc5492526aa168c9dafd6fad --- /dev/null +++ b/examples/snap/log.20Apr18.snap.Mo_Chen.g++.4 @@ -0,0 +1,127 @@ +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task +# Demonstrate SNAP Ta potential + +# Initialize simulation + +variable nsteps index 100 +variable nrep equal 4 +variable a equal 3.160 +units metal + +# generate the box and atom positions using a BCC lattice + +variable nx equal ${nrep} +variable nx equal 4 +variable ny equal ${nrep} +variable ny equal 4 +variable nz equal ${nrep} +variable nz equal 4 + +boundary p p p + +lattice bcc $a +lattice bcc 3.16 +Lattice spacing in x,y,z = 3.16 3.16 3.16 +region box block 0 ${nx} 0 ${ny} 0 ${nz} +region box block 0 4 0 ${ny} 0 ${nz} +region box block 0 4 0 4 0 ${nz} +region box block 0 4 0 4 0 4 +create_box 1 box +Created orthogonal box = (0 0 0) to (12.64 12.64 12.64) + 1 by 2 by 2 MPI processor grid +create_atoms 1 box +Created 128 atoms + Time spent = 0.000277281 secs + +mass 1 183.84 + +# choose potential + +include Mo_Chen_PRM2017.snap + +# DATE: 2017-09-18 CONTRIBUTOR: Chi Chen <chc273@eng.ucsd.edu> CITATION: C. Chen, Z. Deng, R. Tran, H. Tang, I.-H. Chu, S. P. Ong, "Accurate force field for molybdenum by machine learning large materials data" Physical Review Materials 1, 04 3603 (2017) +# Generated by Materials Virtual Lab +# Definition of SNAP potential. +pair_style snap +pair_coeff * * Mo_Chen_PRM2017.snapcoeff Mo Mo_Chen_PRM2017.snapparam Mo +Reading potential file Mo_Chen_PRM2017.snapcoeff with DATE: 2017-09-18 +SNAP Element = Mo, Radius 0.5, Weight 1 +Reading potential file Mo_Chen_PRM2017.snapparam with DATE: 2017-09-18 +SNAP keyword rcutfac 4.615858 +SNAP keyword twojmax 6 + + +# Setup output + +thermo 10 +thermo_modify norm yes + +# Set up NVE run + +timestep 0.5e-3 +neighbor 1.0 bin +neigh_modify once no every 1 delay 0 check yes + +# Run MD + +velocity all create 300.0 4928459 +fix 1 all nve +run ${nsteps} +run 100 +Neighbor list info ... + update every 1 steps, delay 0 steps, check yes + max neighbors/atom: 2000, page size: 100000 + master list distance cutoff = 5.61586 + ghost atom cutoff = 5.61586 + binsize = 2.80793, bins = 5 5 5 + 1 neighbor lists, perpetual/occasional/extra = 1 0 0 + (1) pair snap, perpetual + attributes: full, newton on + pair build: full/bin/atomonly + stencil: full/bin/3d + bin: standard +Per MPI rank memory allocation (min/avg/max) = 3.486 | 3.486 | 3.486 Mbytes +Step Temp E_pair E_mol TotEng Press + 0 300 -22.405975 0 -22.3675 2575.7657 + 10 294.63153 -22.405286 0 -22.3675 2753.4662 + 20 278.98535 -22.40328 0 -22.3675 3272.416 + 30 254.38916 -22.400125 0 -22.3675 4091.8933 + 40 222.91191 -22.396088 0 -22.367499 5148.5505 + 50 187.16984 -22.391504 0 -22.367499 6362.2454 + 60 150.08253 -22.386747 0 -22.367499 7643.2732 + 70 114.60307 -22.382197 0 -22.367499 8900.2448 + 80 83.449257 -22.378201 0 -22.367499 10047.619 + 90 58.862643 -22.375048 0 -22.367498 11012.233 + 100 42.41931 -22.372939 0 -22.367498 11740.641 +Loop time of 1.91636 on 4 procs for 100 steps with 128 atoms + +Performance: 2.254 ns/day, 10.646 hours/ns, 52.182 timesteps/s +97.9% CPU use with 4 MPI tasks x 1 OpenMP threads + +MPI task timing breakdown: +Section | min time | avg time | max time |%varavg| %total +--------------------------------------------------------------- +Pair | 1.8147 | 1.8411 | 1.8875 | 2.1 | 96.07 +Neigh | 0 | 0 | 0 | 0.0 | 0.00 +Comm | 0.022276 | 0.069629 | 0.095057 | 10.7 | 3.63 +Output | 0.00032496 | 0.00065821 | 0.0016179 | 0.0 | 0.03 +Modify | 0.00019503 | 0.00020915 | 0.00023341 | 0.0 | 0.01 +Other | | 0.00481 | | | 0.25 + +Nlocal: 32 ave 32 max 32 min +Histogram: 4 0 0 0 0 0 0 0 0 0 +Nghost: 431 ave 431 max 431 min +Histogram: 4 0 0 0 0 0 0 0 0 0 +Neighs: 0 ave 0 max 0 min +Histogram: 4 0 0 0 0 0 0 0 0 0 +FullNghs: 1856 ave 1856 max 1856 min +Histogram: 4 0 0 0 0 0 0 0 0 0 + +Total # of neighbors = 7424 +Ave neighs/atom = 58 +Neighbor list builds = 0 +Dangerous builds = 0 + +Total wall time: 0:00:01 diff --git a/examples/snap/log.5Oct16.snap.Ta06A.g++.1 b/examples/snap/log.20Apr18.snap.Ta06A.g++.1 similarity index 71% rename from examples/snap/log.5Oct16.snap.Ta06A.g++.1 rename to examples/snap/log.20Apr18.snap.Ta06A.g++.1 index 647ffac8b4326efa8ce7f6fca6b4ee9e577d32f5..d2296852a051bc6d12c58924a802357574a47d6e 100644 --- a/examples/snap/log.5Oct16.snap.Ta06A.g++.1 +++ b/examples/snap/log.20Apr18.snap.Ta06A.g++.1 @@ -1,4 +1,6 @@ -LAMMPS (5 Oct 2016) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,12 +33,13 @@ Created orthogonal box = (0 0 0) to (13.264 13.264 13.264) 1 by 1 by 1 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000328064 secs mass 1 180.88 # choose potential -include Ta06A_pot.snap +include Ta06A.snap # DATE: 2014-09-05 CONTRIBUTOR: Aidan Thompson athomps@sandia.gov CITATION: Thompson, Swiler, Trott, Foiles and Tucker, arxiv.org, 1409.3880 (2014) # Definition of SNAP potential Ta_Cand06A @@ -48,10 +51,9 @@ variable zblz equal 73 # Specify hybrid with SNAP, ZBL -pair_style hybrid/overlay snap zbl ${zblcutinner} ${zblcutouter} -pair_style hybrid/overlay snap zbl 4 ${zblcutouter} -pair_style hybrid/overlay snap zbl 4 4.8 - +pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap +pair_style hybrid/overlay zbl 4 ${zblcutouter} snap +pair_style hybrid/overlay zbl 4 4.8 snap pair_coeff 1 1 zbl ${zblz} ${zblz} pair_coeff 1 1 zbl 73 ${zblz} pair_coeff 1 1 zbl 73 73 @@ -61,10 +63,11 @@ SNAP Element = Ta, Radius 0.5, Weight 1 Reading potential file Ta06A.snapparam with DATE: 2014-09-05 SNAP keyword rcutfac 4.67637 SNAP keyword twojmax 6 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 # Setup output @@ -85,13 +88,23 @@ fix 1 all nve run ${nsteps} run 100 Neighbor list info ... - 2 neighbor list requests update every 1 steps, delay 0 steps, check yes max neighbors/atom: 2000, page size: 100000 master list distance cutoff = 5.8 ghost atom cutoff = 5.8 - binsize = 2.9 -> bins = 5 5 5 -Memory usage per processor = 2.92823 Mbytes + binsize = 2.9, bins = 5 5 5 + 2 neighbor lists, perpetual/occasional/extra = 2 0 0 + (1) pair zbl, perpetual, half/full from (2) + attributes: half, newton on + pair build: halffull/newton + stencil: none + bin: none + (2) pair snap, perpetual + attributes: full, newton on + pair build: full/bin/atomonly + stencil: full/bin/3d + bin: standard +Per MPI rank memory allocation (min/avg/max) = 4.138 | 4.138 | 4.138 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -11.85157 0 -11.813095 2717.1661 10 295.96579 -11.851053 0 -11.813095 2696.1559 @@ -104,20 +117,20 @@ Step Temp E_pair E_mol TotEng Press 80 124.04276 -11.829003 0 -11.813094 1537.703 90 97.37622 -11.825582 0 -11.813094 1734.9662 100 75.007873 -11.822714 0 -11.813094 1930.8005 -Loop time of 3.43062 on 1 procs for 100 steps with 128 atoms +Loop time of 2.53266 on 1 procs for 100 steps with 128 atoms -Performance: 1.259 ns/day, 19.059 hours/ns, 29.149 timesteps/s -99.9% CPU use with 1 MPI tasks x no OpenMP threads +Performance: 1.706 ns/day, 14.070 hours/ns, 39.484 timesteps/s +99.5% CPU use with 1 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 3.4295 | 3.4295 | 3.4295 | 0.0 | 99.97 +Pair | 2.5313 | 2.5313 | 2.5313 | 0.0 | 99.95 Neigh | 0 | 0 | 0 | 0.0 | 0.00 -Comm | 0.00043988 | 0.00043988 | 0.00043988 | 0.0 | 0.01 -Output | 0.00010014 | 0.00010014 | 0.00010014 | 0.0 | 0.00 -Modify | 0.00024533 | 0.00024533 | 0.00024533 | 0.0 | 0.01 -Other | | 0.0002978 | | | 0.01 +Comm | 0.00051379 | 0.00051379 | 0.00051379 | 0.0 | 0.02 +Output | 0.00023317 | 0.00023317 | 0.00023317 | 0.0 | 0.01 +Modify | 0.00023675 | 0.00023675 | 0.00023675 | 0.0 | 0.01 +Other | | 0.0003583 | | | 0.01 Nlocal: 128 ave 128 max 128 min Histogram: 1 0 0 0 0 0 0 0 0 0 @@ -133,4 +146,4 @@ Ave neighs/atom = 58 Neighbor list builds = 0 Dangerous builds = 0 -Total wall time: 0:00:03 +Total wall time: 0:00:02 diff --git a/examples/snap/log.5Oct16.snap.Ta06A.g++.4 b/examples/snap/log.20Apr18.snap.Ta06A.g++.4 similarity index 71% rename from examples/snap/log.5Oct16.snap.Ta06A.g++.4 rename to examples/snap/log.20Apr18.snap.Ta06A.g++.4 index 19d64c557c33538c702da0ddfb4fa1b30c336f8e..4d26481d5de2ccb00bbc364d70af786f458ec2e2 100644 --- a/examples/snap/log.5Oct16.snap.Ta06A.g++.4 +++ b/examples/snap/log.20Apr18.snap.Ta06A.g++.4 @@ -1,4 +1,6 @@ -LAMMPS (5 Oct 2016) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,12 +33,13 @@ Created orthogonal box = (0 0 0) to (13.264 13.264 13.264) 1 by 2 by 2 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000288486 secs mass 1 180.88 # choose potential -include Ta06A_pot.snap +include Ta06A.snap # DATE: 2014-09-05 CONTRIBUTOR: Aidan Thompson athomps@sandia.gov CITATION: Thompson, Swiler, Trott, Foiles and Tucker, arxiv.org, 1409.3880 (2014) # Definition of SNAP potential Ta_Cand06A @@ -48,10 +51,9 @@ variable zblz equal 73 # Specify hybrid with SNAP, ZBL -pair_style hybrid/overlay snap zbl ${zblcutinner} ${zblcutouter} -pair_style hybrid/overlay snap zbl 4 ${zblcutouter} -pair_style hybrid/overlay snap zbl 4 4.8 - +pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap +pair_style hybrid/overlay zbl 4 ${zblcutouter} snap +pair_style hybrid/overlay zbl 4 4.8 snap pair_coeff 1 1 zbl ${zblz} ${zblz} pair_coeff 1 1 zbl 73 ${zblz} pair_coeff 1 1 zbl 73 73 @@ -61,10 +63,11 @@ SNAP Element = Ta, Radius 0.5, Weight 1 Reading potential file Ta06A.snapparam with DATE: 2014-09-05 SNAP keyword rcutfac 4.67637 SNAP keyword twojmax 6 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 # Setup output @@ -85,13 +88,23 @@ fix 1 all nve run ${nsteps} run 100 Neighbor list info ... - 2 neighbor list requests update every 1 steps, delay 0 steps, check yes max neighbors/atom: 2000, page size: 100000 master list distance cutoff = 5.8 ghost atom cutoff = 5.8 - binsize = 2.9 -> bins = 5 5 5 -Memory usage per processor = 2.91109 Mbytes + binsize = 2.9, bins = 5 5 5 + 2 neighbor lists, perpetual/occasional/extra = 2 0 0 + (1) pair zbl, perpetual, half/full from (2) + attributes: half, newton on + pair build: halffull/newton + stencil: none + bin: none + (2) pair snap, perpetual + attributes: full, newton on + pair build: full/bin/atomonly + stencil: full/bin/3d + bin: standard +Per MPI rank memory allocation (min/avg/max) = 4.118 | 4.118 | 4.118 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -11.85157 0 -11.813095 2717.1661 10 295.8664 -11.85104 0 -11.813095 2702.935 @@ -104,20 +117,20 @@ Step Temp E_pair E_mol TotEng Press 80 121.80051 -11.828715 0 -11.813094 1627.6911 90 95.262635 -11.825311 0 -11.813094 1812.9327 100 73.194645 -11.822481 0 -11.813094 1995.2199 -Loop time of 0.89193 on 4 procs for 100 steps with 128 atoms +Loop time of 1.3621 on 4 procs for 100 steps with 128 atoms -Performance: 4.843 ns/day, 4.955 hours/ns, 112.116 timesteps/s -99.9% CPU use with 4 MPI tasks x no OpenMP threads +Performance: 3.172 ns/day, 7.567 hours/ns, 73.416 timesteps/s +98.7% CPU use with 4 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 0.84444 | 0.86772 | 0.88108 | 1.6 | 97.29 +Pair | 1.2867 | 1.309 | 1.35 | 2.1 | 96.10 Neigh | 0 | 0 | 0 | 0.0 | 0.00 -Comm | 0.009577 | 0.023049 | 0.046417 | 9.8 | 2.58 -Output | 0.00024009 | 0.00026137 | 0.00027895 | 0.1 | 0.03 -Modify | 8.2493e-05 | 9.352e-05 | 0.00010061 | 0.1 | 0.01 -Other | | 0.0008071 | | | 0.09 +Comm | 0.0096083 | 0.050652 | 0.072999 | 10.9 | 3.72 +Output | 0.00031447 | 0.00060236 | 0.0014303 | 0.0 | 0.04 +Modify | 0.00014234 | 0.00016212 | 0.00018811 | 0.0 | 0.01 +Other | | 0.001728 | | | 0.13 Nlocal: 32 ave 32 max 32 min Histogram: 4 0 0 0 0 0 0 0 0 0 @@ -133,4 +146,4 @@ Ave neighs/atom = 58 Neighbor list builds = 0 Dangerous builds = 0 -Total wall time: 0:00:00 +Total wall time: 0:00:01 diff --git a/examples/snap/log.21Feb17.snap.W.2940.g++.1 b/examples/snap/log.20Apr18.snap.W.2940.g++.1 similarity index 79% rename from examples/snap/log.21Feb17.snap.W.2940.g++.1 rename to examples/snap/log.20Apr18.snap.W.2940.g++.1 index 8c74380b8b7246dad9bf1079f17ad1ef8e56f7b8..19b2bfb40d88b1fd6dd62ab892dba1f463a48b03 100644 --- a/examples/snap/log.21Feb17.snap.W.2940.g++.1 +++ b/examples/snap/log.20Apr18.snap.W.2940.g++.1 @@ -1,4 +1,6 @@ -LAMMPS (13 Feb 2017) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,20 +33,21 @@ Created orthogonal box = (0 0 0) to (12.7212 12.7212 12.7212) 1 by 1 by 1 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000190258 secs mass 1 183.84 # choose potential -include W_2940_2017_2.pot.snap -# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. to appear in arxiv Feb2017 +include W_2940_2017_2.snap +# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. "Quantum-Accurate Molecular Dynamics Potential for Tungsten" arXiv:1702.07042 [physics.comp-ph] # # Definition of SNAP+ZBL potential. variable zblcutinner equal 4 variable zblcutouter equal 4.8 variable zblz equal 74 -# Specify hybrid with SNAP, ZBL, and long-range Coulomb +# Specify hybrid with SNAP and ZBL pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap pair_style hybrid/overlay zbl 4 ${zblcutouter} snap @@ -58,10 +61,11 @@ SNAP Element = W, Radius 0.5, Weight 1 Reading potential file W_2940_2017_2.snapparam with DATE: 2017-02-20 SNAP keyword rcutfac 4.73442 SNAP keyword twojmax 8 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 #Nomenclature on the snap files are Element_DakotaID_Year_Month @@ -99,7 +103,7 @@ Neighbor list info ... pair build: full/bin/atomonly stencil: full/bin/3d bin: standard -Memory usage per processor = 5.14696 Mbytes +Per MPI rank memory allocation (min/avg/max) = 5.15 | 5.15 | 5.15 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -11.028325 0 -10.98985 3010.497 10 293.40666 -11.027479 0 -10.989849 3246.0559 @@ -112,20 +116,20 @@ Step Temp E_pair E_mol TotEng Press 80 58.605244 -10.997364 0 -10.989848 11289.914 90 39.754503 -10.994946 0 -10.989848 11824.945 100 32.524085 -10.994019 0 -10.989848 11932.118 -Loop time of 11.8271 on 1 procs for 100 steps with 128 atoms +Loop time of 9.69738 on 1 procs for 100 steps with 128 atoms -Performance: 0.365 ns/day, 65.706 hours/ns, 8.455 timesteps/s -99.9% CPU use with 1 MPI tasks x no OpenMP threads +Performance: 0.445 ns/day, 53.874 hours/ns, 10.312 timesteps/s +99.8% CPU use with 1 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 11.826 | 11.826 | 11.826 | 0.0 | 99.99 +Pair | 9.6961 | 9.6961 | 9.6961 | 0.0 | 99.99 Neigh | 0 | 0 | 0 | 0.0 | 0.00 -Comm | 0.00044084 | 0.00044084 | 0.00044084 | 0.0 | 0.00 -Output | 0.00013232 | 0.00013232 | 0.00013232 | 0.0 | 0.00 -Modify | 0.00021887 | 0.00021887 | 0.00021887 | 0.0 | 0.00 -Other | | 0.0002718 | | | 0.00 +Comm | 0.00044036 | 0.00044036 | 0.00044036 | 0.0 | 0.00 +Output | 0.00024843 | 0.00024843 | 0.00024843 | 0.0 | 0.00 +Modify | 0.00023937 | 0.00023937 | 0.00023937 | 0.0 | 0.00 +Other | | 0.0003347 | | | 0.00 Nlocal: 128 ave 128 max 128 min Histogram: 1 0 0 0 0 0 0 0 0 0 @@ -141,4 +145,4 @@ Ave neighs/atom = 58 Neighbor list builds = 0 Dangerous builds = 0 -Total wall time: 0:00:11 +Total wall time: 0:00:09 diff --git a/examples/snap/log.21Feb17.snap.W.2940.g++.4 b/examples/snap/log.20Apr18.snap.W.2940.g++.4 similarity index 79% rename from examples/snap/log.21Feb17.snap.W.2940.g++.4 rename to examples/snap/log.20Apr18.snap.W.2940.g++.4 index 97ed5cc8d12728a0e1d9fb2bc79729188ad7c569..dfa63fc6ea208d4552b8533a1a32fd73bc88d4fe 100644 --- a/examples/snap/log.21Feb17.snap.W.2940.g++.4 +++ b/examples/snap/log.20Apr18.snap.W.2940.g++.4 @@ -1,4 +1,6 @@ -LAMMPS (13 Feb 2017) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,20 +33,21 @@ Created orthogonal box = (0 0 0) to (12.7212 12.7212 12.7212) 1 by 2 by 2 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000309944 secs mass 1 183.84 # choose potential -include W_2940_2017_2.pot.snap -# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. to appear in arxiv Feb2017 +include W_2940_2017_2.snap +# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. "Quantum-Accurate Molecular Dynamics Potential for Tungsten" arXiv:1702.07042 [physics.comp-ph] # # Definition of SNAP+ZBL potential. variable zblcutinner equal 4 variable zblcutouter equal 4.8 variable zblz equal 74 -# Specify hybrid with SNAP, ZBL, and long-range Coulomb +# Specify hybrid with SNAP and ZBL pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap pair_style hybrid/overlay zbl 4 ${zblcutouter} snap @@ -58,10 +61,11 @@ SNAP Element = W, Radius 0.5, Weight 1 Reading potential file W_2940_2017_2.snapparam with DATE: 2017-02-20 SNAP keyword rcutfac 4.73442 SNAP keyword twojmax 8 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 #Nomenclature on the snap files are Element_DakotaID_Year_Month @@ -99,7 +103,7 @@ Neighbor list info ... pair build: full/bin/atomonly stencil: full/bin/3d bin: standard -Memory usage per processor = 5.12833 Mbytes +Per MPI rank memory allocation (min/avg/max) = 5.13 | 5.13 | 5.13 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -11.028325 0 -10.98985 3010.497 10 293.22504 -11.027456 0 -10.989849 3258.275 @@ -112,20 +116,20 @@ Step Temp E_pair E_mol TotEng Press 80 56.127265 -10.997046 0 -10.989848 11551.687 90 38.025013 -10.994724 0 -10.989847 12069.936 100 31.768127 -10.993922 0 -10.989847 12145.648 -Loop time of 3.03545 on 4 procs for 100 steps with 128 atoms +Loop time of 5.15615 on 4 procs for 100 steps with 128 atoms -Performance: 1.423 ns/day, 16.864 hours/ns, 32.944 timesteps/s -99.9% CPU use with 4 MPI tasks x no OpenMP threads +Performance: 0.838 ns/day, 28.645 hours/ns, 19.394 timesteps/s +98.9% CPU use with 4 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 2.9594 | 2.9866 | 3.0319 | 1.6 | 98.39 +Pair | 5.0497 | 5.0762 | 5.092 | 0.8 | 98.45 Neigh | 0 | 0 | 0 | 0.0 | 0.00 -Comm | 0.0024238 | 0.047825 | 0.075032 | 12.5 | 1.58 -Output | 0.00021601 | 0.00024045 | 0.00027442 | 0.0 | 0.01 -Modify | 9.6798e-05 | 0.00011188 | 0.00011802 | 0.0 | 0.00 -Other | | 0.000698 | | | 0.02 +Comm | 0.060802 | 0.07661 | 0.10305 | 6.1 | 1.49 +Output | 0.00040722 | 0.00078458 | 0.0018959 | 0.0 | 0.02 +Modify | 0.0002389 | 0.00024962 | 0.00027442 | 0.0 | 0.00 +Other | | 0.002315 | | | 0.04 Nlocal: 32 ave 32 max 32 min Histogram: 4 0 0 0 0 0 0 0 0 0 @@ -141,4 +145,4 @@ Ave neighs/atom = 58 Neighbor list builds = 0 Dangerous builds = 0 -Total wall time: 0:00:03 +Total wall time: 0:00:05 diff --git a/examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.1 b/examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.1 similarity index 83% rename from examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.1 rename to examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.1 index 846eef269ce580ca63d730be0fb1ced38da1bf58..3f40936308b21d4e3d0ed1e8e83145c5cfd9d0f7 100644 --- a/examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.1 +++ b/examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.1 @@ -1,4 +1,6 @@ -LAMMPS (13 Feb 2017) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,6 +33,7 @@ Created orthogonal box = (0 0 0) to (12.7212 12.7212 12.7212) 1 by 1 by 1 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000431538 secs mass 1 183.84 mass 2 4.0026 @@ -42,15 +45,15 @@ group helium type 2 5 atoms in group helium # choose potential -include W.SNAP_HePair.pot -# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. to appear in arxiv Feb2017, W-He and He-He from Juslin, N. and Wirth, B. D. Journal of Nuclear Materials, 423, (2013) p61-63 +include W_2940_2017_2_He_JW2013.snap +# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. "Quantum-Accurate Molecular Dynamics Potential for Tungsten" arXiv:1702.07042 [physics.comp-ph] # # Definition of SNAP+ZBL+Tabulated potential. variable zblcutinner equal 4 variable zblcutouter equal 4.8 variable zblz equal 74 -# Specify hybrid with SNAP, ZBL, and long-range Coulomb +# Specify hybrid with SNAP and ZBL pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap table spline 10000 table spline 10000 pair_style hybrid/overlay zbl 4 ${zblcutouter} snap table spline 10000 table spline 10000 @@ -64,18 +67,19 @@ SNAP Element = W, Radius 0.5, Weight 1 Reading potential file W_2940_2017_2.snapparam with DATE: 2017-02-20 SNAP keyword rcutfac 4.73442 SNAP keyword twojmax 8 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 pair_coeff 2 2 table 1 He_He_JW2013.table HeHe Reading potential file He_He_JW2013.table with DATE: 2017-02-20 WARNING: 1 of 4999 force values in table are inconsistent with -dE/dr. - Should only be flagged at inflection points (../pair_table.cpp:476) + Should only be flagged at inflection points (../pair_table.cpp:481) pair_coeff 1 2 table 2 W_He_JW2013.table WHe Reading potential file W_He_JW2013.table with DATE: 2017-02-20 WARNING: 3 of 325 force values in table are inconsistent with -dE/dr. - Should only be flagged at inflection points (../pair_table.cpp:476) + Should only be flagged at inflection points (../pair_table.cpp:481) #Hybrid/overlay will take all pair styles and add their contributions equally, order of pair_coeff doesnt matter here #This is not the case for pair_style hybrid ... where only one pair_coeff is read for each type combination, order matters here. @@ -134,7 +138,7 @@ Neighbor list info ... pair build: full/bin/atomonly stencil: full/bin/3d bin: standard -Memory usage per processor = 7.6729 Mbytes +Per MPI rank memory allocation (min/avg/max) = 7.676 | 7.676 | 7.676 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -10.438105 0 -10.39963 -5445.2808 10 290.48923 -10.436885 0 -10.399629 -5646.4813 @@ -147,20 +151,20 @@ Step Temp E_pair E_mol TotEng Press 80 85.903126 -10.410645 0 -10.399628 857.74986 90 65.223651 -10.407993 0 -10.399628 1494.2746 100 59.833542 -10.407302 0 -10.399628 1938.9164 -Loop time of 11.0736 on 1 procs for 100 steps with 128 atoms +Loop time of 8.902 on 1 procs for 100 steps with 128 atoms -Performance: 0.390 ns/day, 61.520 hours/ns, 9.030 timesteps/s -99.9% CPU use with 1 MPI tasks x no OpenMP threads +Performance: 0.485 ns/day, 49.456 hours/ns, 11.233 timesteps/s +99.8% CPU use with 1 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 11.072 | 11.072 | 11.072 | 0.0 | 99.99 -Neigh | 0.00041604 | 0.00041604 | 0.00041604 | 0.0 | 0.00 -Comm | 0.00046253 | 0.00046253 | 0.00046253 | 0.0 | 0.00 -Output | 0.0001657 | 0.0001657 | 0.0001657 | 0.0 | 0.00 -Modify | 0.0002265 | 0.0002265 | 0.0002265 | 0.0 | 0.00 -Other | | 0.0003119 | | | 0.00 +Pair | 8.9002 | 8.9002 | 8.9002 | 0.0 | 99.98 +Neigh | 0.00043058 | 0.00043058 | 0.00043058 | 0.0 | 0.00 +Comm | 0.00045776 | 0.00045776 | 0.00045776 | 0.0 | 0.01 +Output | 0.00025344 | 0.00025344 | 0.00025344 | 0.0 | 0.00 +Modify | 0.00022483 | 0.00022483 | 0.00022483 | 0.0 | 0.00 +Other | | 0.0003953 | | | 0.00 Nlocal: 128 ave 128 max 128 min Histogram: 1 0 0 0 0 0 0 0 0 0 @@ -176,4 +180,4 @@ Ave neighs/atom = 53.5156 Neighbor list builds = 1 Dangerous builds = 0 -Total wall time: 0:00:11 +Total wall time: 0:00:09 diff --git a/examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.4 b/examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.4 similarity index 84% rename from examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.4 rename to examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.4 index 9bcbd288aa664cf29025090e8c0937e2580d905a..4ec85a63d014085449367848dbfd2c6f787a41e4 100644 --- a/examples/snap/log.21Feb17.snap.hybrid.WSNAP.HePair.g++.4 +++ b/examples/snap/log.20Apr18.snap.hybrid.WSNAP.HePair.g++.4 @@ -1,4 +1,6 @@ -LAMMPS (13 Feb 2017) +LAMMPS (20 Apr 2018) +OMP_NUM_THREADS environment is not set. Defaulting to 1 thread. (../comm.cpp:90) + using 1 OpenMP thread(s) per MPI task # Demonstrate SNAP Ta potential # Initialize simulation @@ -31,6 +33,7 @@ Created orthogonal box = (0 0 0) to (12.7212 12.7212 12.7212) 1 by 2 by 2 MPI processor grid create_atoms 1 box Created 128 atoms + Time spent = 0.000274658 secs mass 1 183.84 mass 2 4.0026 @@ -42,15 +45,15 @@ group helium type 2 5 atoms in group helium # choose potential -include W.SNAP_HePair.pot -# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. to appear in arxiv Feb2017, W-He and He-He from Juslin, N. and Wirth, B. D. Journal of Nuclear Materials, 423, (2013) p61-63 +include W_2940_2017_2_He_JW2013.snap +# DATE: 2017-02-20 CONTRIBUTOR: Mitchell Wood mitwood@sandia.gov CITATION: Wood, M. A. and Thompson, A. P. "Quantum-Accurate Molecular Dynamics Potential for Tungsten" arXiv:1702.07042 [physics.comp-ph] # # Definition of SNAP+ZBL+Tabulated potential. variable zblcutinner equal 4 variable zblcutouter equal 4.8 variable zblz equal 74 -# Specify hybrid with SNAP, ZBL, and long-range Coulomb +# Specify hybrid with SNAP and ZBL pair_style hybrid/overlay zbl ${zblcutinner} ${zblcutouter} snap table spline 10000 table spline 10000 pair_style hybrid/overlay zbl 4 ${zblcutouter} snap table spline 10000 table spline 10000 @@ -64,18 +67,19 @@ SNAP Element = W, Radius 0.5, Weight 1 Reading potential file W_2940_2017_2.snapparam with DATE: 2017-02-20 SNAP keyword rcutfac 4.73442 SNAP keyword twojmax 8 -SNAP keyword gamma 1 SNAP keyword rfac0 0.99363 SNAP keyword rmin0 0 SNAP keyword diagonalstyle 3 +SNAP keyword bzeroflag 0 +SNAP keyword quadraticflag 0 pair_coeff 2 2 table 1 He_He_JW2013.table HeHe Reading potential file He_He_JW2013.table with DATE: 2017-02-20 WARNING: 1 of 4999 force values in table are inconsistent with -dE/dr. - Should only be flagged at inflection points (../pair_table.cpp:476) + Should only be flagged at inflection points (../pair_table.cpp:481) pair_coeff 1 2 table 2 W_He_JW2013.table WHe Reading potential file W_He_JW2013.table with DATE: 2017-02-20 WARNING: 3 of 325 force values in table are inconsistent with -dE/dr. - Should only be flagged at inflection points (../pair_table.cpp:476) + Should only be flagged at inflection points (../pair_table.cpp:481) #Hybrid/overlay will take all pair styles and add their contributions equally, order of pair_coeff doesnt matter here #This is not the case for pair_style hybrid ... where only one pair_coeff is read for each type combination, order matters here. @@ -134,7 +138,7 @@ Neighbor list info ... pair build: full/bin/atomonly stencil: full/bin/3d bin: standard -Memory usage per processor = 7.65426 Mbytes +Per MPI rank memory allocation (min/avg/max) = 7.656 | 7.656 | 7.656 Mbytes Step Temp E_pair E_mol TotEng Press 0 300 -10.438105 0 -10.39963 -5445.2808 10 292.13979 -10.437097 0 -10.39963 -5516.3963 @@ -147,20 +151,20 @@ Step Temp E_pair E_mol TotEng Press 80 79.985938 -10.409886 0 -10.399628 2392.1106 90 62.568933 -10.407652 0 -10.399628 3141.7027 100 56.697933 -10.406899 0 -10.399628 3583.9538 -Loop time of 2.8757 on 4 procs for 100 steps with 128 atoms +Loop time of 4.82103 on 4 procs for 100 steps with 128 atoms -Performance: 1.502 ns/day, 15.976 hours/ns, 34.774 timesteps/s -99.9% CPU use with 4 MPI tasks x no OpenMP threads +Performance: 0.896 ns/day, 26.783 hours/ns, 20.742 timesteps/s +99.0% CPU use with 4 MPI tasks x 1 OpenMP threads MPI task timing breakdown: Section | min time | avg time | max time |%varavg| %total --------------------------------------------------------------- -Pair | 2.7363 | 2.8122 | 2.8636 | 2.9 | 97.79 +Pair | 4.4837 | 4.6734 | 4.7605 | 5.2 | 96.94 Neigh | 0 | 0 | 0 | 0.0 | 0.00 -Comm | 0.011014 | 0.062439 | 0.13842 | 19.3 | 2.17 -Output | 0.00023842 | 0.00025076 | 0.0002861 | 0.0 | 0.01 -Modify | 9.2506e-05 | 9.9301e-05 | 0.00010395 | 0.0 | 0.00 -Other | | 0.0006654 | | | 0.02 +Comm | 0.057389 | 0.14453 | 0.33421 | 29.4 | 3.00 +Output | 0.00038719 | 0.00073916 | 0.0017841 | 0.0 | 0.02 +Modify | 0.00018716 | 0.00022203 | 0.00026417 | 0.0 | 0.00 +Other | | 0.002119 | | | 0.04 Nlocal: 32 ave 32 max 32 min Histogram: 4 0 0 0 0 0 0 0 0 0 @@ -176,4 +180,4 @@ Ave neighs/atom = 53.5156 Neighbor list builds = 0 Dangerous builds = 0 -Total wall time: 0:00:02 +Total wall time: 0:00:04 diff --git a/src/SNAP/compute_sna_atom.cpp b/src/SNAP/compute_sna_atom.cpp index 4b114d9ce777714ee305311398421979b99f69b7..9f56cee3f1500bce3f63680e3b6fb5e398468236 100644 --- a/src/SNAP/compute_sna_atom.cpp +++ b/src/SNAP/compute_sna_atom.cpp @@ -276,9 +276,13 @@ void ComputeSNAAtom::compute_peratom() for (int icoeff = 0; icoeff < ncoeff; icoeff++) { double bi = snaptr[tid]->bvec[icoeff]; + // diagonal element of quadratic matrix + + sna[i][ncount++] = 0.5*bi*bi; + // upper-triangular elements of quadratic matrix - for (int jcoeff = icoeff; jcoeff < ncoeff; jcoeff++) + for (int jcoeff = icoeff+1; jcoeff < ncoeff; jcoeff++) sna[i][ncount++] = bi*snaptr[tid]->bvec[jcoeff]; } } diff --git a/src/SNAP/compute_snad_atom.cpp b/src/SNAP/compute_snad_atom.cpp index 54a6ce761248c3ee6fcb2c4ab14fce16e5520e00..3db0c84854f97c3d9646afacc87e7fb599fbc9f2 100644 --- a/src/SNAP/compute_snad_atom.cpp +++ b/src/SNAP/compute_snad_atom.cpp @@ -95,6 +95,11 @@ ComputeSNADAtom::ComputeSNADAtom(LAMMPS *lmp, int narg, char **arg) : error->all(FLERR,"Illegal compute snad/atom command"); rmin0 = atof(arg[iarg+1]); iarg += 2; + } else if (strcmp(arg[iarg],"bzeroflag") == 0) { + if (iarg+2 > narg) + error->all(FLERR,"Illegal compute snad/atom command"); + bzeroflag = atoi(arg[iarg+1]); + iarg += 2; } else if (strcmp(arg[iarg],"switchflag") == 0) { if (iarg+2 > narg) error->all(FLERR,"Illegal compute snad/atom command"); @@ -121,16 +126,11 @@ ComputeSNADAtom::ComputeSNADAtom(LAMMPS *lmp, int narg, char **arg) : } ncoeff = snaptr[0]->ncoeff; - twoncoeff = 2*ncoeff; - threencoeff = 3*ncoeff; - size_peratom_cols = threencoeff*atom->ntypes; - if (quadraticflag) { - ncoeffq = (ncoeff*(ncoeff+1))/2; - twoncoeffq = 2*ncoeffq; - threencoeffq = 3*ncoeffq; - size_peratom_cols += - threencoeffq*atom->ntypes; - } + nperdim = ncoeff; + if (quadraticflag) nperdim += (ncoeff*(ncoeff+1))/2; + yoffset = nperdim; + zoffset = 2*nperdim; + size_peratom_cols = 3*nperdim*atom->ntypes; comm_reverse = size_peratom_cols; peratom_flag = 1; @@ -248,9 +248,10 @@ void ComputeSNADAtom::compute_peratom() const int* const jlist = firstneigh[i]; const int jnum = numneigh[i]; - const int typeoffset = threencoeff*(atom->type[i]-1); - const int quadraticoffset = threencoeff*atom->ntypes + - threencoeffq*(atom->type[i]-1); + // const int typeoffset = threencoeff*(atom->type[i]-1); + // const int quadraticoffset = threencoeff*atom->ntypes + + // threencoeffq*(atom->type[i]-1); + const int typeoffset = 3*nperdim*(atom->type[i]-1); // insure rij, inside, and typej are of size jnum @@ -304,16 +305,17 @@ void ComputeSNADAtom::compute_peratom() for (int icoeff = 0; icoeff < ncoeff; icoeff++) { snadi[icoeff] += snaptr[tid]->dbvec[icoeff][0]; - snadi[icoeff+ncoeff] += snaptr[tid]->dbvec[icoeff][1]; - snadi[icoeff+twoncoeff] += snaptr[tid]->dbvec[icoeff][2]; + snadi[icoeff+yoffset] += snaptr[tid]->dbvec[icoeff][1]; + snadi[icoeff+zoffset] += snaptr[tid]->dbvec[icoeff][2]; snadj[icoeff] -= snaptr[tid]->dbvec[icoeff][0]; - snadj[icoeff+ncoeff] -= snaptr[tid]->dbvec[icoeff][1]; - snadj[icoeff+twoncoeff] -= snaptr[tid]->dbvec[icoeff][2]; + snadj[icoeff+yoffset] -= snaptr[tid]->dbvec[icoeff][1]; + snadj[icoeff+zoffset] -= snaptr[tid]->dbvec[icoeff][2]; } if (quadraticflag) { - double *snadi = snad[i]+quadraticoffset; - double *snadj = snad[j]+quadraticoffset; + const int quadraticoffset = ncoeff; + snadi += quadraticoffset; + snadj += quadraticoffset; int ncount = 0; for (int icoeff = 0; icoeff < ncoeff; icoeff++) { double bi = snaptr[tid]->bvec[icoeff]; @@ -321,21 +323,36 @@ void ComputeSNADAtom::compute_peratom() double biy = snaptr[tid]->dbvec[icoeff][1]; double biz = snaptr[tid]->dbvec[icoeff][2]; + // diagonal elements of quadratic matrix + + double dbxtmp = bi*bix; + double dbytmp = bi*biy; + double dbztmp = bi*biz; + + snadi[ncount] += dbxtmp; + snadi[ncount+yoffset] += dbytmp; + snadi[ncount+zoffset] += dbztmp; + snadj[ncount] -= dbxtmp; + snadj[ncount+yoffset] -= dbytmp; + snadj[ncount+zoffset] -= dbztmp; + ncount++; + // upper-triangular elements of quadratic matrix - for (int jcoeff = icoeff; jcoeff < ncoeff; jcoeff++) { + for (int jcoeff = icoeff+1; jcoeff < ncoeff; jcoeff++) { double dbxtmp = bi*snaptr[tid]->dbvec[jcoeff][0] + bix*snaptr[tid]->bvec[jcoeff]; double dbytmp = bi*snaptr[tid]->dbvec[jcoeff][1] + biy*snaptr[tid]->bvec[jcoeff]; double dbztmp = bi*snaptr[tid]->dbvec[jcoeff][2] + biz*snaptr[tid]->bvec[jcoeff]; - snadi[ncount] += dbxtmp; - snadi[ncount+ncoeffq] += dbytmp; - snadi[ncount+twoncoeffq] += dbztmp; - snadj[ncount] -= dbxtmp; - snadj[ncount+ncoeffq] -= dbytmp; - snadj[ncount+twoncoeffq] -= dbztmp; + + snadi[ncount] += dbxtmp; + snadi[ncount+yoffset] += dbytmp; + snadi[ncount+zoffset] += dbztmp; + snadj[ncount] -= dbxtmp; + snadj[ncount+yoffset] -= dbytmp; + snadj[ncount+zoffset] -= dbztmp; ncount++; } } @@ -361,7 +378,7 @@ int ComputeSNADAtom::pack_reverse_comm(int n, int first, double *buf) for (i = first; i < last; i++) for (icoeff = 0; icoeff < size_peratom_cols; icoeff++) buf[m++] = snad[i][icoeff]; - return comm_reverse; + return m; } /* ---------------------------------------------------------------------- */ @@ -387,8 +404,7 @@ double ComputeSNADAtom::memory_usage() double bytes = nmax*size_peratom_cols * sizeof(double); bytes += 3*njmax*sizeof(double); bytes += njmax*sizeof(int); - bytes += threencoeff*atom->ntypes; - if (quadraticflag) bytes += threencoeffq*atom->ntypes; + bytes += 3*nperdim*atom->ntypes; bytes += snaptr[0]->memory_usage()*comm->nthreads; return bytes; } diff --git a/src/SNAP/compute_snad_atom.h b/src/SNAP/compute_snad_atom.h index 5e40632d8c5c61f7970428ce79ed1241c794c54c..a33e6047c2c2bd0fca6d25d8a2b948fef9f7d4f9 100644 --- a/src/SNAP/compute_snad_atom.h +++ b/src/SNAP/compute_snad_atom.h @@ -37,7 +37,7 @@ class ComputeSNADAtom : public Compute { private: int nmax, njmax, diagonalstyle; - int ncoeff, twoncoeff, threencoeff, ncoeffq, twoncoeffq, threencoeffq; + int ncoeff, nperdim, yoffset, zoffset; double **cutsq; class NeighList *list; double **snad; diff --git a/src/SNAP/compute_snav_atom.cpp b/src/SNAP/compute_snav_atom.cpp index 0278be5a97414f8dd9fb9ba681edd33255ecfbed..578f86ae5b50224d880d9ac6cebc63987f8b1ac9 100644 --- a/src/SNAP/compute_snav_atom.cpp +++ b/src/SNAP/compute_snav_atom.cpp @@ -96,6 +96,11 @@ ComputeSNAVAtom::ComputeSNAVAtom(LAMMPS *lmp, int narg, char **arg) : error->all(FLERR,"Illegal compute snav/atom command"); switchflag = atoi(arg[iarg+1]); iarg += 2; + } else if (strcmp(arg[iarg],"bzeroflag") == 0) { + if (iarg+2 > narg) + error->all(FLERR,"Illegal compute snav/atom command"); + bzeroflag = atoi(arg[iarg+1]); + iarg += 2; } else if (strcmp(arg[iarg],"quadraticflag") == 0) { if (iarg+2 > narg) error->all(FLERR,"Illegal compute snav/atom command"); @@ -117,22 +122,9 @@ ComputeSNAVAtom::ComputeSNAVAtom(LAMMPS *lmp, int narg, char **arg) : } ncoeff = snaptr[0]->ncoeff; - twoncoeff = 2*ncoeff; - threencoeff = 3*ncoeff; - fourncoeff = 4*ncoeff; - fivencoeff = 5*ncoeff; - sixncoeff = 6*ncoeff; - size_peratom_cols = sixncoeff*atom->ntypes; - if (quadraticflag) { - ncoeffq = ncoeff*ncoeff; - twoncoeffq = 2*ncoeffq; - threencoeffq = 3*ncoeffq; - fourncoeffq = 4*ncoeffq; - fivencoeffq = 5*ncoeffq; - sixncoeffq = 6*ncoeffq; - size_peratom_cols += - sixncoeffq*atom->ntypes; - } + nperdim = ncoeff; + if (quadraticflag) nperdim += (ncoeff*(ncoeff+1))/2; + size_peratom_cols = 6*nperdim*atom->ntypes; comm_reverse = size_peratom_cols; peratom_flag = 1; @@ -251,9 +243,7 @@ void ComputeSNAVAtom::compute_peratom() const int* const jlist = firstneigh[i]; const int jnum = numneigh[i]; - const int typeoffset = sixncoeff*(atom->type[i]-1); - const int quadraticoffset = sixncoeff*atom->ntypes + - sixncoeffq*(atom->type[i]-1); + const int typeoffset = 6*nperdim*(atom->type[i]-1); // insure rij, inside, and typej are of size jnum @@ -307,23 +297,24 @@ void ComputeSNAVAtom::compute_peratom() double *snavj = snav[j]+typeoffset; for (int icoeff = 0; icoeff < ncoeff; icoeff++) { - snavi[icoeff] += snaptr[tid]->dbvec[icoeff][0]*xtmp; - snavi[icoeff+ncoeff] += snaptr[tid]->dbvec[icoeff][1]*ytmp; - snavi[icoeff+twoncoeff] += snaptr[tid]->dbvec[icoeff][2]*ztmp; - snavi[icoeff+threencoeff] += snaptr[tid]->dbvec[icoeff][1]*ztmp; - snavi[icoeff+fourncoeff] += snaptr[tid]->dbvec[icoeff][0]*ztmp; - snavi[icoeff+fivencoeff] += snaptr[tid]->dbvec[icoeff][0]*ytmp; - snavj[icoeff] -= snaptr[tid]->dbvec[icoeff][0]*x[j][0]; - snavj[icoeff+ncoeff] -= snaptr[tid]->dbvec[icoeff][1]*x[j][1]; - snavj[icoeff+twoncoeff] -= snaptr[tid]->dbvec[icoeff][2]*x[j][2]; - snavj[icoeff+threencoeff] -= snaptr[tid]->dbvec[icoeff][1]*x[j][2]; - snavj[icoeff+fourncoeff] -= snaptr[tid]->dbvec[icoeff][0]*x[j][2]; - snavj[icoeff+fivencoeff] -= snaptr[tid]->dbvec[icoeff][0]*x[j][1]; + snavi[icoeff] += snaptr[tid]->dbvec[icoeff][0]*xtmp; + snavi[icoeff+nperdim] += snaptr[tid]->dbvec[icoeff][1]*ytmp; + snavi[icoeff+2*nperdim] += snaptr[tid]->dbvec[icoeff][2]*ztmp; + snavi[icoeff+3*nperdim] += snaptr[tid]->dbvec[icoeff][1]*ztmp; + snavi[icoeff+4*nperdim] += snaptr[tid]->dbvec[icoeff][0]*ztmp; + snavi[icoeff+5*nperdim] += snaptr[tid]->dbvec[icoeff][0]*ytmp; + snavj[icoeff] -= snaptr[tid]->dbvec[icoeff][0]*x[j][0]; + snavj[icoeff+nperdim] -= snaptr[tid]->dbvec[icoeff][1]*x[j][1]; + snavj[icoeff+2*nperdim] -= snaptr[tid]->dbvec[icoeff][2]*x[j][2]; + snavj[icoeff+3*nperdim] -= snaptr[tid]->dbvec[icoeff][1]*x[j][2]; + snavj[icoeff+4*nperdim] -= snaptr[tid]->dbvec[icoeff][0]*x[j][2]; + snavj[icoeff+5*nperdim] -= snaptr[tid]->dbvec[icoeff][0]*x[j][1]; } if (quadraticflag) { - double *snavi = snav[i]+quadraticoffset; - double *snavj = snav[j]+quadraticoffset; + const int quadraticoffset = ncoeff; + snavi += quadraticoffset; + snavj += quadraticoffset; int ncount = 0; for (int icoeff = 0; icoeff < ncoeff; icoeff++) { double bi = snaptr[tid]->bvec[icoeff]; @@ -331,27 +322,46 @@ void ComputeSNAVAtom::compute_peratom() double biy = snaptr[tid]->dbvec[icoeff][1]; double biz = snaptr[tid]->dbvec[icoeff][2]; + // diagonal element of quadratic matrix + + double dbxtmp = bi*bix; + double dbytmp = bi*biy; + double dbztmp = bi*biz; + snavi[ncount] += dbxtmp*xtmp; + snavi[ncount+nperdim] += dbytmp*ytmp; + snavi[ncount+2*nperdim] += dbztmp*ztmp; + snavi[ncount+3*nperdim] += dbytmp*ztmp; + snavi[ncount+4*nperdim] += dbxtmp*ztmp; + snavi[ncount+5*nperdim] += dbxtmp*ytmp; + snavj[ncount] -= dbxtmp*x[j][0]; + snavj[ncount+nperdim] -= dbytmp*x[j][1]; + snavj[ncount+2*nperdim] -= dbztmp*x[j][2]; + snavj[ncount+3*nperdim] -= dbytmp*x[j][2]; + snavj[ncount+4*nperdim] -= dbxtmp*x[j][2]; + snavj[ncount+5*nperdim] -= dbxtmp*x[j][1]; + ncount++; + // upper-triangular elements of quadratic matrix - for (int jcoeff = icoeff; jcoeff < ncoeff; jcoeff++) { + for (int jcoeff = icoeff+1; jcoeff < ncoeff; jcoeff++) { double dbxtmp = bi*snaptr[tid]->dbvec[jcoeff][0] + bix*snaptr[tid]->bvec[jcoeff]; double dbytmp = bi*snaptr[tid]->dbvec[jcoeff][1] + biy*snaptr[tid]->bvec[jcoeff]; double dbztmp = bi*snaptr[tid]->dbvec[jcoeff][2] + biz*snaptr[tid]->bvec[jcoeff]; - snavi[ncount] += dbxtmp*xtmp; - snavi[ncount+ncoeffq] += dbytmp*ytmp; - snavi[ncount+twoncoeffq] += dbztmp*ztmp; - snavi[ncount+threencoeffq] += dbytmp*ztmp; - snavi[ncount+fourncoeffq] += dbxtmp*ztmp; - snavi[ncount+fivencoeffq] += dbxtmp*ytmp; - snavj[ncount] -= dbxtmp*x[j][0]; - snavj[ncount+ncoeffq] -= dbytmp*x[j][1]; - snavj[ncount+twoncoeffq] -= dbztmp*x[j][2]; - snavj[ncount+threencoeffq] -= dbytmp*x[j][2]; - snavj[ncount+fourncoeffq] -= dbxtmp*x[j][2]; - snavj[ncount+fivencoeffq] -= dbxtmp*x[j][1]; + snavi[ncount] += dbxtmp*xtmp; + snavi[ncount+nperdim] += dbytmp*ytmp; + snavi[ncount+2*nperdim] += dbztmp*ztmp; + snavi[ncount+3*nperdim] += dbytmp*ztmp; + snavi[ncount+4*nperdim] += dbxtmp*ztmp; + snavi[ncount+5*nperdim] += dbxtmp*ytmp; + snavj[ncount] -= dbxtmp*x[j][0]; + snavj[ncount+nperdim] -= dbytmp*x[j][1]; + snavj[ncount+2*nperdim] -= dbztmp*x[j][2]; + snavj[ncount+3*nperdim] -= dbytmp*x[j][2]; + snavj[ncount+4*nperdim] -= dbxtmp*x[j][2]; + snavj[ncount+5*nperdim] -= dbxtmp*x[j][1]; ncount++; } } @@ -377,7 +387,7 @@ int ComputeSNAVAtom::pack_reverse_comm(int n, int first, double *buf) for (i = first; i < last; i++) for (icoeff = 0; icoeff < size_peratom_cols; icoeff++) buf[m++] = snav[i][icoeff]; - return comm_reverse; + return m; } /* ---------------------------------------------------------------------- */ @@ -403,8 +413,8 @@ double ComputeSNAVAtom::memory_usage() double bytes = nmax*size_peratom_cols * sizeof(double); bytes += 3*njmax*sizeof(double); bytes += njmax*sizeof(int); - bytes += sixncoeff*atom->ntypes; - if (quadraticflag) bytes += sixncoeffq*atom->ntypes; + bytes += 6*nperdim*atom->ntypes; + if (quadraticflag) bytes += 6*nperdim*atom->ntypes; bytes += snaptr[0]->memory_usage()*comm->nthreads; return bytes; } diff --git a/src/SNAP/compute_snav_atom.h b/src/SNAP/compute_snav_atom.h index 35f1478393520dc9f2a687a0db86201b0ca5e52c..2eb9fb804f7420aab541b5995b81e39a2ca83766 100644 --- a/src/SNAP/compute_snav_atom.h +++ b/src/SNAP/compute_snav_atom.h @@ -37,8 +37,7 @@ class ComputeSNAVAtom : public Compute { private: int nmax, njmax, diagonalstyle; - int ncoeff, twoncoeff, threencoeff, fourncoeff, fivencoeff, sixncoeff; - int ncoeffq, twoncoeffq, threencoeffq, fourncoeffq, fivencoeffq, sixncoeffq; + int ncoeff, nperdim; double **cutsq; class NeighList *list; double **snav; diff --git a/src/SNAP/pair_snap.cpp b/src/SNAP/pair_snap.cpp index 377235685cd0f052d2f51ab01967a63f6679707c..8714d55c5cb3dc532056330d2a674e2aa2629089 100644 --- a/src/SNAP/pair_snap.cpp +++ b/src/SNAP/pair_snap.cpp @@ -278,14 +278,15 @@ void PairSNAP::compute_regular(int eflag, int vflag) double bveci = snaptr->bvec[icoeff]; double fack = coeffi[k]*bveci; double* dbveci = snaptr->dbvec[icoeff]; - fij[0] += fack*snaptr->dbvec[icoeff][0]; - fij[1] += fack*snaptr->dbvec[icoeff][1]; - fij[2] += fack*snaptr->dbvec[icoeff][2]; + fij[0] += fack*dbveci[0]; + fij[1] += fack*dbveci[1]; + fij[2] += fack*dbveci[2]; k++; for (int jcoeff = icoeff+1; jcoeff < ncoeff; jcoeff++) { double facki = coeffi[k]*bveci; double fackj = coeffi[k]*snaptr->bvec[jcoeff]; double* dbvecj = snaptr->dbvec[jcoeff]; + fij[0] += facki*dbvecj[0]+fackj*dbveci[0]; fij[1] += facki*dbvecj[1]+fackj*dbveci[1]; fij[2] += facki*dbvecj[2]+fackj*dbveci[2]; @@ -1529,10 +1530,10 @@ void PairSNAP::coeff(int narg, char **arg) } if (comm->me == 0) - printf("ncoeff = %d snancoeff = %d \n",ncoeff,sna[0]->ncoeff); - if (ncoeff != sna[0]->ncoeff) { - error->all(FLERR,"Incorrect SNAP parameter file"); - } + if (ncoeff != sna[0]->ncoeff) { + printf("ncoeff = %d snancoeff = %d \n",ncoeff,sna[0]->ncoeff); + error->all(FLERR,"Incorrect SNAP parameter file"); + } // Calculate maximum cutoff for all elements diff --git a/src/SNAP/pair_snap.h b/src/SNAP/pair_snap.h index d39cb0f8d44a73b37ff5c4688b4c3f690e52f232..b60ab3c3e42657fba6fff2f316aa6e93aa5056a5 100644 --- a/src/SNAP/pair_snap.h +++ b/src/SNAP/pair_snap.h @@ -37,11 +37,8 @@ public: virtual double init_one(int, int); virtual double memory_usage(); - double rcutfac, quadraticflag; // declared public to workaround gcc 4.9 - int ncoeff; // compiler bug, manifest in KOKKOS package - protected: - int ncoeffq, ncoeffall; + int ncoeff, ncoeffq, ncoeffall; double **bvec, ***dbvec; class SNA** sna; int nmax; @@ -100,8 +97,8 @@ protected: double *wjelem; // elements weights double **coeffelem; // element bispectrum coefficients int *map; // mapping from atom types to elements - int twojmax, diagonalstyle, switchflag, bzeroflag; - double rfac0, rmin0, wj1, wj2; + int twojmax, diagonalstyle, switchflag, bzeroflag, quadraticflag; + double rcutfac, rfac0, rmin0, wj1, wj2; int rcutfacflag, twojmaxflag; // flags for required parameters };