Bug fix in long range integral, add tests

bytedance · Nov 21, 2024 · 78cfa1f · 78cfa1f
1 parent 19b7556
commit 78cfa1f
Show file tree

Hide file tree

Showing 3 changed files with 147 additions and 18 deletions.
diff --git a/gpu4pyscf/gto/tests/test_int1e_grids.py b/gpu4pyscf/gto/tests/test_int1e_grids.py
@@ -0,0 +1,123 @@
+# Copyright 2023 The GPU4PySCF Authors. All Rights Reserved.
+#
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import unittest
+import numpy as np
+import pyscf
+from pyscf import lib
+from gpu4pyscf.gto.moleintor import intor
+
+def setUpModule():
+    global mol_sph, mol_cart, grid_points, integral_threshold, density_contraction_threshold
+    atom = '''
+O	0.0000	0.7375	-0.0528
+O	0.0000	-0.7375	-0.0528
+H	0.8190	0.8170	0.4220
+H	-0.8190	-0.8170	0.4220
+'''
+    bas='def2-qzvpp'
+
+    mol_sph = pyscf.M(atom=atom, basis=bas, max_memory=32000)
+    mol_sph.output = '/dev/null'
+    mol_sph.verbose = 0
+    mol_sph.build()
+
+    mol_cart = pyscf.M(atom=atom, basis=bas, max_memory=32000, cart=True)
+    mol_cart.output = '/dev/null'
+    mol_cart.verbose = 0
+    mol_cart.build()
+
+    xs = np.arange(-2.01, 2.0, 0.5)
+    ys = np.arange(-2.02, 2.0, 0.5)
+    zs = np.arange(-2.03, 2.0, 0.5)
+    grid_points = lib.cartesian_prod([xs, ys, zs])
+
+    # All of the following thresholds bound the max value of the corresponding matrix / tensor.
+    integral_threshold = 1e-12
+    density_contraction_threshold = 1e-10
+
+def tearDownModule():
+    global mol_sph, mol_cart, grid_points
+    mol_sph.stdout.close()
+    mol_cart.stdout.close()
+    del mol_sph, mol_cart, grid_points
+
+class KnownValues(unittest.TestCase):
+    '''
+    known values are obtained by Q-Chem
+    '''
+    def test_int1e_grids_full_tensor_cart(self):
+        ref_int1e = mol_cart.intor('int1e_grids', grids=grid_points)
+        test_int1e = intor(mol_cart, 'int1e_grids', grid_points)
+        assert np.abs(ref_int1e - test_int1e).max() < integral_threshold
+
+    def test_int1e_grids_full_tensor_sph(self):
+        ref_int1e = mol_sph.intor('int1e_grids', grids=grid_points)
+        test_int1e = intor(mol_sph, 'int1e_grids', grid_points)
+        assert np.abs(ref_int1e - test_int1e).max() < integral_threshold
+
+    def test_int1e_grids_density_contracted_cart_symmetric(self):
+        np.random.seed(12345)
+        dm = np.random.uniform(-2.0, 2.0, (mol_cart.nao, mol_cart.nao))
+        dm = 0.5 * (dm + dm.T)
+        ref_int1e_dot_D = np.einsum('pij,ij->p', mol_cart.intor('int1e_grids', grids=grid_points), dm)
+        test_int1e_dot_D = intor(mol_cart, 'int1e_grids', grid_points, dm = dm)
+        assert np.abs(ref_int1e_dot_D - test_int1e_dot_D).max() < density_contraction_threshold
+
+    def test_int1e_grids_density_contracted_sph_symmetric(self):
+        np.random.seed(12346)
+        dm = np.random.uniform(-2.0, 2.0, (mol_sph.nao, mol_sph.nao))
+        dm = 0.5 * (dm + dm.T)
+        ref_int1e_dot_D = np.einsum('pij,ij->p', mol_sph.intor('int1e_grids', grids=grid_points), dm)
+        test_int1e_dot_D = intor(mol_sph, 'int1e_grids', grid_points, dm = dm)
+        assert np.abs(ref_int1e_dot_D - test_int1e_dot_D).max() < density_contraction_threshold
+
+    def test_int1e_grids_density_contracted_cart_asymmetric(self):
+        np.random.seed(12347)
+        dm = np.random.uniform(-2.0, 2.0, (mol_cart.nao, mol_cart.nao))
+        ref_int1e_dot_D = np.einsum('pij,ij->p', mol_cart.intor('int1e_grids', grids=grid_points), dm)
+        test_int1e_dot_D = intor(mol_cart, 'int1e_grids', grid_points, dm = dm)
+        assert np.abs(ref_int1e_dot_D - test_int1e_dot_D).max() < density_contraction_threshold
+
+    def test_int1e_grids_density_contracted_sph_asymmetric(self):
+        np.random.seed(12348)
+        dm = np.random.uniform(-2.0, 2.0, (mol_sph.nao, mol_sph.nao))
+        ref_int1e_dot_D = np.einsum('pij,ij->p', mol_sph.intor('int1e_grids', grids=grid_points), dm)
+        test_int1e_dot_D = intor(mol_sph, 'int1e_grids', grid_points, dm = dm)
+        assert np.abs(ref_int1e_dot_D - test_int1e_dot_D).max() < density_contraction_threshold
+
+    def test_int1e_grids_full_tensor_omega(self):
+        omega = 0.8
+        mol_sph_omega = mol_sph.copy()
+        mol_sph_omega.set_range_coulomb(omega)
+        ref_int1e = mol_sph_omega.intor('int1e_grids', grids=grid_points)
+        test_int1e = intor(mol_sph, 'int1e_grids', grid_points, omega = omega)
+        assert np.abs(ref_int1e - test_int1e).max() < integral_threshold
+
+    def test_int1e_grids_density_contracted_omega(self):
+        omega = 1.2
+        mol_sph_omega = mol_sph.copy()
+        mol_sph_omega.set_range_coulomb(omega)
+
+        np.random.seed(12349)
+        dm = np.random.uniform(-2.0, 2.0, (mol_sph.nao, mol_sph.nao))
+
+        ref_int1e_dot_D = np.einsum('pij,ij->p', mol_sph_omega.intor('int1e_grids', grids=grid_points), dm)
+        test_int1e_dot_D = intor(mol_sph, 'int1e_grids', grid_points, dm = dm, omega = omega)
+        assert np.abs(ref_int1e_dot_D - test_int1e_dot_D).max() < integral_threshold
+
+if __name__ == "__main__":
+    print("Full Tests for One Electron Coulomb Integrals")
+    unittest.main()
diff --git a/gpu4pyscf/lib/gint/g1e.cu b/gpu4pyscf/lib/gint/g1e.cu
@@ -44,10 +44,11 @@ static void GINTg1e(double* __restrict__ g, const double* __restrict__ grid_poin
     const double PCy = Py - Cy;
     const double PCz = Pz - Cz;
     double a0 = aij;
-    const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0;
+    const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+    const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
     a0 *= theta;
 
-    const double prefactor = 2.0 * M_PI / a0 * eij;
+    const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
     const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
     double uw[NROOTS * 2];
     GINTrys_root<NROOTS>(boys_input, uw);
@@ -77,8 +78,8 @@ static void GINTg1e(double* __restrict__ g, const double* __restrict__ grid_poin
         gz[i_root] = w[i_root];
 
         const double u2 = a0 * u[i_root];
-        const double t2 = u2 / (u2 + a0);
-        const double b10 = 0.5 / a0 * (1.0 - t2);
+        const double t2 = u2 / (u2 + aij);
+        const double b10 = 0.5 / aij * (1.0 - t2);
         const double c00x = PAx - t2 * PCx;
         const double c00y = PAy - t2 * PCy;
         const double c00z = PAz - t2 * PCz;
@@ -153,10 +154,11 @@ static void GINT_g1e_without_hrr(double* __restrict__ g, const double* __restric
     const double PCy = Py - Cy;
     const double PCz = Pz - Cz;
     double a0 = aij;
-    const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0;
+    const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+    const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
     a0 *= theta;
 
-    const double prefactor = 2.0 * M_PI / a0 * eij;
+    const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
     const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
     double uw[NROOTS * 2];
     GINTrys_root<NROOTS>(boys_input, uw);
@@ -186,8 +188,8 @@ static void GINT_g1e_without_hrr(double* __restrict__ g, const double* __restric
         gz[i_root] = w[i_root];
 
         const double u2 = a0 * u[i_root];
-        const double t2 = u2 / (u2 + a0);
-        const double b10 = 0.5 / a0 * (1.0 - t2);
+        const double t2 = u2 / (u2 + aij);
+        const double b10 = 0.5 / aij * (1.0 - t2);
         const double c00x = PAx - t2 * PCx;
         const double c00y = PAy - t2 * PCy;
         const double c00z = PAz - t2 * PCz;

diff --git a/gpu4pyscf/lib/gint/g1e_root_123.cu b/gpu4pyscf/lib/gint/g1e_root_123.cu
@@ -62,10 +62,11 @@ static void GINTfill_int3c1e_kernel00(double* output, const BasisProdOffsets off
         const double PCy = Py - Cy;
         const double PCz = Pz - Cz;
         double a0 = aij;
-        const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0; 
+        const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+        const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
         a0 *= theta;
 
-        const double prefactor = 2.0 * M_PI / a0 * eij;
+        const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
         const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
         double eri = prefactor;
         if (boys_input > 3.e-7) {
@@ -124,10 +125,11 @@ static void GINTfill_int3c1e_density_contracted_kernel00(double* output, const d
         const double PCy = Py - Cy;
         const double PCz = Pz - Cz;
         double a0 = aij;
-        const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0; 
+        const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+        const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
         a0 *= theta;
 
-        const double prefactor = 2.0 * M_PI / a0 * eij;
+        const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
         const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
         double eri = prefactor;
         if (boys_input > 3.e-7) {
@@ -197,11 +199,12 @@ static void GINTfill_int3c1e_kernel10(double* output, const BasisProdOffsets off
         const double PAy = Py - Ay;
         const double PAz = Pz - Az;
         double a0 = aij;
-        const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0; 
+        const double one_over_two_p = 0.5 / aij;
+        const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+        const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
         a0 *= theta;
-        const double one_over_two_p = 0.5 / a0;
 
-        const double prefactor = 2.0 * M_PI / a0 * eij;
+        const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
         const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
         double eri_x = prefactor;
         double eri_y = prefactor;
@@ -282,11 +285,12 @@ static void GINTfill_int3c1e_density_contracted_kernel10(double* output, const d
         const double PAy = Py - Ay;
         const double PAz = Pz - Az;
         double a0 = aij;
-        const double theta = omega > 0.0 ? omega * omega / (omega * omega + a0) : 1.0; 
+        const double one_over_two_p = 0.5 / aij;
+        const double theta = omega > 0.0 ? omega * omega / (omega * omega + aij) : 1.0;
+        const double sqrt_theta = omega > 0.0 ? omega / sqrt(omega * omega + aij) : 1.0;
         a0 *= theta;
-        const double one_over_two_p = 0.5 / a0;
 
-        const double prefactor = 2.0 * M_PI / a0 * eij;
+        const double prefactor = 2.0 * M_PI / aij * eij * sqrt_theta;
         const double boys_input = a0 * (PCx * PCx + PCy * PCy + PCz * PCz);
         double eri_x = prefactor;
         double eri_y = prefactor;