Skip to content

Commit 9e1e800

Browse files
sunqm and Qiming Sun authored
GPU kernels for PBC overlap integrals (#456)
* Add overlap integral kernel
* Add ipovlp and ipkin kernels
* cleanup int1e
* Replace ovlp and kin integrals in pbc.scf and pbc.grad
* Fix pbc int1e interface
* Fix lattice sum range and other bugs
* Fix np and cp compatibility

---------

Co-authored-by: Qiming Sun <qiming.sun@bytedance.com>
1 parent 2372270 commit 9e1e800

File tree

16 files changed

+1339
-19
lines changed

16 files changed

+1339
-19
lines changed

gpu4pyscf/lib/pbc/CMakeLists.txt

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@ set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --ptxas-options=-v")# -maxrregcount=12
3 3   add_library(pbc SHARED
4 4   pbc_driver.cu ft_ao.cu unrolled_ft_ao.cu ft_ao_bdiv.cu
5 5   fill_int3c2e.cu unrolled_int3c2e.cu fill_int2c2e.cu
  6 + overlap.cu
6 7   estimator.cu
7 8   rys_roots_dat.cu
8 9   nr_eval_gto.cu

gpu4pyscf/lib/pbc/fill_int2c2e.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -57,7 +57,7 @@ void pbc_int2c2e_kernel(double *out, PBCIntEnvVars envs, PBCInt2c2eBounds bounds
57 57   double *env = envs.env;
58 58   double *img_coords = envs.img_coords;
59 59
60    - int gout_stride = bounds.gout_stride_lookup[lj*L_AUX1+li];
   60 + int gout_stride = bounds.gout_stride_lookup[li*L_AUX1+lj];
61 61   int nsp_per_block = THREADS / gout_stride;
62 62   int sp_id = thread_id % nsp_per_block;
63 63   int gout_id = thread_id / nsp_per_block;

0 commit comments

Comments
 (0)