[WIP] Implement multi-GPU support in BSSN RHS and add profiling for H2D/D2H transfers

This commit is contained in:
2026-02-28 01:21:45 +08:00
parent 724e9cd415
commit d94c31c5c4
2 changed files with 75 additions and 8 deletions

View File

@@ -42,4 +42,4 @@ CLINKER = mpiicpx
Cu = nvcc
CUDA_LIB_PATH = -L/usr/lib/cuda/lib64 -I/usr/include -I/usr/lib/cuda/include
#CUDA_APP_FLAGS = -c -g -O3 --ptxas-options=-v -arch compute_13 -code compute_13,sm_13 -Dfortran3 -Dnewc
CUDA_APP_FLAGS = -c -g -O3 --ptxas-options=-v -Dfortran3 -Dnewc -arch=sm_89
CUDA_APP_FLAGS = -c -g -O3 --ptxas-options=-v -Dfortran3 -Dnewc -arch=sm_80