Skip to content

Commit

Permalink
update build/run scripts due to the recent merge from master
Browse files Browse the repository at this point in the history
  • Loading branch information
liuyangzhuan committed Oct 5, 2022
1 parent 6bbb32f commit 73d8a63
Show file tree
Hide file tree
Showing 3 changed files with 18 additions and 48 deletions.
20 changes: 0 additions & 20 deletions CMakeLists.txt.orig
Original file line number Diff line number Diff line change
Expand Up @@ -178,25 +178,6 @@ if (TPL_ENABLE_CUDALIB) ## want to use cuda
message("-- Enabled support for CUDA.")
enable_language(CUDA)
find_package(CUDA REQUIRED)
<<<<<<< HEAD
# if (NOT CMAKE_CUDA_FLAGS)
# cuda_select_nvcc_arch_flags(CUDA_ARCH_FLAGS Auto)
# message("-- Cuda Flags : '${CUDA_ARCH_FLAGS}'")
# endif()
# if (CUDA_FOUND)
# if (NOT CMAKE_CUDA_FLAGS)
# cuda_select_nvcc_arch_flags(CUDA_ARCH_FLAGS Auto)
# message("-- Cuda Flags : '${CUDA_ARCH_FLAGS}'")
# endif()
# set(CUDA_NVCC_FLAGS_RELEASE "-O3 --expt-relaxed-constexpr -DNDEBUG -g ${CMAKE_CUDA_FLAGS} ${CUDA_ARCH_FLAGS}")
# set(CUDA_NVCC_FLAGS_DEBUG "-O0 --expt-relaxed-constexpr -DDEBUG -g -G ${CMAKE_CUDA_FLAGS} ${CUDA_ARCH_FLAGS}")
# list(APPEND CMAKE_CUDA_FLAGS ${CUDA_ARCH_FLAGS})
# message("-- Cuda Flags : '${CMAKE_CUDA_FLAGS}'")
# endif()
# # find_package(CUDAToolkit REQUIRED)

message("-- Cuda libraries at : '${CUDA_LIBRARIES}'")
=======
if (CUDA_FOUND)
if (NOT CMAKE_CUDA_FLAGS)
cuda_select_nvcc_arch_flags(CUDA_ARCH_FLAGS Auto)
Expand All @@ -206,7 +187,6 @@ if (TPL_ENABLE_CUDALIB) ## want to use cuda
set(CMAKE_CUDA_FLAGS_DDEBUG "-O0 --expt-relaxed-constexpr -DDEBUG -g" CACHE STRING "")
endif()

>>>>>>> 1a6d5bad87736c9e6f53530a63dce79856ecd76c
# find_package(CUB REQUIRED)

find_package(CUDAToolkit REQUIRED)
Expand Down
23 changes: 14 additions & 9 deletions example_scripts/batch_script_mpi_runit_cori_gpu_openmpi4.sh
Original file line number Diff line number Diff line change
Expand Up @@ -10,31 +10,36 @@ module load cuda/11.1.1
module load openmpi/4.0.3
module load nsight-systems

export OMP_NUM_THREADS=5
export NUM_GPU_STREAMS=1
export SUPERLU_ACC_OFFLOAD=1
export OMP_NUM_THREADS=1
export MAX_BUFFER_SIZE=50000000
export SUPERLU_NUM_GPU_STREAMS=1
export SUPERLU_BIND_MPI_GPU=1
export SUPERLU_ACC_OFFLOAD=1 # this can be 0 to do CPU tests on GPU nodes
export GPU3DVERSION=1

# srun -n 1 ./EXAMPLE/pddrive -r 1 -c 1 ../EXAMPLE/g20.rua
DIR=$CFS/ntrain9/YangLiu/matrix

export NSUP=128
export NREL=20
# export NSUP=128
# export NREL=20
# export NSUP=256
# export NREL=256
# for MAT in big.rua
# for MAT in g4.rua
# for MAT in g20.rua
# for MAT in s1_mat_0_253872.bin
for MAT in s1_mat_0_126936.bin
# for MAT in torso3.mtx
# for MAT in Graphene2880/H.mtx
# for MAT in s1_mat_0_126936.bin s1_mat_0_253872.bin s1_mat_0_507744.bin
# for MAT in matrix_ACTIVSg70k_AC_00.mtx matrix_ACTIVSg10k_AC_00.mtx
for MAT in temp_13k.mtx temp_25k.mtx temp_75k.mtx
# for MAT in temp_13k.mtx temp_25k.mtx temp_75k.mtx
do
# srun -n 1 nsys profile --stats=true ./EXAMPLE/pddrive -r 1 -c 1 ../../matrix/$MAT
# srun -n 1 ncu -k dlsum_bmod_inv_gpu_mrhs,dlsum_fmod_inv_gpu_mrhs --launch-count 1 --target-processes all ./EXAMPLE/pddrive -r 1 -c 1 ../../matrix/$MAT
# srun -n 1 ncu -f -k dlsum_bmod_inv_gpu_mrhs --set full --launch-count 1 --target-processes all -o trisolve_u ./EXAMPLE/pddrive -r 1 -c 1 ../../matrix/$MAT
# srun -n 1 ncu -f -k dlsum_fmod_inv_gpu_mrhs --set full --launch-count 1 --target-processes all -o trisolve_l "/project/projectdirs/m2957/liuyangz/my_research/superlu_dist_amd_mergefrom_master_12_01_2021/build/EXAMPLE/pddrive" -r 1 -c 1 ../../matrix/$MAT
srun -n 1 ./EXAMPLE/pddrive -r 1 -c 1 $DIR/$MAT
# srun -n 1 ./EXAMPLE/pddrive3d -r 1 -c 1 -d 1 $DIR/$MAT
srun -n 1 ./EXAMPLE/pddrive3d -r 1 -c 1 -d 1 $DIR/$MAT
# srun -n 1 ./EXAMPLE/pddrive3d -r 1 -c 1 -d 1 ../EXAMPLE/big.rua
# srun -n 1 ./EXAMPLE/pddrive -r 1 -c 1 $DIR/$MAT
done

23 changes: 4 additions & 19 deletions example_scripts/run_cmake_build_cori_gpu_openmpi4.sh
Original file line number Diff line number Diff line change
@@ -1,23 +1,18 @@
#!/bin/bash
# Bash script to submit many files to Cori/Edison/Queue
module unload cray-mpich
module swap PrgEnv-intel PrgEnv-gnu
module purge
export MKLROOT=/opt/intel/compilers_and_libraries_2019.3.199/linux/mkl
export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/opt/intel/compilers_and_libraries_2019.3.199/linux/mkl/lib/intel64

# module use /global/common/software/m3169/cori/modulefiles
# module unload openmpi
module unload cmake
module load cmake

# module load cudatoolkit
module load cgpu
<<<<<<< HEAD
module load cuda/10.2.89
=======
module load cuda/11.1.1
module swap gcc gcc/8.3.0
>>>>>>> master
module load gcc/8.3.0
module load openmpi/4.0.3
module load cmake/3.22.1
# module load cuda
# module load openmpi

Expand Down Expand Up @@ -50,12 +45,10 @@ rm -rf DartConfiguration.tcl
# -DCMAKE_CUDA_FLAGS="--disable-warnings -DPRNTlevel=1 -DPROFlevel=0 -DDEBUGlevel=0 -gencode arch=compute_70,code=sm_70 -I/usr/common/software/openmpi/4.0.3/gcc/8.3.0/cuda/10.2.89/include"



cmake .. \
-DCMAKE_BUILD_TYPE=Debug\
-Denable_complex16=OFF\
-DCMAKE_VERBOSE_MAKEFILE:BOOL=ON \
<<<<<<< HEAD
-DCMAKE_C_COMPILER=mpicc \
-DCMAKE_CXX_COMPILER=mpic++ \
-DCMAKE_Fortran_COMPILER=mpif90 \
Expand Down Expand Up @@ -97,14 +90,6 @@ cmake .. \
make pddrive
make pddrive3d

=======
-DCMAKE_CXX_FLAGS="-Ofast -DRELEASE ${INC_VTUNE} -I${CUDA_ROOT}/include" \
-DCMAKE_C_FLAGS="-DGPU_SOLVE -std=c11 -DPRNTlevel=1 -DPROFlevel=0 -DDEBUGlevel=0 ${INC_VTUNE} -I${CUDA_ROOT}/include" \
-DCMAKE_CUDA_FLAGS="-lineinfo --disable-warnings -DPRNTlevel=1 -DPROFlevel=0 -DDEBUGlevel=0 -gencode arch=compute_70,code=sm_70 -I/usr/common/software/openmpi/4.0.3/gcc/8.3.0/cuda/10.2.89/include"
make pddrive
make pddrive3d
# make install
>>>>>>> master
# -DTPL_BLAS_LIBRARIES="/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_intel_lp64.so;/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_sequential.so;/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_core.so"

# -DTPL_BLAS_LIBRARIES="/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_intel_lp64.so;/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_sequential.so;/opt/intel/compilers_and_libraries_2017.2.174/linux/mkl/lib/intel64/libmkl_core.so" \
Expand Down

0 comments on commit 73d8a63

Please sign in to comment.