File: nvshmem_run_6node.sh

package info (click to toggle)
superlu-dist 9.2.1%2Bdfsg1-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 16,292 kB
  • sloc: ansic: 172,999; cpp: 7,262; sh: 5,677; f90: 854; python: 563; makefile: 458; fortran: 51; csh: 9
file content (62 lines) | stat: -rw-r--r-- 3,494 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#!/bin/bash
#BSUB -P BIF115
#BSUB -W 00:10
#BSUB -nnodes 6
#BSUB -alloc_flags gpumps
#BSUB -J superlu_gpu

EXIT_SUCCESS=0
EXIT_HOST=1
EXIT_PARAM=2

CUR_DIR=`pwd`
FILE_DIR=$CUR_DIR/EXAMPLE
INPUT_DIR=$MEMBERWORK/csc289/matrix
FILE_NAME=pddrive
FILE=$FILE_DIR/$FILE_NAME
#CPDIR=/autofs/nccs-svm1_home1/nanding/myproject/superLU/pm/superlu_dist/build_nvshmem280_cuda1103_0127/EXAMPLE
#CPDIR=/autofs/nccs-svm1_home1/nanding/myproject/superLU/pm/superlu_dist/build_nvshmem270_cuda_11013/EXAMPLE
#cp $CPDIR/pddrive $CUR_DIR/EXAMPLE/ -rfv

export NVSHMEM_MPI_LIB_NAME=libmpi_ibm.so
export NVSHMEM_LMPI=-lmpi_ibm
## export NVSHMEM_HCA_PE_MAPPIN  maybe??
nprows=(6)
npcols=(1)  
# MAT=s1_mat_0_126936.bin #Goodwin_127.mtx #A30_015_0_25356.bin #big.rua #s1_mat_0_126936.bin
MAT=Li4244.bin
#(s1_mat_0_126936.bin s1_mat_0_253872.bin Li4244.bin DG_GrapheneDisorder_8192.bin LU_C_BN_C_2by2.bin) #s1_mat_0_253872.bin) #s1_mat_0_507744.bin Li4244.bin DG_GrapheneDisorder_8192.bin LU_C_BN_C_2by2.bin) #Li4244.bin s1_mat_0_253872.bin) 
#matrix=(DG_GrapheneDisorder_8192.bin) #DG_GrapheneDisorder_8192.bin LU_C_BN_C_2by2.bin) #Li4244.bin s1_mat_0_253872.bin) 
##matrix=(g20.rua) #s1_mat_0_126936.bin) #s1_mat_0_507744.bin Li4244.bin LU_C_BN_C_2by2.bin DG_GrapheneDisorder_8192.bin) #DG_GrapheneDisorder_8192.bin LU_C_BN_C_2by2.bin) #Li4244.bin s1_mat_0_253872.bin) 
#matrix=(Li4244.bin s1_mat_0_253872.bin) #DG_GrapheneDisorder_8192.bin LU_C_BN_C_2by2.bin) #Li4244.bin s1_mat_0_253872.bin) 
#export NVSHMEM_HOME=/ccs/home/nanding/mysoftware/nvshmem270_gdr23_cuda1102_11232022/ 
#export NVSHMEM_HOME=/ccs/home/nanding/mysoftware/nvshmem280_gdr23_cuda1102_20230131 
export NVSHMEM_HOME=/ccs/home/nanding/mysoftware/nvshmem280_gdr23_cuda1103_20230127/ 
export LD_LIBRARY_PATH=$NVSHMEM_HOME/lib:$LD_LIBRARY_PATH
#export NVSHMEM_BOOTSTRAP_TWO_STAGE=1
#export NVSHMEM_BOOTSTRAP=MPI
export NSUP=256 
#export NREL=256
export MAX_BUFFER_SIZE=5000000000
export OMP_NUM_THREADS=1

export SUPERLU_ACC_SOLVE=1

#jsrun -n6 -g1 -a1  -c2 ./mpi-based-init |& tee log_nvshmem_2GPU_1NODE
#jsrun -n6 -a1 -c42 -g1 ./mpi-based-init |& tee log_nvshmem_2GPU_6NODE 
mkdir -p ${MAT}_summit
for i in {1..1}
do
MYDATE=$(date '+%Y-%m-%d-%H-%M-%S')
#jsrun -n6 -a1 -c42  -g1  $FILE_DIR/pddrive  -c 1 -r 1 -b 1 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/batch_SLU.o_mpi_1x1_OMP_${OMP_NUM_THREADS}_GPU_1_6NODE_${MYDATE}
#jsrun -n6 -g1 -a1 -c2  $FILE_DIR/pddrive  -c 1 -r 1 -b 1 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/batch_SLU.o_mpi_1x1_OMP_${OMP_NUM_THREADS}_GPU_1_1NODE_${MYDATE}
jsrun -n6 -a1 -c42 -g1  $FILE_DIR/pddrive  -c 1 -r 6 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/SLU.o_mpi_6x1_OMP_${OMP_NUM_THREADS}_GPU_6_6NODE_${MYDATE}
jsrun -n6 -g1 -a1 -c2  $FILE_DIR/pddrive  -c 1 -r 6 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/SLU.o_mpi_6x1_OMP_${OMP_NUM_THREADS}_GPU_6_1NODE_${MYDATE}
done
#MYDATE=$(date '+%Y-%m-%d-%H-%M-%S')
#export NVSHMEM_DEBUG=1
##jsrun -n6 -a1 -c42 -g1 ./mpi-based-init |& tee log_nvshmem_2GPU_6NODE 
##jsrun -n6 -g1 -a1  -c2 ./mpi-based-init |& tee log_nvshmem_2GPU_1NODE
#jsrun -n6 -a1 -c42  -g1  $FILE_DIR/pddrive  -c 1 -r 6 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/SLU.o_mpi_6x1_OMP_${OMP_NUM_THREADS}_GPU_6_6NODE_${MYDATE}
##jsrun -n2 -g3 -a3 -c42  $FILE_DIR/pddrive  -c 1 -r 6 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/SLU.o_mpi_6x1_OMP_${OMP_NUM_THREADS}_GPU_6_2NODE_${MYDATE}
#jsrun -n6 -g1 -a1 -c2  $FILE_DIR/pddrive  -c 1 -r 6 $INPUT_DIR/$MAT |& tee ./${MAT}_summit/SLU.o_mpi_6x1_OMP_${OMP_NUM_THREADS}_GPU_6_1NODE_${MYDATE}