Skip to content

Commit 554587e

Browse files
committed
Gadi singularity modifications
* Fixing the weak scaling to use the right number for ncpu decomposition * Adding gadi_container_go.sh
1 parent 685c8d3 commit 554587e

File tree

4 files changed

+21
-9
lines changed

4 files changed

+21
-9
lines changed

gadi_baremetal_go.sh

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,11 @@
11
#!/bin/bash
22

3-
# the following loads the full software stack and running environment on gadi
4-
source /g/data/m18/codes/UWGeodynamics_2.10.sh
3+
module load petsc/3.21.3 python3/3.11.7 openmpi/4.1.7 python3-as-python hdf5/1.12.2p
4+
5+
UWENV=/g/data/m18/software/venv/uw216 # Project directory
6+
export PATH=${UWENV}/bin:$PATH
7+
export PYTHONPATH=${UWENV}/lib/python3.11/site-packages/:$PYTHONPATH
8+
59
env
610
cat timed_model.py
711

gadi_container_go.sh

Lines changed: 9 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -5,15 +5,21 @@ module load singularity
55
module load openmpi/4.1.4
66

77

8-
export singularityDir=/g/data/m18/software/underworld/
8+
#export singularityDir=/home/565/jug565/scratch_m18/
9+
export singularityDir=/scratch/m18/jug565/codes/
910

1011
# Define the container to use
11-
export containerImage=$singularityDir/underworld-215.sif
12+
#export containerImage=$singularityDir/underworld-215.sif
13+
export containerImage=$singularityDir/uw-rhel.sif
1214

1315
env
1416
cat timed_model.py
1517
echo ""
1618
echo "---------- Running Job ----------"
1719
echo ""
1820
export TIME_LAUNCH_MPI=`date +%s%N | cut -b1-13`
19-
mpiexec -n $PBS_NCPUS singularity exec $containerImage bash -c "TIME_LAUNCH_PYTHON=\`date +%s%N | cut -b1-13\` python3 timed_model.py"
21+
#$PBS_NCPUS vs $NTASKS
22+
mpiexec -n $NTASKS singularity exec -B /opt/pbs/default/lib/,/half-root/ --bind /lib64:/glib64 \
23+
$containerImage \
24+
bash -c "TIME_LAUNCH_PYTHON=\`date +%s%N | cut -b1-13\` LD_LIBRARY_PATH=/apps/openmpi/4.1.4/lib:/glib64:$LD_LIBRARY_PATH python3 timed_model.py"
25+
#mpiexec -n $PBS_NCPUS singularity exec $containerImage bash -c "TIME_LAUNCH_PYTHON=\`date +%s%N | cut -b1-13\` LD_LIBRARY_PATH=/apps/openmpi/4.1.4/lib:$LD_LIBRARY_PATH python3 timed_model.py"

params.sh

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1,15 +1,16 @@
11
#!/bin/bash
2-
export JOBS="1 2 4 6 8"
3-
#export JOBS="1 2 4 6 8 10 12 14 16 18 20 22"
2+
#export JOBS="1 2 3"
3+
#export JOBS="8 10 12"
4+
export JOBS="1 2 3 4 5 6 8 10 12 14 18"
45
#export JOBS="22 22"
5-
export UW_NAME="2.15.0_WeakScaling"
6+
export UW_NAME="UW216-container"
67
export SCALING_TYPE=1 # 1=weak, 2=strong
78

89
export UW_MODEL="SolDB3d" # "SolDB3d" for dim3, though penalty method probably needed for q1.
910
export PICKLENAME=None #"SolDB3d_Gadi_1e-11.pickle" #"conv_test_results_high_res_tighter_take2.pickle" # set to "None" to disable conv testing
1011
export UW_ENABLE_IO="0"
1112

12-
export WALLTIME="00:10:00"
13+
export WALLTIME="00:15:00"
1314
export ACCOUNT="m18"
1415
export QUEUE="normal" # normal or express
1516

scaling_test_job_launcher.sh

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,6 +46,7 @@ do
4646
# memory requirement guess: 3GB * nprocs
4747
MEMORY="$((3*${PBSTASKS}))GB"
4848
CMD="qsub -v ${EXPORTVARS} -N ${NAME} -l storage=gdata/m18+gdata/q97,ncpus=${PBSTASKS},mem=${MEMORY},walltime=${WALLTIME},wd -P ${ACCOUNT} -q ${QUEUE} gadi_container_go.sh"
49+
#CMD="qsub -v ${EXPORTVARS} -N ${NAME} -l storage=gdata/m18+gdata/q97,ncpus=${PBSTASKS},mem=${MEMORY},walltime=${WALLTIME},wd -P ${ACCOUNT} -q ${QUEUE} gadi_baremetal_go.sh"
4950
echo ${CMD}
5051
${CMD}
5152
else

0 commit comments

Comments
 (0)