55 lines
862 B
Bash
55 lines
862 B
Bash
#!/bin/bash
|
|
|
|
# ================================
|
|
# Choose the case to run.
|
|
# ================================
|
|
|
|
# Interleaved schedule options = [YES, NO].
|
|
INTERLEAVED=YES
|
|
|
|
# Batch size (global batch size) options = [12, 24, 36, ..., 60].
|
|
GBS=12
|
|
|
|
|
|
|
|
|
|
|
|
# Set interleaved schedule options.
|
|
if [ ${INTERLEAVED} == "YES" ]; then
|
|
MEGATRON_EXTRA_PARAMS="--activations-checkpoint-method uniform --num-layers-per-virtual-pipeline-stage 2 "
|
|
elif [ ${INTERLEAVED} == "NO" ]; then
|
|
MEGATRON_EXTRA_PARAMS="--activations-checkpoint-method uniform "
|
|
else
|
|
echo "Invalid configuration"
|
|
exit 1
|
|
fi
|
|
|
|
|
|
# Other params.
|
|
TP=8
|
|
PP=12
|
|
MBS=1
|
|
NLS=96
|
|
HS=12288
|
|
NAH=96
|
|
DDP=local
|
|
NNODES=12
|
|
|
|
|
|
# Name of the job.
|
|
export JOB_NAME=results_figure_12_interleaved_${INTERLEAVED}_batch_size_${GBS}
|
|
|
|
|
|
# Import the configs.
|
|
. `pwd`/CONFIG.sh
|
|
|
|
|
|
# Submit the job.
|
|
. `pwd`/SBATCH.sh
|
|
|
|
|
|
exit 0
|
|
|
|
|
|
|