@@ -19,6 +19,7 @@ while [[ "$#" -gt 0 ]]; do
1919 --log-dir) log_dir=" $2 " ; shift ;;
2020 --model-weights-parent-dir) model_weights_parent_dir=" $2 " ; shift ;;
2121 --pipeline-parallelism) pipeline_parallelism=" $2 " ; shift ;;
22+ --enforce-eager) enforce_eager=" $2 " ; shift ;;
2223 * ) echo " Unknown parameter passed: $1 " ; exit 1 ;;
2324 esac
2425 shift
5960 export PIPELINE_PARALLELISM=" False"
6061fi
6162
# Resolve the eager-execution switch: use the value captured from the
# --enforce-eager option when one was supplied, otherwise default to "False".
# The test quotes the bare expansion on purpose: padding inside the quotes
# (" $var ") yields a non-empty string even when the variable is unset, which
# would make the default branch unreachable.
if [[ -n "${enforce_eager:-}" ]]; then
  export ENFORCE_EAGER="$enforce_eager"
else
  export ENFORCE_EAGER="False"
fi
68+
6269# ================================= Set default environment variables ======================================
6370# Slurm job configuration
6471export JOB_NAME=" $MODEL_FAMILY -$MODEL_VARIANT "
6875mkdir -p $LOG_DIR
6976
7077# Model and entrypoint configuration. API Server URL (host, port) are set automatically based on the
71- # SLURM job and are written to the file specified at VLLM_BASE_URL_FILENAME
78+ # SLURM job
7279export SRC_DIR=" $( dirname " $0 " ) "
7380export MODEL_DIR=" ${SRC_DIR} /models/${MODEL_FAMILY} "
74- export VLLM_BASE_URL_FILENAME=" ${MODEL_DIR} /.${JOB_NAME} _url"
7581
7682# Variables specific to your working environment, below are examples for the Vector cluster
7783export VLLM_MODEL_WEIGHTS=" ${MODEL_WEIGHTS_PARENT_DIR} /${JOB_NAME} "
@@ -89,11 +95,6 @@ if [[ $fp16_partitions =~ $JOB_PARTITION ]]; then
8995 echo " Data type set to due to non-Ampere GPUs used: $VLLM_DATA_TYPE "
9096fi
9197
92- # Create a file to store the API server URL if it doesn't exist
93- if [ -f $VLLM_BASE_URL_FILENAME ]; then
94- touch $VLLM_BASE_URL_FILENAME
95- fi
96-
9798echo Job Name: $JOB_NAME
9899echo Partition: $JOB_PARTITION
99100echo Num Nodes: $NUM_NODES
@@ -105,6 +106,7 @@ echo Max Model Length: $VLLM_MAX_MODEL_LEN
105106echo Max Num Seqs: $VLLM_MAX_NUM_SEQS
106107echo Vocabulary Size: $VLLM_MAX_LOGPROBS
107108echo Pipeline Parallelism: $PIPELINE_PARALLELISM
109+ echo Enforce Eager: $ENFORCE_EAGER
108110echo Log Directory: $LOG_DIR
109111echo Model Weights Parent Directory: $MODEL_WEIGHTS_PARENT_DIR
110112
0 commit comments