-
Notifications
You must be signed in to change notification settings - Fork 0
/
train_hf.sh
29 lines (23 loc) · 690 Bytes
/
train_hf.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
#!/bin/bash
# Slurm batch script that launches src/training/run_train_hf.py.
# The paths set further down are relative (./../..), so the job has to be
# submitted from a directory two levels below the repository root.
#
# All #SBATCH directives must stay above the first executable command.
#
# Wall-clock limit in Slurm's days-hours:minutes form (3 days).
#SBATCH --time=3-0:00
#SBATCH --job-name=sbatch
# Pin the job to one specific node.
#SBATCH --nodelist=allegro-adams
# %j is replaced by the job ID.
# NOTE(review): Slurm presumably does not create slurm_out/ on its own -
# confirm the directory exists in the submit directory before submitting.
#SBATCH --output=slurm_out/out_%j.txt
# One GPU of type a6000.
#SBATCH --gres="gpu:a6000:1"
# NOTE(review): this requests 16 tasks, yet the script starts a single python
# process; --cpus-per-task=16 may have been intended - confirm.
#SBATCH --ntasks=16
# Strict mode, enabled before anything else runs:
#   -e           exit as soon as a command fails
#   -u           treat a reference to an unset variable as an error, so a
#                misspelled name in the editable section below cannot silently
#                expand to an empty path
#   -o pipefail  a pipeline fails if any of its stages fails
set -euo pipefail

# Repository layout. ROOT_DIR is relative to the current working directory,
# i.e. the directory the job was submitted from.
ROOT_DIR="./../.."
NEOX_DIR="${ROOT_DIR}/gpt-neox"
DATA_DIR="${ROOT_DIR}/data"
MODEL_DIR="${ROOT_DIR}/models"
CONFIG_DIR="${ROOT_DIR}/configs"
SRC_DIR="${ROOT_DIR}/src"

# Put the repository root on Python's module search path for child processes.
export PYTHONPATH="${ROOT_DIR}"
### START EDITING HERE ###
# Name of the run configuration; it selects the YAML file under
# ${CONFIG_DIR}/training/ and is also passed to the training script as --mode.
mode="train_hf_configs"
config_file="${CONFIG_DIR}/training/${mode}.yaml"

# Exported so that the python process started below inherits it; a plain
# assignment would stay local to this shell.
# NOTE(review): presumably consumed by the wandb client as the project name -
# confirm against the training code.
export WANDB_PROJECT=decouple

# CUDA_VISIBLE_DEVICES=0 exposes only device 0 to the process.
# NOTE(review): CUDA_LAUNCH_BLOCKING=1 is normally a debugging aid that makes
# kernel launches synchronous and slows training - confirm it is still wanted.
#
# Each continuation line keeps a space before the trailing backslash.
# Backslash-newline is removed without inserting a separator, so without that
# space the script path and the options would fuse into a single word.
CUDA_LAUNCH_BLOCKING=1 CUDA_VISIBLE_DEVICES=0 \
  python "${SRC_DIR}/training/run_train_hf.py" \
  --mode="${mode}" \
  --config_file="${config_file}"