Skip to content
Snippets Groups Projects
Commit a3a79111 authored by Chelsea Maria John
Browse files

Merge branch 'master' into 'main'

Master

See merge request !3
parents bb3ef5fe 3a49d3e0
Branches
No related tags found
1 merge request: !3 Master
#!/bin/bash #!/bin/bash
#SBATCH --account=opengptx-elm #SBATCH --account=opengptx-elm
#SBATCH --partition=booster #SBATCH --partition=booster
#SBATCH --job-name=opt175b #SBATCH --job-name=opt125m_test
#SBATCH --nodes=48 #SBATCH --nodes=4
#SBATCH --hint=nomultithread #SBATCH --hint=nomultithread
#SBATCH --ntasks-per-node=4 #SBATCH --ntasks-per-node=4
#SBATCH --cpus-per-task=12 # number of cores per tasks #SBATCH --cpus-per-task=12 # number of cores per tasks
#SBATCH --gres=gpu:4 # number of gpus #SBATCH --gres=gpu:4 # number of gpus
#SBATCH --time=00:15:00 # maximum execution time (HH:MM:SS) #SBATCH --time=00:10:00 # maximum execution time (HH:MM:SS)
#SBATCH --output=slurmLog/%x-%j.out # output file name #SBATCH --output=slurmLog/%x-%j.out # output file name
#SBATCH --error=slurmLog/%x-%j.err # error file name #SBATCH --error=slurmLog/%x-%j.err # error file name
...@@ -25,7 +25,7 @@ opt-baselines -n "$SLURM_NNODES" -g 4 \ ...@@ -25,7 +25,7 @@ opt-baselines -n "$SLURM_NNODES" -g 4 \
--account opengptx-elm \ --account opengptx-elm \
--partition booster \ --partition booster \
--prefix "$SLURM_JOB_NAME" \ --prefix "$SLURM_JOB_NAME" \
--model-size 175b \ --model-size 125m \
--juwelsbooster \ --juwelsbooster \
--data "$DATA_PATH" \ --data "$DATA_PATH" \
--ntasks-per-node 4 \ --ntasks-per-node 4 \
...@@ -34,7 +34,7 @@ opt-baselines -n "$SLURM_NNODES" -g 4 \ ...@@ -34,7 +34,7 @@ opt-baselines -n "$SLURM_NNODES" -g 4 \
--tensorboard-logdir "$TENSORBOARD_PATH" \ --tensorboard-logdir "$TENSORBOARD_PATH" \
--no-save-dir \ --no-save-dir \
--snapshot-root "$ROOT_OUTPUT_DIR" \ --snapshot-root "$ROOT_OUTPUT_DIR" \
--time 15 \ --time 10 \
--no-wandb \ --no-wandb \
--cpu-bind socket \ --cpu-bind socket \
--salloc --salloc
......
...@@ -32,6 +32,9 @@ source activate.bash ...@@ -32,6 +32,9 @@ source activate.bash
python -m pip install --upgrade pip python -m pip install --upgrade pip
# Requires numpy 1.22.0
python -m pip install numpy==1.22.0
#Installing PyTorch 1.10.1 version with cuda 11.3 used by metaseq #Installing PyTorch 1.10.1 version with cuda 11.3 used by metaseq
# python -m pip install torch==1.10.1+cu113 torchvision==0.11.2+cu113 torchaudio==0.10.1+cu113 -f https://download.pytorch.org/whl/cu113/torch_stable.html # python -m pip install torch==1.10.1+cu113 torchvision==0.11.2+cu113 torchaudio==0.10.1+cu113 -f https://download.pytorch.org/whl/cu113/torch_stable.html
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment