Skip to content
GitLab
Projects
Groups
Snippets
/
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in
Toggle navigation
Menu
Open sidebar
esde
machine-learning
AMBS
Commits
ab931c26
Commit
ab931c26
authored
Jul 22, 2022
by
Bing Gong
Browse files
delete moving HPC template
parent
c8a97008
Pipeline
#106915
failed with stages
in 26 seconds
Changes
3
Pipelines
2
Hide whitespace changes
Inline
Side-by-side
video_prediction_tools/HPC_scripts/preprocess_data_moving_mnist_template.sh
deleted
100644 → 0
View file @
c8a97008
#!/bin/bash -x
#SBATCH --account=<your_project>
#SBATCH --nodes=1
#SBATCH --ntasks=1
##SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=1
#SBATCH --output=DataPreprocess_moving_mnist-out.%j
#SBATCH --error=DataPreprocess_moving_mnist-err.%j
#SBATCH --time=04:00:00
#SBATCH --partition=batch
#SBATCH --mail-type=ALL
#SBATCH --mail-user=me@somewhere.com

# Slurm batch template: runs ../video_prediction/datasets/moving_mnist.py
# through srun inside a Singularity container, passing source_dir and
# destination_dir as positional arguments.
# The guard right below prints a warning and exits with status 99, so the
# template itself never reaches the job steps further down.

######### Template identifier (don't remove) #########
echo "Do not run the template scripts"
exit 99
######### Template identifier (don't remove) #########

# auxiliary variables
# CONTAINER_IMG and WRAPPER below are derived from WORK_DIR and BASE_DIR, so
# both must be set before that point. Values already present in the
# environment are kept; otherwise the current directory and its parent are used.
WORK_DIR="${WORK_DIR:-$(pwd)}"
BASE_DIR="${BASE_DIR:-$(dirname "${WORK_DIR}")}"

# Name of virtual environment
VIRT_ENV_NAME="my_venv"

# !!! ADAPT DEPENDING ON USAGE OF CONTAINER !!!
# For container usage, keep the following lines enabled
# Name of container image (must be available in working directory)
CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif"
WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh"

# sanity checks: abort with status 1 if the image or the wrapper is missing
if [[ ! -f "${CONTAINER_IMG}" ]]; then
  echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'."
  exit 1
fi
if [[ ! -f "${WRAPPER}" ]]; then
  echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image."
  exit 1
fi

# clean-up modules to avoid conflicts between host and container settings
module purge

# declare directory-variables which will be modified by generate_runscript.py
# (assignments intentionally left in their plain, unquoted form)
source_dir=/my/path/to/mnist/raw/data/
destination_dir=/my/path/to/mnist/tfrecords/

# run Preprocessing (step 2 where Tf-records are generated)
# NOTE(review): the job requests --partition=batch and no --gres=gpu, yet a
# GPU is selected here and singularity is started with --nv -- confirm intent.
export CUDA_VISIBLE_DEVICES=0
## One node, single GPU
srun --mpi=pspmix --cpu-bind=none \
     singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" "${VIRT_ENV_NAME}" \
     python3 ../video_prediction/datasets/moving_mnist.py "${source_dir}" "${destination_dir}"

# WITHOUT container usage, enable the following lines (and comment out the container-based lines above)
# Activate virtual environment if needed (and possible)
#if [[ -z "${VIRTUAL_ENV}" ]]; then
#   if [[ -f "../virtual_envs/${VIRT_ENV_NAME}/bin/activate" ]]; then
#      echo "Activating virtual environment..."
#      source "../virtual_envs/${VIRT_ENV_NAME}/bin/activate"
#   else
#      echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..."
#      exit 1
#   fi
#fi
#
# Loading modules
#module purge
#source ../env_setup/modules_train.sh
#export CUDA_VISIBLE_DEVICES=0
#
# srun python3 ../video_prediction/datasets/moving_mnist.py "${source_dir}" "${destination_dir}"
\ No newline at end of file
video_prediction_tools/HPC_scripts/train_model_moving_mnist_template.sh
deleted
100755 → 0
View file @
c8a97008
#!/bin/bash -x
#SBATCH --account=<your_project>
#SBATCH --nodes=1
#SBATCH --ntasks=1
##SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=1
#SBATCH --output=train_moving_mnist-out.%j
#SBATCH --error=train_moving_mnist-err.%j
#SBATCH --time=00:20:00
#SBATCH --gres=gpu:1
#SBATCH --partition=gpus
#SBATCH --mail-type=ALL
#SBATCH --mail-user=me@somewhere.com

# Slurm batch template: runs ../main_scripts/train.py through srun inside a
# Singularity container. The output directory is extended with the model name
# and a "<timestamp>_<user>" suffix before the run starts.
# The guard right below prints a warning and exits with status 99, so the
# template itself never reaches the job steps further down.

######### Template identifier (don't remove) #########
echo "Do not run the template scripts"
exit 99
######### Template identifier (don't remove) #########

# auxiliary variables
WORK_DIR="$(pwd)"
BASE_DIR="$(dirname "${WORK_DIR}")"

# Name of virtual environment
VIRT_ENV_NAME="my_venv"

# !!! ADAPT DEPENDING ON USAGE OF CONTAINER !!!
# For container usage, keep the following lines enabled
# Name of container image (must be available in working directory)
CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif"
WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh"

# sanity checks: abort with status 1 if the image or the wrapper is missing
if [[ ! -f "${CONTAINER_IMG}" ]]; then
  echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'."
  exit 1
fi
if [[ ! -f "${WRAPPER}" ]]; then
  echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image."
  exit 1
fi

# clean-up modules to avoid conflicts between host and container settings
module purge

# declare directory-variables which will be modified appropriately during Preprocessing (invoked by mpi_split_data_multi_years.py)
# (assignments intentionally left in their plain, unquoted form)
source_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/preprocessedData/moving_mnist
destination_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/models/moving_mnist

# model to train; choose one of: convLSTM, savp, mcnet, vae
model=convLSTM
dataset=moving_mnist
model_hparams="../hparams/${dataset}/${model}/model_hparams.json"
# final output directory: <destination_dir>/<model>/<YYYYmmddTHHMM>_<user>
destination_dir="${destination_dir}/${model}/$(date +"%Y%m%dT%H%M")_${USER}"

# run training in container
export CUDA_VISIBLE_DEVICES=0
## One node, single GPU
srun --mpi=pspmix --cpu-bind=none \
     singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" "${VIRT_ENV_NAME}" \
     python ../main_scripts/train.py --input_dir "${source_dir}/tfrecords/" --dataset "${dataset}" --model "${model}" \
       --model_hparams_dict "${model_hparams}" --output_dir "${destination_dir}"/

# WITHOUT container usage, enable the following lines (and comment out the container-based lines above)
# Activate virtual environment if needed (and possible)
#if [[ -z "${VIRTUAL_ENV}" ]]; then
#   if [[ -f "../virtual_envs/${VIRT_ENV_NAME}/bin/activate" ]]; then
#      echo "Activating virtual environment..."
#      source "../virtual_envs/${VIRT_ENV_NAME}/bin/activate"
#   else
#      echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..."
#      exit 1
#   fi
#fi
#
# Loading modules
#module purge
#source ../env_setup/modules_train.sh
#export CUDA_VISIBLE_DEVICES=0
#
# srun python3 ../main_scripts/train.py --input_dir "${source_dir}/tfrecords/" --dataset "${dataset}" --model "${model}" \
#   --model_hparams_dict "${model_hparams}" --output_dir "${destination_dir}"/
\ No newline at end of file
video_prediction_tools/HPC_scripts/visualize_postprocess_moving_mnist_template.sh
deleted
100755 → 0
View file @
c8a97008
#!/bin/bash -x
#SBATCH --account=<your_project>
#SBATCH --nodes=1
#SBATCH --ntasks=1
##SBATCH --ntasks-per-node=1
#SBATCH --cpus-per-task=1
#SBATCH --output=generate_era5-out.%j
#SBATCH --error=generate_era5-err.%j
#SBATCH --time=00:20:00
#SBATCH --gres=gpu:1
#SBATCH --partition=develgpus
#SBATCH --mail-type=ALL
#SBATCH --mail-user=me@somewhere.com

# Slurm batch template: runs ../scripts/generate_movingmnist.py in test mode
# through srun inside a Singularity container and redirects its stdout to
# generate_era5-out.<SLURM_JOB_ID>.
# The guard right below prints a warning and exits with status 99, so the
# template itself never reaches the job steps further down.
# NOTE(review): the "generate_era5" file names and "--dataset era5" look like
# leftovers from an ERA5 template -- confirm they are intended for moving MNIST.

######### Template identifier (don't remove) #########
echo "Do not run the template scripts"
exit 99
######### Template identifier (don't remove) #########

# auxiliary variables
WORK_DIR="$(pwd)"
BASE_DIR="$(dirname "${WORK_DIR}")"

# Name of virtual environment
VIRT_ENV_NAME="my_venv"

# !!! ADAPT DEPENDING ON USAGE OF CONTAINER !!!
# For container usage, keep the following lines enabled
# Name of container image (must be available in working directory)
CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif"
WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh"

# sanity checks: abort with status 1 if the image or the wrapper is missing
if [[ ! -f "${CONTAINER_IMG}" ]]; then
  echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'."
  exit 1
fi
if [[ ! -f "${WRAPPER}" ]]; then
  echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image."
  exit 1
fi

# clean-up modules to avoid conflicts between host and container settings
module purge

# declare directory-variables which will be modified by config_runscript.py
# (assignments intentionally left in their plain, unquoted form)
source_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/preprocessedData/moving_mnist
checkpoint_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/models/moving_mnist
results_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/results/moving_mnist

# name of model
model=convLSTM

# run postprocessing/generation of model results including evaluation metrics
export CUDA_VISIBLE_DEVICES=0
## One node, single GPU
# NOTE(review): stdout is redirected to the same file name pattern that
# "#SBATCH --output" uses for the job log -- verify this overlap is wanted.
srun --mpi=pspmix --cpu-bind=none \
     singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" "${VIRT_ENV_NAME}" \
     python3 ../scripts/generate_movingmnist.py --input_dir "${source_dir}/" --dataset_hparams sequence_length=20 \
       --checkpoint "${checkpoint_dir}/${model}" --mode test --model "${model}" --results_dir "${results_dir}/${model}" \
       --batch_size 2 --dataset era5 > generate_era5-out."${SLURM_JOB_ID}"

# WITHOUT container usage, enable the following lines (and comment out the container-based lines above)
# Activate virtual environment if needed (and possible)
#if [[ -z "${VIRTUAL_ENV}" ]]; then
#   if [[ -f "../virtual_envs/${VIRT_ENV_NAME}/bin/activate" ]]; then
#      echo "Activating virtual environment..."
#      source "../virtual_envs/${VIRT_ENV_NAME}/bin/activate"
#   else
#      echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..."
#      exit 1
#   fi
#fi
#
# Loading modules
#module purge
#source ../env_setup/modules_train.sh
#export CUDA_VISIBLE_DEVICES=0
#
# srun python3 ../scripts/generate_movingmnist.py --input_dir "${source_dir}/" --dataset_hparams sequence_length=20 \
#   --checkpoint "${checkpoint_dir}/${model}" --mode test --model "${model}" --results_dir "${results_dir}/${model}" \
#   --batch_size 2 --dataset era5 > generate_era5-out."${SLURM_JOB_ID}"
\ No newline at end of file
Write
Preview
Supports
Markdown
0%
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment