diff --git a/video_prediction_tools/HPC_scripts/preprocess_data_moving_mnist_template.sh b/video_prediction_tools/HPC_scripts/preprocess_data_moving_mnist_template.sh deleted file mode 100644 index f72950255efa181ca95b9b4f13c81efafe1e7733..0000000000000000000000000000000000000000 --- a/video_prediction_tools/HPC_scripts/preprocess_data_moving_mnist_template.sh +++ /dev/null @@ -1,71 +0,0 @@ -#!/bin/bash -x -#SBATCH --account=<your_project> -#SBATCH --nodes=1 -#SBATCH --ntasks=1 -##SBATCH --ntasks-per-node=1 -#SBATCH --cpus-per-task=1 -#SBATCH --output=DataPreprocess_moving_mnist-out.%j -#SBATCH --error=DataPreprocess_moving_mnist-err.%j -#SBATCH --time=04:00:00 -#SBATCH --partition=batch -#SBATCH --mail-type=ALL -#SBATCH --mail-user=me@somewhere.com - -######### Template identifier (don't remove) ######### -echo "Do not run the template scripts" -exit 99 -######### Template identifier (don't remove) ######### - -# Name of virtual environment -VIRT_ENV_NAME="my_venv" - -# !!! ADAPAT DEPENDING ON USAGE OF CONTAINER !!! -# For container usage, comment in the follwoing lines -# Name of container image (must be available in working directory) -CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif" -WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh" - -# sanity checks -if [[ ! -f ${CONTAINER_IMG} ]]; then - echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'." - exit 1 -fi - -if [[ ! -f ${WRAPPER} ]]; then - echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image." - exit 1 -fi - -# clean-up modules to avoid conflicts between host and container settings -module purge - -# declare directory-variables which will be modified generate_runscript.py -source_dir=/my/path/to/mnist/raw/data/ -destination_dir=/my/path/to/mnist/tfrecords/ - -# run Preprocessing (step 2 where Tf-records are generated) -# run postprocessing/generation of model results including evaluation metrics -export CUDA_VISIBLE_DEVICES=0 -## One node, single GPU -srun --mpi=pspmix --cpu-bind=none \ - singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" ${VIRT_ENV_NAME} \ - python3 ../video_prediction/datasets/moving_mnist.py ${source_dir} ${destination_dir} - -# WITHOUT container usage, comment in the follwoing lines (and uncomment the lines above) -# Activate virtual environment if needed (and possible) -#if [ -z ${VIRTUAL_ENV} ]; then -# if [[ -f ../virtual_envs/${VIRT_ENV_NAME}/bin/activate ]]; then -# echo "Activating virtual environment..." -# source ../virtual_envs/${VIRT_ENV_NAME}/bin/activate -# else -# echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..." -# exit 1 -# fi -#fi -# -# Loading modules -#module purge -#source ../env_setup/modules_train.sh -#export CUDA_VISIBLE_DEVICES=0 -# -# srun python3 .../video_prediction/datasets/moving_mnist.py ${source_dir} ${destination_dir} \ No newline at end of file diff --git a/video_prediction_tools/HPC_scripts/train_model_moving_mnist_template.sh b/video_prediction_tools/HPC_scripts/train_model_moving_mnist_template.sh deleted file mode 100755 index 322d0fac362119032f558232e8161321434d2f2f..0000000000000000000000000000000000000000 --- a/video_prediction_tools/HPC_scripts/train_model_moving_mnist_template.sh +++ /dev/null @@ -1,82 +0,0 @@ -#!/bin/bash -x -#SBATCH --account=<your_project> -#SBATCH --nodes=1 -#SBATCH --ntasks=1 -##SBATCH --ntasks-per-node=1 -#SBATCH --cpus-per-task=1 -#SBATCH --output=train_moving_mnist-out.%j -#SBATCH --error=train_moving_mnist-err.%j -#SBATCH --time=00:20:00 -#SBATCH --gres=gpu:1 -#SBATCH --partition=gpus -#SBATCH --mail-type=ALL -#SBATCH --mail-user=me@somewhere.com - -######### Template identifier (don't remove) ######### -echo "Do not run the template scripts" -exit 99 -######### Template identifier (don't remove) ######### - -# auxiliary variables -WORK_DIR=`pwd` -BASE_DIR=$(dirname "$WORK_DIR") -# Name of virtual environment -VIRT_ENV_NAME="my_venv" -# !!! ADAPAT DEPENDING ON USAGE OF CONTAINER !!! -# For container usage, comment in the follwoing lines -# Name of container image (must be available in working directory) -CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif" -WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh" - -# sanity checks -if [[ ! -f ${CONTAINER_IMG} ]]; then - echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'." - exit 1 -fi - -if [[ ! -f ${WRAPPER} ]]; then - echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image." - exit 1 -fi - -# clean-up modules to avoid conflicts between host and container settings -module purge - -# declare directory-variables which will be modified appropriately during Preprocessing (invoked by mpi_split_data_multi_years.py) - -source_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/preprocessedData/moving_mnist -destination_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/models/moving_mnist - -# for choosing the model, convLSTM,savp, mcnet,vae -model=convLSTM -dataset=moving_mnist -model_hparams=../hparams/${dataset}/${model}/model_hparams.json -destination_dir=${destination_dir}/${model}/"$(date +"%Y%m%dT%H%M")_"$USER"" - -# run training in container -export CUDA_VISIBLE_DEVICES=0 -## One node, single GPU -srun --mpi=pspmix --cpu-bind=none \ - singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" ${VIRT_ENV_NAME} \ - python ../main_scripts/train.py --input_dir ${source_dir}/tfrecords/ --dataset ${dataset} --model ${model} \ - --model_hparams_dict ${model_hparams} --output_dir "${destination_dir}"/ - -# WITHOUT container usage, comment in the follwoing lines (and uncomment the lines above) -# Activate virtual environment if needed (and possible) -#if [ -z ${VIRTUAL_ENV} ]; then -# if [[ -f ../virtual_envs/${VIRT_ENV_NAME}/bin/activate ]]; then -# echo "Activating virtual environment..." -# source ../virtual_envs/${VIRT_ENV_NAME}/bin/activate -# else -# echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..." -# exit 1 -# fi -#fi -# -# Loading modules -#module purge -#source ../env_setup/modules_train.sh -#export CUDA_VISIBLE_DEVICES=0 -# -# srun python3 ../main_scripts/train.py --input_dir ${source_dir}/tfrecords/ --dataset ${dataset} --model ${model} \ -# --model_hparams_dict ${model_hparams} --output_dir "${destination_dir}"/ \ No newline at end of file diff --git a/video_prediction_tools/HPC_scripts/visualize_postprocess_moving_mnist_template.sh b/video_prediction_tools/HPC_scripts/visualize_postprocess_moving_mnist_template.sh deleted file mode 100755 index 142193121fb12ea792d0350eac859652512438a1..0000000000000000000000000000000000000000 --- a/video_prediction_tools/HPC_scripts/visualize_postprocess_moving_mnist_template.sh +++ /dev/null @@ -1,80 +0,0 @@ -#!/bin/bash -x -#SBATCH --account=<your_project> -#SBATCH --nodes=1 -#SBATCH --ntasks=1 -##SBATCH --ntasks-per-node=1 -#SBATCH --cpus-per-task=1 -#SBATCH --output=generate_era5-out.%j -#SBATCH --error=generate_era5-err.%j -#SBATCH --time=00:20:00 -#SBATCH --gres=gpu:1 -#SBATCH --partition=develgpus -#SBATCH --mail-type=ALL -#SBATCH --mail-user=me@somewhere.com - -######### Template identifier (don't remove) ######### -echo "Do not run the template scripts" -exit 99 -######### Template identifier (don't remove) ######### - -# auxiliary variables -WORK_DIR="$(pwd)" -BASE_DIR=$(dirname "$WORK_DIR") -# Name of virtual environment -VIRT_ENV_NAME="my_venv" -# !!! ADAPAT DEPENDING ON USAGE OF CONTAINER !!! -# For container usage, comment in the follwoing lines -# Name of container image (must be available in working directory) -CONTAINER_IMG="${WORK_DIR}/tensorflow_21.09-tf1-py3.sif" -WRAPPER="${BASE_DIR}/env_setup/wrapper_container.sh" - -# sanity checks -if [[ ! -f ${CONTAINER_IMG} ]]; then - echo "ERROR: Cannot find required TF1.15 container image '${CONTAINER_IMG}'." - exit 1 -fi - -if [[ ! -f ${WRAPPER} ]]; then - echo "ERROR: Cannot find wrapper-script '${WRAPPER}' for TF1.15 container image." - exit 1 -fi - -# clean-up modules to avoid conflicts between host and container settings -module purge - -# declare directory-variables which will be modified by config_runscript.py -source_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/preprocessedData/moving_mnist -checkpoint_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/models/moving_mnist -results_dir=/p/project/deepacf/deeprain/video_prediction_shared_folder/results/moving_mnist -# name of model -model=convLSTM - -# run postprocessing/generation of model results including evaluation metrics -export CUDA_VISIBLE_DEVICES=0 -## One node, single GPU -srun --mpi=pspmix --cpu-bind=none \ - singularity exec --nv "${CONTAINER_IMG}" "${WRAPPER}" ${VIRT_ENV_NAME} \ - python3 ../scripts/generate_movingmnist.py --input_dir ${source_dir}/ --dataset_hparams sequence_length=20 \ - --checkpoint ${checkpoint_dir}/${model} --mode test --model ${model} --results_dir ${results_dir}/${model} \ - --batch_size 2 --dataset era5 > generate_era5-out."${SLURM_JOB_ID}" - -# WITHOUT container usage, comment in the follwoing lines (and uncomment the lines above) -# Activate virtual environment if needed (and possible) -#if [ -z ${VIRTUAL_ENV} ]; then -# if [[ -f ../virtual_envs/${VIRT_ENV_NAME}/bin/activate ]]; then -# echo "Activating virtual environment..." -# source ../virtual_envs/${VIRT_ENV_NAME}/bin/activate -# else -# echo "ERROR: Requested virtual environment ${VIRT_ENV_NAME} not found..." -# exit 1 -# fi -#fi -# -# Loading modules -#module purge -#source ../env_setup/modules_train.sh -#export CUDA_VISIBLE_DEVICES=0 -# -# srun python3 ../scripts/generate_movingmnist.py --input_dir ${source_dir}/ --dataset_hparams sequence_length=20 \ -# --checkpoint ${checkpoint_dir}/${model} --mode test --model ${model} --results_dir ${results_dir}/${model} \ -# --batch_size 2 --dataset era5 > generate_era5-out."${SLURM_JOB_ID}" \ No newline at end of file