Rename config_runscripts.py to generate_runscripts.py and delete generation...

Rename config_runscripts.py to generate_runscripts.py and delete generation script from HPC_scripts/.

Rename config_runscripts.py to generate_runscripts.py and delete generation...
2eff2cf6 · Michael Langguth · 54863cfd · 54863cfd · 2eff2cf6
Commit 2eff2cf6 authored Feb 4, 2021 by Michael Langguth
--- a/video_prediction_tools/HPC_scripts/config_runscript.py
+++ b/video_prediction_tools/HPC_scripts/config_runscript.py
-"""
-Basic task of the Python-script:
-Creates user-defined runscripts for preprocessing, training and postprocessing via keyboard interaction.
-"""
-__email__ = "b.gong@fz-juelich.de"
-__authors__ = "Michael Langguth"
-__date__ = "2020-12-22"
-# import modules
-import sys, os, glob
-import numpy as np
-import subprocess
-import datetime as dt
-import json as js
-if sys.version_info[0] < 3:
-    raise Exception("This script has to be run with Python 3!")
-sys.path.append(os.path.dirname(sys.path[0]))
-from model_modules.model_architectures import known_models
-from data_preprocess.dataset_options import known_datasets
-from utils.configurations import *
-def main():
-    list_models = known_models().keys()
-    list_datasets = known_datasets().keys()
-    # sanity check (is Python running in a virtual environment)
-    venv_name = check_virtualenv(labort=True)
-    # set up class instance
-    config_custom = Config_runscript()
-    ## get required information from the user by keyboard interaction
-    # runscript to configure
-    def check_req_runscript(runscript_req, silent=False):
-        if not np.any(runscript_req == ["training","preprocessing"]):
-            if not silent:
-                print("Enter either 'preprocessing' or 'training' to choose the type of runscripts to configure.\n" +
-                      "Note that choosing training also involves the postprocessing runscript.")
-            return False
-        else:
-            return True
-    runscript_req_str = "Enter the name of the dataset for training:\n" + \
-                        " Choose 'preprocessing' for configuring " + \
-                        "preprocessing step 2 or 'training' for configuring training and postprocessing" + \
-                        "of a customized experiment."
-    runscript_err = ValueError("Invalid runscript choice encountered.")
-    runscript = keyboard_interaction(runscript_req_str, check_req_runscript, runscript_err, ntries=2)
-    config_custom.set_req_attrs(runscript)
-    # dataset used for training
-    def check_dataset(dataset_name, silent=False):
-        # NOTE: Generic template for training still has to be integrated!
-        #       After this is done, the latter part of the if-clause can be removed
-        #       and further adaptions for the target_dir and for retrieving base_dir (see below) are required
-        if not dataset_name in list_datasets or dataset_name != "era5":
-            if not silent:
-                print("The following dataset can be used for training:")
-                for dataset_avail in list_datasets: print("* " + dataset_avail)
-            return False
-        else:
-            return True
-    dataset_req_str = "Enter the name of the dataset for training:\n"
-    dataset_err     = ValueError("Please select a dataset from the ones listed above.")
-    dataset = keyboard_interaction(dataset_req_str,check_dataset,dataset_err,ntries=2)
-    # path to preprocessed data
-    def check_expdir(exp_dir, silent=False):
-        status = False
-        if os.path.isdir(exp_dir):
-            file_list = glob.glob(os.path.join(exp_dir,"sequence*.tfrecords"))
-            if len(file_list) > 0:
-                status = True
-            else:
-                print("{0} does not contain any tfrecord-files.".format(exp_dir))
-        else:
-            if not silent: print("Passed directory does not exist!")
-        return status
-    expdir_req_str = "Enter the path to the preprocessed data (directory where tf-records files are located):\n"
-    expdir_err     = FileNotFoundError("Could not find any tfrecords.")
-    exp_dir_full   = keyboard_interaction(expdir_req_str, check_expdir, expdir_err, ntries=3)
-    # split up directory path
-    exp_dir_split = path_rec_split(exp_dir_full)
-    index = [idx for idx, s in enumerate(exp_dir_split) if dataset in s]
-    if index == []:
-        raise ValueError("tfrecords found under '{0}', but directory does not seem to reflect naming convention.".format(exp_dir_full))
-    exp_dir = exp_dir_split[index[0]]
-    # model
-    def check_model(model_name, silent=False):
-        if not model_name in list_models:
-            if not silent:
-                print("{0} is not a valid model!".format(model_name))
-                print("The following models are implemented in the workflow:")
-                for model_avail in list_models: print("* " + model_avail)
-            return False
-        else:
-            return True
-    model_req_str = "Enter the name of the model you want to train:\n"
-    model_err     = ValueError("Please select a model from the ones listed above.")
-    model = keyboard_interaction(model_req_str, check_model, model_err, ntries=2)
-    # experimental ID
-    # No need to call keyboard_interaction here, because the user can pass whatever they want
-    exp_id = input("Enter your desired experimental id (will be extended by timestamp and username):\n")
-    # also get current timestamp and user-name...
-    timestamp = dt.datetime.now().strftime("%Y%m%dT%H%M%S")
-    user_name = os.environ["USER"]
-    # ... to construct final target_dir and exp_dir_ext as well
-    exp_id = timestamp +"_"+ user_name +"_"+ exp_id  # by convention, exp_id is extended by timestamp and username
-    base_dir   = get_variable_from_runscript('train_model_era5_template.sh','destination_dir')
-    exp_dir_ext= os.path.join(exp_dir,model,exp_id)
-    target_dir = os.path.join(base_dir,exp_dir,model,exp_id)
-    # sanity check (target_dir is unique):
-    if os.path.isdir(target_dir):
-        raise IsADirectoryError(target_dir+" already exists! Make sure that it is unique.")
-    # create destination directory...
-    os.makedirs(target_dir)
-    source_hparams = os.path.join("..","hparams",dataset,model,"model_hparams.json")
-    # sanity check (default hyperparameter json-file exists)
-    if not os.path.isfile(source_hparams):
-        raise FileNotFoundError("Could not find default hyperparameter json-file '"+source_hparams+"'")
-    # ...copy over json-file for hyperparameters...
-    os.system("cp "+source_hparams+" "+target_dir)
-    # ...and open it in the user's editor ($EDITOR, falling back to vi)
-    cmd_vim = os.environ.get('EDITOR', 'vi') + ' ' + os.path.join(target_dir,"model_hparams.json")
-    subprocess.call(cmd_vim, shell=True)
-    # finally, create runscript for training...
-    cmd = "cd ../env_setup; ./generate_workflow_runscripts.sh ../HPC_scripts/train_model_era5 "+ venv_name+ \
-          " -exp_id="+exp_id+" -exp_dir="+exp_dir+" -exp_dir_ext="+exp_dir_ext+" -model="+model+" ; cd -"
-    os.system(cmd)
-    # ...and postprocessing as well
-    cmd = cmd.replace("train_model_era5","visualize_postprocess_era5")
-    os.system(cmd)
-if __name__== '__main__':
-    main()
--- a/video_prediction_tools/config_runscripts/config_runscripts.py
+++ b/video_prediction_tools/config_runscripts/config_runscripts.py