Commit a6121ba2 authored by Michael Langguth
Add save_gpus_info to set-up mof model.

parent aa6d9dd6
Pipeline #58798 passed with stages in 2 minutes and 6 seconds
@@ -73,6 +73,7 @@ class TrainModel(object):
print("setup done")
def set_seed(self):
@@ -285,9 +286,9 @@ class TrainModel(object):
# also track computing node
-cnode_file = os.path.join(self.output_dir, "GPU_worker{0}.json".format(str(hvd.local_rank())))
+cnode_file = os.path.join(self.output_dir, "GPU_worker{0}.json".format(str(hvd.rank())))
 with open(cnode_file, "w") as fjs:
-json.dump({"worker{0}".format(str(hvd.local_rank())): host}, fjs)
+json.dump({"worker{0}".format(str(hvd.rank())): host}, fjs)
def save_timing_to_pkl(self, training_time, time_per_iteration):
