From 478ad12b77a2417272c8b2b379d5470794293902 Mon Sep 17 00:00:00 2001 From: Jannis Klinkenberg <j.klinkenberg@itc.rwth-aachen.de> Date: Sat, 16 Nov 2024 18:46:15 +0100 Subject: [PATCH] minor bug fixes --- tensorflow/cifar10/train_model.py | 4 +++- tensorflow/cifar10_distributed/train_model.py | 6 +++--- tensorflow/cifar10_distributed/train_model_horovod.py | 2 +- 3 files changed, 7 insertions(+), 5 deletions(-) diff --git a/tensorflow/cifar10/train_model.py b/tensorflow/cifar10/train_model.py index 05648eb..1f84eb0 100644 --- a/tensorflow/cifar10/train_model.py +++ b/tensorflow/cifar10/train_model.py @@ -18,6 +18,8 @@ def parse_command_line(): parser.add_argument("--profile_batches", required=False, help='Batches to profile with for tensorboard. Format "batch_start,batch_end"', type=str, default="2,5") args = parser.parse_args() + args.verbosity = 2 + print("Settings:") settings_map = vars(args) for name in sorted(settings_map.keys()): @@ -64,7 +66,7 @@ def load_dataset(args): return ds_train, ds_test, train_shape def setup(args): - print(f"Number of GPU devices found on worker {args.world_rank}", len(tf.config.list_physical_devices("GPU"))) + print(f"Number of GPU devices found:", len(tf.config.list_physical_devices("GPU"))) tf.keras.backend.clear_session() tf.config.optimizer.set_jit(True) diff --git a/tensorflow/cifar10_distributed/train_model.py b/tensorflow/cifar10_distributed/train_model.py index c80076d..812eea8 100644 --- a/tensorflow/cifar10_distributed/train_model.py +++ b/tensorflow/cifar10_distributed/train_model.py @@ -73,7 +73,7 @@ def load_dataset(args): return ds_train, ds_test, train_shape def setup(args): - print(f"Number of GPU devices found on worker {args.world_rank}", len(tf.config.list_physical_devices("GPU"))) + print(f"Number of GPU devices found on worker {args.world_rank}:", len(tf.config.list_physical_devices("GPU"))) tf.keras.backend.clear_session() tf.config.optimizer.set_jit(True) @@ -85,8 +85,8 @@ def setup(args): ) ) - print("MultiWorkerMirroredStrategy.num_replicas_in_sync", strategy.num_replicas_in_sync) - print("MultiWorkerMirroredStrategy.worker_index", strategy.cluster_resolver.task_id) + print("MultiWorkerMirroredStrategy.num_replicas_in_sync:", strategy.num_replicas_in_sync) + print("MultiWorkerMirroredStrategy.worker_index:", strategy.cluster_resolver.task_id) return strategy diff --git a/tensorflow/cifar10_distributed/train_model_horovod.py b/tensorflow/cifar10_distributed/train_model_horovod.py index 6cae19e..dbd6776 100644 --- a/tensorflow/cifar10_distributed/train_model_horovod.py +++ b/tensorflow/cifar10_distributed/train_model_horovod.py @@ -76,7 +76,7 @@ def load_dataset(args): return ds_train, ds_test, train_shape def setup(args): - print(f"Number of GPU devices found on worker {args.world_rank}", len(tf.config.list_physical_devices("GPU"))) + print(f"Number of GPU devices found on worker {args.world_rank}:", len(tf.config.list_physical_devices("GPU"))) tf.keras.backend.clear_session() tf.config.optimizer.set_jit(True) -- GitLab