diff --git a/pytorch/cifar10/submit_job_venv.sh b/pytorch/cifar10/submit_job_venv.sh index 982188fdb77b6fa78b3686cfb4fc04ef8b1ccc95..ec783c5cd32f1509d8bab1e1bb74969114dfc0b4 100644 --- a/pytorch/cifar10/submit_job_venv.sh +++ b/pytorch/cifar10/submit_job_venv.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings diff --git a/pytorch/cifar10_distributed/submit_job_venv.sh b/pytorch/cifar10_distributed/submit_job_venv.sh index ff2fe9252d20c0440cf697b33541609e5113f9ec..38fde6eb7ad8e45d019a74c63ddcdd306df30c37 100644 --- a/pytorch/cifar10_distributed/submit_job_venv.sh +++ b/pytorch/cifar10_distributed/submit_job_venv.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings diff --git a/pytorch/mnist/submit_job_venv.sh b/pytorch/mnist/submit_job_venv.sh index 982188fdb77b6fa78b3686cfb4fc04ef8b1ccc95..ec783c5cd32f1509d8bab1e1bb74969114dfc0b4 100644 --- a/pytorch/mnist/submit_job_venv.sh +++ b/pytorch/mnist/submit_job_venv.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings diff --git a/pytorch/mnist_distributed/submit_job_venv.sh b/pytorch/mnist_distributed/submit_job_venv.sh index ff2fe9252d20c0440cf697b33541609e5113f9ec..38fde6eb7ad8e45d019a74c63ddcdd306df30c37 100644 --- a/pytorch/mnist_distributed/submit_job_venv.sh +++ b/pytorch/mnist_distributed/submit_job_venv.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings diff --git a/tensorflow/cifar10/submit_job_container.sh b/tensorflow/cifar10/submit_job_container.sh index fa9b7b5c86a209e904a1255dbfe663c5fc3ee23f..0e6f4403ddef43c064c7ee4e8bc9f5304e391574 100644 --- a/tensorflow/cifar10/submit_job_container.sh +++ b/tensorflow/cifar10/submit_job_container.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# load module for PyTorch container +# load module for TensorFlow container module load TensorFlow/nvcr-24.01-tf2-py3 module list @@ -36,11 +36,11 @@ export NCCL_SOCKET_NTHREADS=8 # multi-threading for NCCL communication ### Execution (Model Training) ############################################################ -# tensorflow in container often needs a tmp directory +# TensorFlow in container often needs a tmp directory NEWTMP=$(pwd)/tmp mkdir -p ${NEWTMP} # run the python script inside the container source set_vars.sh apptainer exec -e --nv -B ${NEWTMP}:/tmp ${TENSORFLOW_IMAGE} \ - bash -c "python -W ignore train_model.py"' + bash -c "python -W ignore train_model.py" diff --git a/tensorflow/cifar10/submit_job_venv.sh b/tensorflow/cifar10/submit_job_venv.sh index cc27dd67c6c75c89bd28be5739cb0a57eda0b100..6a03c40ee85ccad177d1e8d91855f32d0077d5f5 100644 --- a/tensorflow/cifar10/submit_job_venv.sh +++ b/tensorflow/cifar10/submit_job_venv.sh @@ -9,22 +9,12 @@ #SBATCH --ntasks-per-node=2 #SBATCH --cpus-per-task=24 #SBATCH --gres=gpu:2 -#SBATCH --account=supp0001 ############################################################ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment -module purge -module load GCC/11.3.0 -module load OpenMPI/4.1.4 -module load CMake/3.21.1 -module load Python/3.9.6 -module load NCCL/2.20.5-CUDA-12.4.0 -module load cuDNN/8.9.7.29-CUDA-12.3.0 - -source /work/jk869269/venvs/tensorflow-2.17_CUDA-12.3/bin/activate +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings diff --git a/tensorflow/cifar10_distributed/submit_job_container.sh b/tensorflow/cifar10_distributed/submit_job_container.sh index 8fc82912b59995ac65184e8633981c3ff5f8b1b4..3e1a1e7204f9c43f0dd7320548eb8c0366f47e88 100644 --- a/tensorflow/cifar10_distributed/submit_job_container.sh +++ b/tensorflow/cifar10_distributed/submit_job_container.sh @@ -14,7 +14,7 @@ ### Load modules or software ############################################################ -# load module for PyTorch container +# load module for TensorFlow container module load TensorFlow/nvcr-24.01-tf2-py3 module list @@ -36,7 +36,7 @@ export NCCL_SOCKET_NTHREADS=8 # multi-threading for NCCL communication ### Execution (Model Training) ############################################################ -# tensorflow in container often needs a tmp directory +# TensorFlow in container often needs a tmp directory NEWTMP=$(pwd)/tmp mkdir -p ${NEWTMP} diff --git a/tensorflow/cifar10_distributed/submit_job_venv.sh b/tensorflow/cifar10_distributed/submit_job_venv.sh index be3ff767cc97f9fe911046e6f55e4cfabe0b035f..14e22096a46d253b88dfb9e585fed86e691bf8fe 100644 --- a/tensorflow/cifar10_distributed/submit_job_venv.sh +++ b/tensorflow/cifar10_distributed/submit_job_venv.sh @@ -9,22 +9,12 @@ #SBATCH --ntasks-per-node=2 #SBATCH --cpus-per-task=24 #SBATCH --gres=gpu:2 -#SBATCH --account=supp0001 ############################################################ ### Load modules or software ############################################################ -# TODO: activate your desired virtual environment -module purge -module load GCC/11.3.0 -module load OpenMPI/4.1.4 -module load CMake/3.21.1 -module load Python/3.9.6 -module load NCCL/2.20.5-CUDA-12.4.0 -module load cuDNN/8.9.7.29-CUDA-12.3.0 - -source /work/jk869269/venvs/tensorflow-2.17_CUDA-12.3/bin/activate +# TODO: load/activate your desired modules and virtual environment ############################################################ ### Parameters and Settings