Skip to content

Commit

Permalink
non-gpu version
Browse files Browse the repository at this point in the history
  • Loading branch information
mwalmsley committed Nov 3, 2023
1 parent 6a375e3 commit 6118ee0
Showing 1 changed file with 25 additions and 0 deletions.
25 changes: 25 additions & 0 deletions only_for_me/narval/train.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,25 @@
#!/bin/bash
#SBATCH --mem=32G
#SBATCH --nodes=1
#SBATCH --time=0:20:0
#SBATCH --tasks-per-node=1
#SBATCH --cpus-per-task=4

### SBATCH --gres=gpu:a100:1

# Slurm batch script (CPU-only variant): stages the galaxy_mnist dataset onto
# the job's node-local scratch ($SLURM_TMPDIR) and launches train.py in debug
# mode through srun.
#
# Usage:    sbatch train.sh
# Requires: SLURM_TMPDIR (set by the scheduler inside a job allocation).
#
# NOTE: the GPU request above is deliberately disabled (the extra '#'s and the
# space turn the directive into a plain comment). All '#SBATCH' directives must
# stay above the first executable command or sbatch ignores them.

# GPU diagnostics. With the GPU request disabled this is expected to be
# unavailable or to fail, so it is guarded and never aborts the job.
if command -v nvidia-smi >/dev/null 2>&1; then
  nvidia-smi || echo "warning: nvidia-smi failed (expected on a CPU-only allocation)" >&2
else
  echo "warning: nvidia-smi not found; skipping GPU diagnostics" >&2
fi

PYTHON=/home/walml/envs/zoobot39_dev/bin/python

# Without SLURM_TMPDIR the staging path would collapse to /walml/... at the
# filesystem root, so refuse to run outside a Slurm job.
if [[ -z "${SLURM_TMPDIR:-}" ]]; then
  echo "error: SLURM_TMPDIR is not set; submit this script with sbatch" >&2
  exit 1
fi

DATA_SRC=/project/def-bovy/walml/data/roots/galaxy_mnist
DATA_DEST="$SLURM_TMPDIR/walml/finetune/data"

# The destination hierarchy is not created anywhere else in this script, so
# create it first; otherwise 'cp -r' fails because the parent directories
# are missing.
mkdir -p -- "$DATA_DEST" \
  || echo "warning: could not create $DATA_DEST" >&2
cp -r -- "$DATA_SRC" "$DATA_DEST/" \
  || echo "warning: failed to copy $DATA_SRC to $DATA_DEST" >&2

# Listing the staged data in the job log makes a failed copy easy to spot.
ls -- "$DATA_DEST/galaxy_mnist"

# Set this environment variable if you wish to use the NCCL backend for
# inter-GPU communication.
export NCCL_BLOCKING_WAIT=1
# export MASTER_ADDR=$(hostname) # Store the master node's IP address in the MASTER_ADDR environment variable.
# echo "r$SLURM_NODEID master: $MASTER_ADDR"
# echo "r$SLURM_NODEID Launching python script"

# No trailing slash, so the joined paths below do not contain '//'.
REPO_DIR=/project/def-bovy/walml/zoobot
srun "$PYTHON" "$REPO_DIR/only_for_me/narval/train.py" \
  --save-dir "$REPO_DIR/only_for_me/narval/debug_models" \
  --batch-size 4 \
  --color \
  --debug
# srun python $SLURM_TMPDIR/zoobot/only_for_me/narval/finetune.py

0 comments on commit 6118ee0

Please sign in to comment.