lerobot/sbatch.sh

25 lines
837 B
Bash
Raw Normal View History

2024-02-22 21:04:32 +08:00
#!/bin/bash
#SBATCH --nodes=1 # total number of nodes (here 1)
#SBATCH --ntasks-per-node=1 # number of tasks per node (here 1 task, matching the single GPU)
2024-03-05 01:32:29 +08:00
#SBATCH --qos=normal # quality of service (QOS) requested for the job
#SBATCH --partition=hopper-prod
2024-02-22 21:04:32 +08:00
#SBATCH --gres=gpu:1 # number of GPUs reserved per node (here 1)
2024-03-05 01:32:29 +08:00
#SBATCH --cpus-per-task=12 # number of cores per task
#SBATCH --mem-per-cpu=11G
#SBATCH --time=12:00:00
#SBATCH --output=/admin/home/remi_cadene/slurm/%j.out
#SBATCH --error=/admin/home/remi_cadene/slurm/%j.err
#SBATCH --mail-user=remi_cadene@huggingface.co
2024-02-22 21:04:32 +08:00
#SBATCH --mail-type=ALL
#######################################
# Log the requested command and launch it as a job step with srun.
# Arguments: the command to run followed by its arguments, exactly as they
#            were passed to this script.
# Outputs:   writes "command: <arguments joined by spaces>" to stdout;
#            writes a usage message to stderr when no command is given.
# Returns:   2 if no command was given, otherwise the exit status of srun.
#######################################
main() {
  # Fail early with a clear message instead of letting srun start with
  # nothing to execute.
  if (( $# == 0 )); then
    printf 'usage: %s <command> [args...]\n' "${0##*/}" >&2
    return 2
  fi

  # "$*" joins the arguments with spaces (default IFS); this flattened form
  # is used for the log line only, never to build the command itself.
  printf 'command: %s\n' "$*"

  # apptainer exec --nv \
  # ~/apptainer/nvidia_cuda:12.2.2-devel-ubuntu22.04.sif $SHELL

  #source ~/.bashrc
  #conda activate fowm

  # "$@" forwards every argument as its own word, so arguments containing
  # spaces or glob characters reach the command unchanged. Storing them in a
  # plain string and expanding it unquoted would re-split and glob-expand them.
  srun "$@"
}

main "$@"