forked from KevinBian107/VNL-Brax
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathslurm.py
33 lines (31 loc) · 886 Bytes
/
slurm.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
import subprocess
def slurm_submit(script):
    """Submit a batch script to Slurm through ``sbatch`` and return its job ID.

    The script text is piped to ``sbatch`` on standard input, so no temporary
    file is written.

    Args:
        script: Full text of the batch script, including its ``#SBATCH``
            header lines.

    Returns:
        The job ID reported by ``sbatch``, as a string.

    Raises:
        subprocess.CalledProcessError: If ``sbatch`` exits with a non-zero
            status.
        RuntimeError: If ``sbatch`` succeeds but prints nothing on stdout.
    """
    output = subprocess.check_output(
        ["sbatch"], input=script, universal_newlines=True
    )
    tokens = output.split()
    if not tokens:
        raise RuntimeError("sbatch produced no output; cannot determine job ID")

    # sbatch normally prints "Submitted batch job <id>", but a multi-cluster
    # submission appends " on cluster <name>", so the ID is not always the
    # last token. The first purely numeric token is the job ID in both forms.
    for token in tokens:
        if token.isdigit():
            return token

    # Unrecognized format: keep the historical behavior of returning the
    # last whitespace-separated token.
    return tokens[-1]
def submit():
    """Build the batch script for the rodent PPO run and submit it to Slurm.

    The embedded script asks for one node (``-N 1``), 4 CPUs (``-c 4``),
    ``--mem=16000``, a ``0-8:00`` time limit and two A100 80GB GPUs under the
    job name ``rodent``. It then loads Mambaforge, activates the ``rl``
    environment, loads CUDA, prints ``nvidia-smi`` output and runs
    ``brax_rodent_run_ppo.py``.

    Progress and the resulting job ID are printed to stdout.

    Returns:
        The job ID returned by ``slurm_submit``.
    """
    # A plain string is used on purpose: the script has no placeholders, and
    # keeping it a non-f-string means shell braces can be added later without
    # being treated as Python format fields.
    script = """#!/bin/bash
#SBATCH -p olveczkygpu,gpu,gpu_requeue,serial_requeue # olveczky,cox,shared,serial_requeue # olveczkygpu,gpu_requeue
#SBATCH --mem=16000
#SBATCH -c 4
#SBATCH -N 1
# #SBATCH --constraint="a100"
#SBATCH -t 0-8:00
#SBATCH -J rodent
#SBATCH --gres=gpu:nvidia_a100-sxm4-80gb:2
# #SBATCH --gres=gpu:nvidia_h100_80gb_hbm3:2
# # SBATCH -o /slurm/out
# # SBATCH -e /slurm/error
source ~/.bashrc
module load Mambaforge/22.11.1-fasrc01
source activate rl
module load cuda/12.2.0-fasrc01
nvidia-smi
python3 brax_rodent_run_ppo.py
"""
    print("Submitting job")
    job_id = slurm_submit(script)
    print(job_id)
    # Hand the ID back so callers can monitor or cancel the job.
    return job_id
# Submit the job as soon as this file is executed. The call is not guarded by
# `if __name__ == "__main__":`, so importing this module also submits a job.
submit()