-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathslurm.sh
28 lines (21 loc) · 1.68 KB
/
slurm.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
#!/bin/bash
# Slurm batch script for the training commands at the bottom of this file.
# The script reads SLURM_ARRAY_TASK_ID, so it is intended to be submitted as a
# job array. Note that it starts TWO training processes per array task, and
# both share the single allocation requested below (1 GPU, 12G, 8 CPUs).
#SBATCH --job-name rnd # Job name
### Logging
# Filename patterns: %A = job array's master job ID, %a = job array task index.
#SBATCH --output=/scratch/cluster/ishand/results/zoo2/rnd_td3_%A_%a.out # Name of stdout output file (%A = array master job ID, %a = array task index)
#SBATCH --error=/scratch/cluster/ishand/results/zoo2/rnd_td3_%A_%a.err # Name of stderr output file (%A = array master job ID, %a = array task index)
### Node info
#SBATCH --partition titans # titans or dgx
#SBATCH --nodes=1 # Always set to 1 when using the cluster
#SBATCH --ntasks-per-node=1 # Number of tasks per node (Set to the number of gpus requested)
#SBATCH --time 96:00:00 # Run time (hh:mm:ss)
#SBATCH --gres=gpu:1 # Number of gpus needed
#SBATCH --mem=12G # Memory requirements (shared by both training processes)
#SBATCH --cpus-per-task=8 # Number of cpus needed per task
# Launch two HER training runs on FetchPush-v1 in parallel within one Slurm
# array task, then wait for both and report failure if either one failed.

# Slurm sets SLURM_ARRAY_TASK_ID only for array jobs. Default to 0 so the
# script still works when submitted as a plain job (otherwise `sleep` below
# would be called without an operand and fail).
TASK_ID=${SLURM_ARRAY_TASK_ID:-0}

# Each array task derives two distinct seeds from its task index.
# NOTE(review): with the +3 offset, SEED2 of task i equals SEED of task i+3,
# so seeds repeat if the array spans more than 3 consecutive indices -
# presumably the array is submitted as 0-2; confirm.
SEED=$((TASK_ID + 1010))
SEED2=$((TASK_ID + 3 + 1010))
FILE=rnd_td3_10

# Tensorboard logs and training output both go to the same directory.
RESULTS_DIR=/scratch/cluster/ishand/results/zoo2/$FILE

# Arguments shared by both runs; only the seed differs.
TRAIN_ARGS=(
  --algo her
  --env FetchPush-v1
  --tensorboard-log "$RESULTS_DIR"
  --eval-episodes 100
  --eval-freq 20000
  -f "$RESULTS_DIR"
)

# Stagger array tasks by their index (in seconds) so they do not all start at
# the same instant.
sleep "$TASK_ID"

# `python -u` keeps stdout/stderr unbuffered so output reaches the Slurm log
# files promptly.
python -u train.py "${TRAIN_ARGS[@]}" --seed "$SEED" --verbose 0 &
PID1=$!

# NOTE(review): presumably this pause lets the first run create its output
# directory before the second run picks one in the same folder - confirm.
sleep 15

python -u train.py "${TRAIN_ARGS[@]}" --seed "$SEED2" --verbose 0 &
PID2=$!

# A bare `wait` always returns 0, which would make Slurm record the job as
# successful even if a run crashed. Wait on each PID and propagate failure.
STATUS=0
wait "$PID1" || STATUS=$?
wait "$PID2" || STATUS=$?
exit "$STATUS"