Add the gymnasium_fetchquadpo config and a Slurm array launcher for it.

REVIEW NOTE: line breaks, blank context lines and YAML indentation in the
.gitignore and configs.yaml hunks were reconstructed from the hunk counts.
Confirm them against the target files before applying. The index hash on
slurm.bash predates this revision of the script.

diff --git a/.gitignore b/.gitignore
index 738a5270..4eaf5f90 100644
--- a/.gitignore
+++ b/.gitignore
@@ -5,3 +5,4 @@ __pycache__/
 *.egg-info
 MUJOCO_LOG.TXT
 ;
+*.out
diff --git a/dreamerv3/configs.yaml b/dreamerv3/configs.yaml
index 1eb58287..a25ac0a0 100644
--- a/dreamerv3/configs.yaml
+++ b/dreamerv3/configs.yaml
@@ -231,7 +231,20 @@ gymnasium_fetchquad:
   .*\.units: 512
   encoder: {mlp_keys: '.*', cnn_keys: '.*'}
   decoder: {mlp_keys: '.*', cnn_keys: '.*'}
+  run.steps: 2e6
 
+gymnasium_fetchquadpo:
+  task: gymnasium_FetchPushQuadHardPO-v0
+  envs.amount: 4
+  run.log_keys_video: [camera_top]
+  run.train_ratio: 512
+  rssm.deter: 512
+  .*\.cnn_depth: 32
+  .*\.layers: 2
+  .*\.units: 512
+  encoder: {mlp_keys: '.*', cnn_keys: '.*'}
+  decoder: {mlp_keys: '.*', cnn_keys: '.*'}
+  run.steps: 2e6
 
 small:
   rssm.deter: 512
diff --git a/slurm.bash b/slurm.bash
new file mode 100644
index 00000000..82e54490
--- /dev/null
+++ b/slurm.bash
@@ -0,0 +1,47 @@
+#!/usr/bin/env bash
+#
+# Slurm array job that runs dreamerv3/train.py with the gymnasium_fetchquadpo config.
+# Each array task uses its array index as the training seed.
+# Submit from the repository root with: sbatch slurm.bash
+#
+#SBATCH --cpus-per-gpu=4
+#SBATCH --gres=gpu:1
+#SBATCH --time=48:00:00
+#SBATCH --partition=dineshj-compute
+#SBATCH --qos=dj-med
+#SBATCH --array=0-2
+#SBATCH --mem=40G
+
+# Disabled alternative resource request. The extra leading hash keeps sbatch from reading these lines.
+##SBATCH --cpus-per-gpu=4
+##SBATCH --partition=compute
+##SBATCH --gpus=1
+##SBATCH --qos=low
+##SBATCH --time=08:00:00
+##SBATCH --array=0-9
+###SBATCH --mem-per-gpu=16384
+
+set -euo pipefail
+
+# Use the EGL backend for MuJoCo and point it at the same device index as CUDA.
+export MUJOCO_GL=egl
+export CUDA_VISIBLE_DEVICES=0
+export MUJOCO_EGL_DEVICE_ID="${CUDA_VISIBLE_DEVICES}"
+
+EXPERIMENT=po_fq
+# Fall back to seed 0 when the script runs outside a Slurm array job.
+SEED="${SLURM_ARRAY_TASK_ID:-0}"
+LOGDIR=~/logdir/"${EXPERIMENT}_$(date "+%Y%m%d-%H%M%S")_s${SEED}"
+
+# Train in the background and send stdout and stderr to a per-seed log file.
+python dreamerv3/train.py \
+  --logdir "${LOGDIR}" \
+  --configs gymnasium_fetchquadpo,small \
+  --seed "${SEED}" \
+  > "${EXPERIMENT}_s${SEED}.out" 2>&1 &
+train_pid=$!
+
+# Report the training exit status to Slurm instead of a fixed failure code.
+status=0
+wait "${train_pid}" || status=$?
+exit "${status}"