Skip to content

Commit

Permalink
srun
Browse files (browse the repository at this point in the history)
  • Loading branch information
LenkaNovak committed Sep 19, 2023
1 parent 78a37d4 commit e579d84
Showing 1 changed file with 10 additions and 16 deletions.
26 changes: 10 additions & 16 deletions .buildkite/pipeline.yml
Original file line number Diff line number Diff line change
@@ -1,3 +1,8 @@
+ agents:
+ queue: central
+ slurm_mem: 8G
+ modules: julia/1.9.3 cuda/11.8 ucx/1.14.1_cuda-11.8 openmpi/4.1.5_cuda-11.8 hdf5/1.12.2-ompi415 nsight-systems/2023.2.1

env:
JULIA_LOAD_PATH: "${JULIA_LOAD_PATH}:${BUILDKITE_BUILD_CHECKOUT_PATH}/.buildkite"
OPENBLAS_NUM_THREADS: 1
Expand All @@ -9,19 +14,9 @@ env:
CONFIG_PATH: "config/model_configs"
PERF_CONFIG_PATH: "config/perf_configs"
MPI_CONFIG_PATH: "config/mpi_configs"
SLURM_KILL_BAD_EXIT: 1
BUILDKITE_COMMIT: "${BUILDKITE_COMMIT}"
BUILDKITE_BRANCH: "${BUILDKITE_BRANCH}"
SLURM_KILL_BAD_EXIT: 1

- agents:
- config: cpu
- queue: central
- modules: julia/1.9.3 cuda/11.8 ucx/1.14.1_cuda-11.8 openmpi/4.1.5_cuda-11.8 hdf5/1.12.2-ompi415 nsight-systems/2023.2.1
- slurm_ntasks: 1
- slurm_time: 24:00:00
- slurm_mem: 8G
- slurm_gpus: 1
- slurm_cpus_per_task: 8

timeout_in_minutes: 1440

Expand Down Expand Up @@ -68,6 +63,7 @@ steps:

agents:
slurm_cpus_per_task: 8
slurm_gpus: 1
env:
JULIA_NUM_PRECOMPILE_TASKS: 8
JULIA_MAX_NUM_PRECOMPILE_FILES: 50
Expand Down Expand Up @@ -104,15 +100,13 @@ steps:

- label: "MPI Checkpointer unit tests"
key: "checkpointer_mpi_tests"
- command: "mpiexec julia --color=yes --project=test/ test/mpi_tests/checkpointer_mpi_tests.jl --run_name checkpointer_mpi --job_id checkpointer_mpi"
+ command: "srun julia --color=yes --project=test/ test/mpi_tests/checkpointer_mpi_tests.jl --run_name checkpointer_mpi --job_id checkpointer_mpi"
timeout_in_minutes: 20
env:
CLIMACORE_DISTRIBUTED: "MPI"
agents:
- config: cpu
- queue: central
- slurm_nodes: 3
- slurm_tasks_per_node: 1
+ slurm_ntasks: 2
+ slurm_mem: 16GB

- label: "Perf flame graph diff tests"
command: "julia --color=yes --project=perf/ perf/flame_test.jl --run_name flame_test --job_id flame_perf_target"
Expand Down

0 comments on commit e579d84

Please sign in to comment.