From d36ea0b89717d81a26c188da297353f6525c4997 Mon Sep 17 00:00:00 2001 From: lenka Date: Thu, 28 Mar 2024 16:11:52 -0700 Subject: [PATCH] try --- .buildkite/pipeline.yml | 72 ++++++++++++++++++++--------------------- 1 file changed, 36 insertions(+), 36 deletions(-) diff --git a/.buildkite/pipeline.yml b/.buildkite/pipeline.yml index 1c61f19ff..522d48b0b 100644 --- a/.buildkite/pipeline.yml +++ b/.buildkite/pipeline.yml @@ -429,42 +429,42 @@ steps: slurm_mem: 20GB slurm_gpus: 1 - - group: "Bash scripts" - steps: - - label: "Submit and Monitor sbatch Job on Caltech HPC" - # check that (1) the script can be succesfully submitted, (2) it runs successfully - command: | - " - #!/bin/bash - - # # Submit the sbatch script and capture its job ID - # JOB_ID=$(sbatch test/mpi_tests/local_checks.sh | awk '{print $4}') - # echo "Submitted job with ID: $JOB_ID, output log: slurm-$JOB_ID.out" - # START_TIME=$(date +%s) - - # # Loop until the job finishes - # while true; do - # # Check the status of the job - # STATUS=$(squeue -j $JOB_ID | grep $JOB_ID | awk '{print $5}') - # ELAPSED_TIME=$(( $(date +%s) - $START_TIME )) - - # # If the job status is 'PD' (pending) or 'R' (running), wait and continue checking - # if [ "$STATUS" == "PD" ] || [ "$STATUS" == "R" ]; then - # sleep 60 - # echo "Job is still running... Elapsed time: $ELAPSED_TIME seconds." - # # If the job status is 'CF' (completed successfully), print success message and exit - # elif [ "$STATUS" == "CF" ]; then - # echo "Job completed successfully." - # exit 0 - # # If the job status is anything else, print error message and exit - # else - # echo "Error: Job failed or terminated. See slurm-$JOB_ID.out for more information." - # exit 1 - # fi - # done - " - agents: - slurm_ntasks: 1 + # - group: "Bash scripts" + # steps: + # - label: "Submit and Monitor sbatch Job on Caltech HPC" + # # check that (1) the script can be succesfully submitted, (2) it runs successfully + # command: | + # " + # #!/bin/bash + + # # Submit the sbatch script and capture its job ID + # JOB_ID=$(sbatch test/mpi_tests/local_checks.sh | awk '{print $4}') + # echo "Submitted job with ID: $JOB_ID, output log: slurm-$JOB_ID.out" + # START_TIME=$(date +%s) + + # # Loop until the job finishes + # while true; do + # # Check the status of the job + # STATUS=$(squeue -j $JOB_ID | grep $JOB_ID | awk '{print $5}') + # ELAPSED_TIME=$(( $(date +%s) - $START_TIME )) + + # # If the job status is 'PD' (pending) or 'R' (running), wait and continue checking + # if [ "$STATUS" == "PD" ] || [ "$STATUS" == "R" ]; then + # sleep 60 + # echo "Job is still running... Elapsed time: $ELAPSED_TIME seconds." + # # If the job status is 'CF' (completed successfully), print success message and exit + # elif [ "$STATUS" == "CF" ]; then + # echo "Job completed successfully." + # exit 0 + # # If the job status is anything else, print error message and exit + # else + # echo "Error: Job failed or terminated. See slurm-$JOB_ID.out for more information." + # exit 1 + # fi + # done + # " + # agents: + # slurm_ntasks: 1 - wait