Skip to content

Commit

Permalink
Merge pull request #445 from pepkit/dev_change_lump
Browse files Browse the repository at this point in the history
Change lump parameters, add --lump-j
  • Loading branch information
donaldcampbelljr authored Jan 24, 2024
2 parents 2ff91e3 + 6549740 commit 191dc54
Show file tree
Hide file tree
Showing 5 changed files with 52 additions and 7 deletions.
5 changes: 5 additions & 0 deletions docs/changelog.md
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,11 @@ This project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.htm

### Added
- `--portable` flag to looper report
- `--lump-j` allows grouping samples into a defined number of jobs

### Changed
- `--lumpn` is now `--lump-n`
- `--lump` is now `--lump-s`

## [1.6.0] -- 2023-12-22

Expand Down
16 changes: 12 additions & 4 deletions looper/cli_looper.py
Original file line number Diff line number Diff line change
Expand Up @@ -219,19 +219,27 @@ def add_subparser(cmd):
for subparser in [run_subparser, rerun_subparser]:
subparser.add_argument(
"-u",
"--lump",
"--lump-s",
default=None,
metavar="X",
type=html_range(min_val=0, max_val=100, step=0.1, value=0),
help="Total input file size (GB) to batch into one job",
help="Lump by size: total input file size (GB) to batch into one job",
)
subparser.add_argument(
"-n",
"--lumpn",
"--lump-n",
default=None,
metavar="N",
type=html_range(min_val=1, max_val="num_samples", value=1),
help="Number of commands to batch into one job",
help="Lump by number: number of samples to batch into one job",
)
subparser.add_argument(
"-j",
"--lump-j",
default=None,
metavar="J",
type=int,
help="Lump samples into number of jobs.",
)

check_subparser.add_argument(
Expand Down
14 changes: 14 additions & 0 deletions looper/conductor.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@
import subprocess
import time
import yaml
from math import ceil
from copy import copy, deepcopy
from json import loads
from subprocess import check_output
Expand Down Expand Up @@ -132,6 +133,7 @@ def __init__(
compute_variables=None,
max_cmds=None,
max_size=None,
max_jobs=None,
automatic=True,
collate=False,
):
Expand Down Expand Up @@ -166,6 +168,8 @@ def __init__(
include in a single job script.
:param int | float | NoneType max_size: Upper bound on total file
size of inputs used by the commands lumped into single job script.
:param int | float | NoneType max_jobs: Upper bound on total number of jobs to
group samples for submission.
:param bool automatic: Whether the submission should be automatic once
the pool reaches capacity.
:param bool collate: Whether a collate job is to be submitted (runs on
Expand Down Expand Up @@ -200,6 +204,16 @@ def __init__(
"{}".format(self.extra_pipe_args)
)

if max_jobs:
if max_jobs == 0 or max_jobs < 0:
raise ValueError(
"If specified, max job command count must be a positive integer, greater than zero."
)

num_samples = len(self.prj.samples)
samples_per_job = num_samples / max_jobs
max_cmds = ceil(samples_per_job)

if not self.collate:
self.automatic = automatic
if max_cmds is None and max_size is None:
Expand Down
5 changes: 3 additions & 2 deletions looper/looper.py
Original file line number Diff line number Diff line change
Expand Up @@ -404,8 +404,9 @@ def __call__(self, args, rerun=False, **compute_kwargs):
extra_args=args.command_extra,
extra_args_override=args.command_extra_override,
ignore_flags=args.ignore_flags,
max_cmds=args.lumpn,
max_size=args.lump,
max_cmds=args.lump_n,
max_size=args.lump_s,
max_jobs=args.lump_j,
)
submission_conductors[piface.pipe_iface_file] = conductor

Expand Down
19 changes: 18 additions & 1 deletion tests/smoketests/test_run.py
Original file line number Diff line number Diff line change
Expand Up @@ -439,14 +439,31 @@ def test_looper_run_produces_submission_scripts(self, prep_temp_pep):

def test_looper_lumping(self, prep_temp_pep):
tp = prep_temp_pep
x = test_args_expansion(tp, "run", ["--lumpn", "2"])
x = test_args_expansion(tp, "run", ["--lump-n", "2"])
try:
main(test_args=x)
except Exception:
raise pytest.fail("DID RAISE {0}".format(Exception))
sd = os.path.join(get_outdir(tp), "submission")
verify_filecount_in_dir(sd, ".sub", 4)

def test_looper_lumping_jobs(self, prep_temp_pep):
tp = prep_temp_pep
x = test_args_expansion(tp, "run", ["--lump-j", "1"])
try:
main(test_args=x)
except Exception:
raise pytest.fail("DID RAISE {0}".format(Exception))
sd = os.path.join(get_outdir(tp), "submission")
verify_filecount_in_dir(sd, ".sub", 2)

def test_looper_lumping_jobs_negative(self, prep_temp_pep):
tp = prep_temp_pep
x = test_args_expansion(tp, "run", ["--lump-j", "-1"])

with pytest.raises(ValueError):
main(test_args=x)

def test_looper_limiting(self, prep_temp_pep):
tp = prep_temp_pep
x = test_args_expansion(tp, "run", ["--limit", "2"])
Expand Down

0 comments on commit 191dc54

Please sign in to comment.