Skip to content

Commit

Permalink
Move --skip-decode to model cli helper
Browse files (browse the repository at this point in the history)
Signed-off-by: aviator19941 <avinash.sharma@amd.com>
  • Loading branch information
aviator19941 committed Nov 16, 2024
1 parent 9b3f92a commit 2244b9e
Show file tree
Hide file tree
Showing 2 changed files with 5 additions and 11 deletions.
11 changes: 0 additions & 11 deletions sharktank/sharktank/examples/export_paged_llm_v1.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,17 +54,6 @@ def main():
help="Enables strictness during export",
action="store_true",
)
parser.add_argument(
"--attention-kernel",
type=str,
default="decomposed",
choices=["decomposed", "torch"],
)
parser.add_argument(
"--skip-decode",
help="Enables prefill only, skips decode",
action="store_true",
)

cli.add_quantization_options(parser)
cli.add_model_options(parser)
Expand Down
5 changes: 5 additions & 0 deletions sharktank/sharktank/utils/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -69,6 +69,11 @@ def add_model_options(parser: argparse.ArgumentParser):
default="decomposed",
choices=["decomposed", "torch"],
)
parser.add_argument(
"--skip-decode",
help="Enables prefill only, skips decode",
action="store_true",
)


def add_quantization_options(parser: argparse.ArgumentParser):
Expand Down

0 comments on commit 2244b9e

Please sign in to comment.