Skip to content

Commit

Permalink
benchmark failing because of lack of flag
Browse files Browse the repository at this point in the history
Specifically the privileged flag, because it's not present in the args
object.

Signed-off-by: Eric Curtin <ecurtin@redhat.com>
  • Loading branch information
ericcurtin committed Feb 26, 2025
1 parent 56e3a71 commit 2e9079c
Showing 1 changed file with 6 additions and 8 deletions.
14 changes: 6 additions & 8 deletions ramalama/cli.py
Original file line number Diff line number Diff line change
Expand Up @@ -452,14 +452,8 @@ def add_network_argument(parser, dflt="none"):

def bench_parser(subparsers):
    """Register the ``bench`` subcommand (alias ``benchmark``) on *subparsers*.

    The subcommand receives the options added by
    ``bench_run_serve_perplexity_args`` and ``add_network_argument``, a
    positional ``MODEL`` argument, and dispatches to ``bench_cli`` through
    the ``func`` default.
    """
    parser = subparsers.add_parser("bench", aliases=["benchmark"], help="benchmark specified AI Model")
    # Options shared with the other model-running commands come from the
    # common helper rather than being declared one by one here.
    bench_run_serve_perplexity_args(parser)
    add_network_argument(parser)
    # NOTE(review): "--ngl" is intentionally not registered here. The diff
    # this block comes from drops the local registration (the hunk shrinks
    # from 14 to 8 lines); presumably the shared helper provides it, in
    # which case declaring it again would make argparse raise a
    # conflicting-option error -- confirm against the helper's full body.
    parser.add_argument("MODEL")  # positional argument
    parser.set_defaults(func=bench_cli)

Expand Down Expand Up @@ -781,14 +775,18 @@ def push_cli(args):


def run_serve_perplexity_args(parser):
    """Add the shared helper's options plus ``-c/--ctx-size`` to *parser*.

    Everything registered by ``bench_run_serve_perplexity_args`` is added
    first; this function then contributes only the context-size option,
    stored on the parsed namespace as ``context``.
    """
    # "--authfile" is registered by bench_run_serve_perplexity_args. Adding
    # it here as well would register the same option string twice on one
    # parser, which argparse rejects with a conflicting-option error.
    bench_run_serve_perplexity_args(parser)
    parser.add_argument(
        "-c",
        "--ctx-size",
        dest="context",
        # Falls back to 2048 when the config has no 'ctx_size' entry.
        default=config.get('ctx_size', 2048),
        help="size of the prompt context (0 = loaded from model)",
    )


def bench_run_serve_perplexity_args(parser):
parser.add_argument("--authfile", help="path of the authentication file")
parser.add_argument(
"--device", dest="device", action='append', type=str, help="device to leak in to the running container"
)
Expand Down

0 comments on commit 2e9079c

Please sign in to comment.