Skip to content

Commit

Permalink
Follow-up on PR#75: update run.py accordingly (#80)
Browse files Browse the repository at this point in the history
fix
  • Loading branch information
sunggg authored Nov 22, 2023
1 parent dc928f9 commit baa4fa6
Showing 1 changed file with 3 additions and 3 deletions.
6 changes: 3 additions & 3 deletions serve/mlc_serve/run.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,8 +31,8 @@ def parse_args():
args.add_argument("--local-id", type=str, required=True)
args.add_argument("--artifact-path", type=str, default="dist")
args.add_argument("--use-staging-engine", action="store_true")
-args.add_argument("--max-num-batched-tokens", type=int, default=-1)
-args.add_argument("--max-input-len", type=int, default=-1)
+args.add_argument("--max-num-sequences", type=int, default=8)
+args.add_argument("--max-input-len", type=int, default=512)
args.add_argument("--min-decode-steps", type=int, default=12)
args.add_argument("--max-decode-steps", type=int, default=16)
args.add_argument("--prompt-allocate-ratio", type=float, default=2.0)
Expand Down Expand Up @@ -90,7 +90,7 @@ def create_engine(
# Set the engine config
engine_config = get_engine_config({
"use_staging_engine": args.use_staging_engine,
-"max_num_batched_tokens": args.max_num_batched_tokens,
+"max_num_sequences": args.max_num_sequences,
"max_input_len": args.max_input_len,
"min_decode_steps": args.min_decode_steps,
"max_decode_steps": args.max_decode_steps,
Expand Down

0 comments on commit baa4fa6

Please sign in to comment.