Skip to content

Commit

Permalink
🐛 fixup args.max_logprobs
Browse files Browse the repository at this point in the history
Signed-off-by: Joe Runde <[email protected]>
  • Loading branch information
joerunde committed Mar 28, 2024
1 parent a97f2bf commit 74b3785
Showing 1 changed file with 7 additions and 0 deletions.
7 changes: 7 additions & 0 deletions vllm/tgis_utils/args.py
Original file line number Diff line number Diff line change
@@ -1,6 +1,10 @@
import argparse
import os

from vllm.entrypoints.grpc.validation import MAX_TOP_N_TOKENS
from vllm.logger import init_logger

# Module-level logger, obtained from init_logger using this module's __name__.
logger = init_logger(__name__)

def _to_env_var(arg_name: str):
return arg_name.upper().replace("-", "_")
Expand Down Expand Up @@ -105,5 +109,8 @@ def postprocess_tgis_args(args: argparse.Namespace) -> argparse.Namespace:
"Inconsistent tensor_parallel_size and num_gpus/num_shard "
"arg values")
args.tensor_parallel_size = num_gpus
if args.max_logprobs < MAX_TOP_N_TOKENS + 1:
logger.info("Setting max_logprobs to %d", MAX_TOP_N_TOKENS + 1)
args.max_logprobs = MAX_TOP_N_TOKENS + 1

return args

0 comments on commit 74b3785

Please sign in to comment.