Skip to content

Commit

Permalink
fix
Browse files: browse the repository at this point in the history
  • Loading branch information
jeffrey-fong committed Aug 31, 2024
1 parent 856a764 commit 441506a
Showing 1 changed file with 3 additions and 5 deletions.
8 changes: 3 additions & 5 deletions server_vllm.py
Original file line number Diff line number Diff line change
Expand Up @@ -138,13 +138,11 @@ async def create_chat_completion(raw_request: Request):

logger.info(f"args: {args}")

if args.served_model_name is not None:
logger.info(
"args.served_model_name is not used in this service and will be ignored. Served model will consist of args.model only."
)

served_model = [args.model]

if args.served_model_name is not None:
served_model += args.served_model_name

engine_args = AsyncEngineArgs.from_cli_args(args)
# A separate tokenizer to map token IDs to strings.
tokenizer = get_tokenizer(
Expand Down

0 comments on commit 441506a

Please sign in to comment.