Skip to content

Commit

Permalink
Merge pull request #262 from MeetKai/served-model-fix
Browse files (browse the repository at this point in the history)
Fix served-model-name
  • Loading branch information
musab-mk authored Aug 31, 2024
2 parents 856a764 + 441506a commit f76fd97
Showing 1 changed file with 3 additions and 5 deletions.
8 changes: 3 additions & 5 deletions server_vllm.py
Original file line number Diff line number Diff line change
Expand Up @@ -138,13 +138,11 @@ async def create_chat_completion(raw_request: Request):

 logger.info(f"args: {args}")

-if args.served_model_name is not None:
-    logger.info(
-        "args.served_model_name is not used in this service and will be ignored. Served model will consist of args.model only."
-    )
-
 served_model = [args.model]

+if args.served_model_name is not None:
+    served_model += args.served_model_name
+
 engine_args = AsyncEngineArgs.from_cli_args(args)
 # A separate tokenizer to map token IDs to strings.
 tokenizer = get_tokenizer(
Expand Down

0 comments on commit f76fd97

Please sign in to comment.