Skip to content

Commit a0b47f0

Browse files
committed
minor
Signed-off-by: Fridah-nv <201670829+Fridah-nv@users.noreply.github.com>
1 parent 8e14fcf commit a0b47f0

1 file changed

Lines changed: 0 additions & 3 deletions

File tree

examples/llm_autodeploy/api_server.py

Lines changed: 0 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,6 @@
21 21
import uvicorn
22 22
from fastapi import FastAPI, HTTPException
23 23
from tensorrt_llm._torch.auto_deploy import LLM
24 -
from tensorrt_llm.builder import BuildConfig
25 24
from tensorrt_llm.llmapi.llm import RequestOutput
26 25
from tensorrt_llm.sampling_params import SamplingParams
27 26
from tensorrt_llm.serve.openai_protocol import (
@@ -45,8 +44,6 @@ def build_runner_from_config(args) -> LLM:
45 44
"""Builds a model runner from our config."""
46 45
mto.enable_huggingface_checkpointing()
47 46
model_kwargs = {"max_position_embeddings": args.max_seq_len, "use_cache": False}
48 -
build_config = BuildConfig(max_seq_len=args.max_seq_len, max_batch_size=args.max_batch_size)
49 -
build_config.plugin_config.tokens_per_block = args.max_seq_len
50 47

51 48
llm = LLM(
52 49
model=args.ckpt_path,

0 commit comments

Comments
 (0)