Remove unused import

ajrasane · ajrasane · commit 58302a4a1660 · 2025-08-14T21:56:27.000Z
Signed-off-by: ajrasane <131806219+ajrasane@users.noreply.github.com>
diff --git a/tensorrt_llm/bench/benchmark/throughput.py b/tensorrt_llm/bench/benchmark/throughput.py
@@ -450,6 +450,7 @@ def ignore_trt_only_args(kwargs: dict):
         elif runtime_config.backend == "_autodeploy":
             ignore_trt_only_args(kwargs)
             kwargs["world_size"] = kwargs.pop("tensor_parallel_size", None)
+
             llm = AutoDeployLLM(**kwargs)
         else:
             llm = LLM(**kwargs)
diff --git a/tests/integration/defs/accuracy/test_llm_api_autodeploy.py b/tests/integration/defs/accuracy/test_llm_api_autodeploy.py
@@ -17,8 +17,6 @@
 
 from tensorrt_llm import LLM
 from tensorrt_llm._torch.auto_deploy import LLM as AutoDeployLLM
-from tensorrt_llm.llmapi.llm_args import (CapacitySchedulerPolicy,
-                                          ContextChunkingPolicy)
 from tensorrt_llm.quantization import QuantAlgo
 from tensorrt_llm.sampling_params import SamplingParams
 
@@ -40,7 +38,7 @@ def get_default_kwargs(self):
             'max_batch_size': 512,
             # 131072 is the max seq len for the model
             'max_seq_len': 8192,
-            # max num tokens is derived in the build_config, which is not used by AutoDeploy llmargs. 
+            # max num tokens is derived in the build_config, which is not used by AutoDeploy llmargs.
             # Set it explicitly here to 8192 which is the default in build_config.
             'max_num_tokens': 8192,
             'skip_loading_weights': False,