Skip to content

Commit 0716e0d

Browse files
committed
fixup! feat: Add user-provided speculative decoding support
Signed-off-by: Robin Kobus <[email protected]>
1 parent c5c77c4 commit 0716e0d

File tree

1 file changed

+1
-3
lines changed
  • tests/unittest/api_stability/references_committed

1 file changed

+1
-3
lines changed

tests/unittest/api_stability/references_committed/llm.yaml

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -66,9 +66,7 @@ methods:
66 66
default: null
67 67
# Speculative decoding
68 68
speculative_config:
69-
annotation: Union[tensorrt_llm.llmapi.llm_args.LookaheadDecodingConfig, tensorrt_llm.llmapi.llm_utils.MedusaDecodingConfig,
70-
tensorrt_llm.llmapi.llm_utils.EagleDecodingConfig, tensorrt_llm.llmapi.MTPDecodingConfig, tensorrt_llm.llmapi.llm_args.NGramDecodingConfig,
71-
tensorrt_llm.llmapi.llm_args.DraftTargetDecodingConfig, NoneType]
69+
annotation: Union[tensorrt_llm.llmapi.llm_args.DraftTargetDecodingConfig, tensorrt_llm.llmapi.llm_args.EagleDecodingConfig,tensorrt_llm.llmapi.llm_args.LookaheadDecodingConfig, tensorrt_llm.llmapi.llm_args.MedusaDecodingConfig, tensorrt_llm.llmapi.llm_args.MTPDecodingConfig, tensorrt_llm.llmapi.llm_args.NGramDecodingConfig, tensorrt_llm.llmapi.llm_args.UserProvidedDecodingConfig, NoneType]
72 70
default: null
73 71
# generation constraints
74 72
max_batch_size:

0 commit comments

Comments
 (0)