From 7f0c5361bc27c73813fdf15f7bc4e42cc442ccf5 Mon Sep 17 00:00:00 2001 From: Isotr0py <2037008807@qq.com> Date: Thu, 3 Oct 2024 21:33:12 +0800 Subject: [PATCH] fix cpu decoding --- vllm/worker/cpu_model_runner.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/vllm/worker/cpu_model_runner.py b/vllm/worker/cpu_model_runner.py index cebb0f36a2b2..534d167d994f 100644 --- a/vllm/worker/cpu_model_runner.py +++ b/vllm/worker/cpu_model_runner.py @@ -133,7 +133,7 @@ def build(self) -> ModelInputForCPU: (input_tokens, input_positions, attn_metadata) = self._prepare_decode( self.seq_group_metadata_list) - seq_lens = [] + seq_lens = None return self.model_input_cls( input_tokens=input_tokens,