We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
is_first_step_output
1 parent de9fb4b, commit c6cf929 (Copy full SHA for c6cf929)
vllm/worker/tpu_model_runner.py
@@ -541,7 +541,8 @@ def execute_model(
541
seq_group_metadata_list=ctx.seq_group_metadata_list,
542
scheduler_outputs=ctx.scheduler_outputs,
543
is_async=False,
544
- is_last_step=False)
+ is_last_step=False,
545
+ is_first_step_output=i == 0)
546
model_input.async_callback()
547
if use_async_out_proc:
548
return [sampler_outputs[-1]]
0 commit comments