Skip to content

Commit 2ee4bdb

Browse files
committed
Allow queuing up to queued_requests_limit in one scheduler loop
Signed-off-by: Samuel Monson <[email protected]>
1 parent 89b501f commit 2ee4bdb

File tree

2 files changed

+3
-4
lines changed

2 files changed

+3
-4
lines changed

src/guidellm/config.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -136,7 +136,7 @@ class Settings(BaseSettings):
136136
# use number of CPUs - 1, but at least 10
137137
default_factory=lambda: max((os.cpu_count() or 1) - 1, 10)
138138
)
139-
max_add_requests_per_loop: int = 20
139+
min_queued_requests: int = 20
140140
scheduler_start_delay: float = 5
141141

142142
# Data settings

src/guidellm/scheduler/scheduler.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -140,7 +140,6 @@ async def run(
140140
queues.requests,
141141
times_iter,
142142
run_info,
143-
loop_limit=run_info.strategy.queued_requests_limit,
144143
)
145144
# Wait for the test to start
146145
await asyncio.sleep(time.time() - scheduling_strategy.start_time)
@@ -296,14 +295,14 @@ def _add_requests(
296295
requests_queue: Queue[WorkerProcessRequest[RequestT, ResponseT]],
297296
times_iter: Iterator[float],
298297
run_info: SchedulerRunInfo,
299-
loop_limit: Optional[int] = None,
300298
) -> Optional[Iterator[Any]]:
301299
if requests_iter is not None:
302300
try:
303301
added_count = 0
304302

305303
while not requests_queue.full() and added_count < (
306-
loop_limit or settings.max_add_requests_per_loop
304+
run_info.strategy.queued_requests_limit
305+
or settings.min_queued_requests
307306
):
308307
if run_info.created_requests >= run_info.end_number:
309308
raise StopIteration

0 commit comments

Comments
 (0)