4 files changed +26 -17
lines changed Original file line number Diff line number Diff line change 40
40
BenchmarkerProgressGroup ,
41
41
GenerativeConsoleBenchmarkerProgress ,
42
42
)
43
+ from .scheduler_registry import scheduler_register_benchmark_objects
44
+
45
+ scheduler_register_benchmark_objects ()
43
46
44
47
__all__ = [
45
48
"Aggregator" ,
Original file line number Diff line number Diff line change
1
+ from guidellm .backend import (
2
+ GenerationRequest ,
3
+ GenerationRequestTimings ,
4
+ GenerationResponse ,
5
+ )
6
+ from guidellm .scheduler import ScheduledRequestInfo , SchedulerMessagingPydanticRegistry
7
+
8
+ __all__ = ["scheduler_register_benchmark_objects" ]
9
+
10
+
11
def scheduler_register_benchmark_objects():
    """Register the benchmark message models with the scheduler registry.

    Each model class is passed to the decorator returned by
    ``SchedulerMessagingPydanticRegistry.register(<key>)``, where the key is
    the string form of the class name. Registration order is fixed:
    request, response, request timings, then scheduled request info.
    """
    # (registry key, model class) pairs, listed in registration order.
    registrations = (
        ("GenerationRequest", GenerationRequest),
        ("GenerationResponse", GenerationResponse),
        ("GenerationRequestTimings", GenerationRequestTimings),
        ("ScheduledRequestInfo", ScheduledRequestInfo),
    )
    for key, model in registrations:
        # ``register`` is used in its decorator form: it returns a callable
        # that is then applied to the class being registered.
        decorate = SchedulerMessagingPydanticRegistry.register(key)
        decorate(model)
Original file line number Diff line number Diff line change @@ -129,6 +129,7 @@ async def run(
129
129
worker_group = WorkerProcessGroup [
130
130
RequestT , MeasuredRequestTimingsT , ResponseT
131
131
](
132
+ requests = None ,
132
133
cycle_requests = local_requests ,
133
134
backend = backend ,
134
135
strategy = local_strategy ,
Original file line number Diff line number Diff line change @@ -578,6 +578,7 @@ def _locked_update(
578
578
self ._internal_constraints .update (add_constraints )
579
579
if update_constraints :
580
580
self ._update_with_constraints (info )
581
+ self ._state .end_time = time .time ()
581
582
state_copy : SchedulerState = self ._state .model_copy ()
582
583
583
584
return (
@@ -588,23 +589,6 @@ def _locked_update(
588
589
),
589
590
)
590
591
591
- def _locked_cancel_request (
592
- self , info : ScheduledRequestInfo [MeasuredRequestTimingsT ]
593
- ):
594
- if info .status != "queued" :
595
- raise ValueError (f"Cannot cancel request in { info .status } state" )
596
-
597
- with self ._update_lock :
598
- self ._state .queued_requests -= 1
599
- self ._state .processed_requests += 1
600
- self ._state .cancelled_requests += 1
601
-
602
- info .status = "cancelled"
603
- info .scheduler_timings .resolve_end = time .time ()
604
- state_copy : SchedulerState = self ._state .model_copy ()
605
-
606
- return state_copy
607
-
608
592
def _update_new_request (self ):
609
593
self ._state .created_requests += 1
610
594
self ._state .queued_requests += 1
You can’t perform that action at this time.
0 commit comments