@@ -40,7 +40,7 @@ def executor_queue(mock_dist):
4040 max_beam_width = 1 ,
4141 max_num_active_requests = 16 ,
4242 enable_iter_perf_stats = True ,
43- batch_wait_timeout = 0.0 ,
43+ batch_wait_timeout_ms = 0.0 ,
4444 is_disaggregated = False )
4545
4646
@@ -53,7 +53,7 @@ def integration_queue(mock_dist):
5353 max_beam_width = 2 ,
5454 max_num_active_requests = 8 ,
5555 enable_iter_perf_stats = True ,
56- batch_wait_timeout = 0.0 ,
56+ batch_wait_timeout_ms = 0.0 ,
5757 is_disaggregated = False )
5858
5959
@@ -228,8 +228,8 @@ def add_requests_after_delay(delay, num_requests):
228228 item = RequestQueueItem (i + 10 , Mock ())
229229 executor_queue .request_queue .put (item )
230230
231- # Test 1: Without batch_wait_timeout (should only get initial requests)
232- executor_queue .batch_wait_timeout = 0.0
231+ # Test 1: Without batch_wait_timeout_ms (should only get initial requests)
232+ executor_queue .batch_wait_timeout_ms = 0.0
233233
234234 initial_requests = 3
235235 for i in range (initial_requests ):
@@ -250,8 +250,8 @@ def add_requests_after_delay(delay, num_requests):
250250
251251 thread .join ()
252252
253- # Test 2: With batch_wait_timeout (should wait and get all requests)
254- executor_queue .batch_wait_timeout = 0.2
253+ # Test 2: With batch_wait_timeout_ms (should wait and get all requests)
254+ executor_queue .batch_wait_timeout_ms = 200.0
255255
256256 # Clear the queue and add initial requests again
257257 while not executor_queue .request_queue .empty ():
@@ -268,7 +268,7 @@ def add_requests_after_delay(delay, num_requests):
268268 thread = threading .Thread (target = add_requests_after_delay , args = (0.05 , 3 ))
269269 thread .start ()
270270
271- # Get requests with batch_wait_timeout - should wait and get all
271+ # Get requests with batch_wait_timeout_ms - should wait and get all
272272 start_time = time .time ()
273273 items = executor_queue ._get_from_request_queue (None )
274274 elapsed = time .time () - start_time
@@ -442,7 +442,7 @@ def attention_dp_queue(mock_dist_attention_dp):
442442 max_beam_width = 2 ,
443443 max_num_active_requests = 8 ,
444444 enable_iter_perf_stats = True ,
445- batch_wait_timeout = 0.0 ,
445+ batch_wait_timeout_ms = 0.0 ,
446446 is_disaggregated = False )
447447 # Initialize all_ranks_num_active_requests
448448 return queue
0 commit comments