@@ -76,11 +76,11 @@ def test_get_num_unfinished_requests():
7676@pytest .mark .parametrize (
7777 "enable_prefix_caching, prompt_logprobs" ,
7878 [
79- (None , None ),
79+ (False , None ),
8080 (True , 5 ),
8181 ],
8282)
83- def test_schedule (enable_prefix_caching : bool | None , prompt_logprobs : int | None ):
83+ def test_schedule (enable_prefix_caching : bool , prompt_logprobs : int | None ):
8484 """Test scheduling.
8585 Two cases: APC=False/no prompt logprobs; APC=True + prompt logprobs
8686 """
@@ -582,12 +582,12 @@ def test_check_stop_min_tokens():
582582@pytest .mark .parametrize (
583583 "enable_prefix_caching, prompt_logprobs" ,
584584 [
585- (None , None ),
585+ (False , None ),
586586 (True , 5 ),
587587 ],
588588)
589589def test_schedule_concurrent_batches (
590- enable_prefix_caching : bool | None , prompt_logprobs : int | None
590+ enable_prefix_caching : bool , prompt_logprobs : int | None
591591):
592592 scheduler = create_scheduler (
593593 max_num_batched_tokens = 1024 ,
@@ -1425,7 +1425,7 @@ def create_scheduler_with_priority(
14251425 model : str = "facebook/opt-125m" ,
14261426 max_num_seqs : int = 16 ,
14271427 max_num_batched_tokens : int = 8192 ,
1428- enable_prefix_caching : bool | None = None ,
1428+ enable_prefix_caching : bool = False ,
14291429 long_prefill_token_threshold : int = 0 ,
14301430 disable_chunked_mm_input : bool = False ,
14311431 use_kv_connector : bool = False ,
@@ -1444,7 +1444,7 @@ def create_scheduler_with_priority(
14441444 max_num_batch_tokens: max num tokens to batch
14451445 enable_prefix_caching: optionally force APC config
14461446 (True/False) or use default
1447- (None )
1447+ (False )
14481448
14491449 Returns:
14501450 {class}`Scheduler` instance with priority scheduling
@@ -1467,17 +1467,12 @@ def create_scheduler_with_priority(
14671467 seed = 42 ,
14681468 )
14691469 # Cache config; APC is always set explicitly from enable_prefix_caching
1470- kwargs_cache = (
1471- {}
1472- if enable_prefix_caching is None
1473- else {"enable_prefix_caching" : enable_prefix_caching }
1474- )
14751470 cache_config = CacheConfig (
14761471 block_size = block_size ,
14771472 gpu_memory_utilization = 0.9 ,
14781473 swap_space = 0 ,
14791474 cache_dtype = "auto" ,
1480- ** kwargs_cache ,
1475+ enable_prefix_caching = enable_prefix_caching ,
14811476 )
14821477 kv_transfer_config = (
14831478 KVTransferConfig (
0 commit comments