diff --git a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_genpp2.yaml b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_genpp2.yaml index 293e3e604a8..b7f03c0f9f5 100644 --- a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_genpp2.yaml +++ b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_genpp2.yaml @@ -14,6 +14,7 @@ context_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT @@ -29,6 +30,7 @@ generation_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT diff --git a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_gentp2.yaml b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_gentp2.yaml index 67f41bc7e50..892b4e8b31f 100644 --- a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_gentp2.yaml +++ b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp2_gentp2.yaml @@ -14,6 +14,7 @@ context_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT diff --git a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp4_genpp4.yaml b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp4_genpp4.yaml index 35716921234..2c7a67e1cbf 100644 --- a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp4_genpp4.yaml +++ b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxpp4_genpp4.yaml @@ -14,6 +14,7 @@ context_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT @@ -29,6 +30,7 @@ generation_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT diff --git a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxtp2pp2_gentp2pp2.yaml b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxtp2pp2_gentp2pp2.yaml index db62a89cf76..ce47009aaad 100644 --- a/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxtp2pp2_gentp2pp2.yaml +++ b/tests/integration/defs/disaggregated/test_configs/disagg_config_ctxtp2pp2_gentp2pp2.yaml @@ -14,6 +14,7 @@ context_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT @@ -29,6 +30,7 @@ generation_servers: kv_cache_config: free_gpu_memory_fraction: 0.2 enable_partial_reuse: False + enable_block_reuse: False disable_overlap_scheduler: True cache_transceiver_config: backend: DEFAULT