Skip to content

Commit d1fa2f2

Browse files
committed
fix_test_auto_prefix_cache_support
Signed-off-by: Huamin Li <3ericli@gmail.com>
1 parent da554f9 commit d1fa2f2

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

tests/models/language/pooling/test_auto_prefix_cache_support.py

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,8 @@ def test_classify_models(
     with vllm_runner(model,
                      max_model_len=512,
                      dtype=dtype,
-                     enable_prefix_caching=True) as vllm_model:
+                     enable_prefix_caching=True,
+                     enable_chunked_prefill=True) as vllm_model:
         cache_config = vllm_model.llm.llm_engine.cache_config
         assert cache_config.enable_prefix_caching
         vllm_outputs = vllm_model.classify(example_prompts)
@@ -63,6 +64,7 @@ def test_embed_models(
         runner="pooling",
         max_model_len=None,
         enable_prefix_caching=True,
+        enable_chunked_prefill=True,
     ) as vllm_model:
         cache_config = vllm_model.llm.llm_engine.cache_config
         assert cache_config.enable_prefix_caching

0 commit comments

Comments
 (0)