We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f5d3acd, commit 53be4a8 (Copy full SHA for 53be4a8)
vllm/config.py
@@ -1146,7 +1146,7 @@ def _verify_prefix_caching(self) -> None:
1146
if not self.enable_prefix_caching:
1147
return
1148
1149
- if self.sliding_window is not None:
+ if self.sliding_window is not None and not envs.VLLM_USE_V1:
1150
raise NotImplementedError(
1151
"Prefix caching is not supported with sliding window. "
1152
"Run with --disable-sliding-window to use prefix caching.")
0 commit comments