We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 0f4f019, commit 14e2b07 (Copy full SHA for 14e2b07)
vllm/v1/attention/backends/mla/cutlass_mla.py
@@ -21,7 +21,7 @@
 
 class CutlassMLAMetadataBuilder(MLACommonMetadataBuilder[MLACommonMetadata]):
     # enable full CUDA Graph support for decode-only capture
-    attn_cudagraph_support: ClassVar[
+    cudagraph_support: ClassVar[
         AttentionCGSupport] = AttentionCGSupport.UNIFORM_SINGLE_TOKEN_DECODE
 
 
0 commit comments