We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 04bcde1 commit dab72bf
Copy full SHA for dab72bf
vllm/config/__init__.py
@@ -364,9 +364,11 @@ def __post_init__(self):
364
self.compilation_config.cudagraph_mode = \
365
CUDAGraphMode.FULL_AND_PIECEWISE
366
367
- # pooling model does not support full cudagraphs
+ # pooling models and encoder-decoder models
368
+ # do not support full cudagraphs
369
if self.model_config is not None and \
- self.model_config.pooler_config is not None:
370
+ (self.model_config.pooler_config is not None
371
+ or self.model_config.is_encoder_decoder):
372
self.compilation_config.cudagraph_mode = \
373
CUDAGraphMode.PIECEWISE
374
else:
0 commit comments