We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4e2cfc4, commit f8bf2e9 (Copy full SHA for f8bf2e9)
vllm/distributed/device_communicators/custom_all_reduce.py
@@ -286,8 +286,8 @@ def init_custom_quick_allreduce(self):
286
self.create_qr_shared_buffer()
287
if dtype == torch.bfloat16 and not self.use_fp16_kernels:
288
logger.info(
289
- "Custom quick allreduce: converting bf16 to fp16 "
290
- "can speed up qr, "
+ "Custom quick allreduce: converting bf16 inputs to "
+ "fp16 can improve performance, "
291
"set envs.VLLM_ROCM_QR_CAST_BF16_TO_FP16=1 to turn on.")
292
self.qr_disabled = False
293
0 commit comments