From 16708256b803861544fe4904961c9cdaa1e52fab Mon Sep 17 00:00:00 2001
From: Wuwei Lin
Date: Mon, 29 Jul 2024 17:37:16 -0700
Subject: [PATCH] Turn on custom allreduce by default in O3

---
 python/mlc_llm/interface/compiler_flags.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/python/mlc_llm/interface/compiler_flags.py b/python/mlc_llm/interface/compiler_flags.py
index 28c9cf4e54..aa2dc4ebd4 100644
--- a/python/mlc_llm/interface/compiler_flags.py
+++ b/python/mlc_llm/interface/compiler_flags.py
@@ -205,5 +205,6 @@ def from_str(source: str) -> "ModelConfigOverride":
         faster_transformer=True,
         cudagraph=True,
         cutlass=True,
+        ipc_allreduce_strategy=IPCAllReduceStrategyType.AUTO,
     ),
 }