We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent b6e3057, commit 4b2dd14 (Copy full SHA for 4b2dd14)
vllm/spec_decode/spec_decode_worker.py
@@ -10,6 +10,7 @@
10
11
from vllm.config import ParallelConfig, SpeculativeConfig, VllmConfig
12
from vllm.distributed.communication_op import (broadcast_tensor_dict,
13
+ get_tp_group,
14
tensor_model_parallel_gather)
15
from vllm.logger import init_logger
16
from vllm.model_executor.layers.rejection_sampler import RejectionSampler
@@ -365,7 +366,7 @@ def init_device(self) -> None:
365
366
target_lm_head_weight)
367
368
self._metrics.init_tensors(self.rank, device_type=self.device)
- self.spec_decode_sampler.init_tensors(self.rank,
369
+ self.spec_decode_sampler.init_tensors(get_tp_group().local_rank,
370
device_type=self.device)
371
372
scorer_cls: Type[SpeculativeScorer]
0 commit comments