-
-
Notifications
You must be signed in to change notification settings - Fork 11k
Description
I ran into the following error when calling `llm.generate`:
```
    outputs = llm.generate(prompts, sampling_params)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/entrypoints/llm.py", line 165, in generate
    return self._run_engine(use_tqdm)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/entrypoints/llm.py", line 185, in _run_engine
    step_outputs = self.llm_engine.step()
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/engine/llm_engine.py", line 628, in step
    all_outputs = self._run_workers(
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/engine/llm_engine.py", line 795, in _run_workers
    driver_worker_output = getattr(self.driver_worker,
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/torch/utils/_contextlib.py", line 115, in decorate_context
    return func(*args, **kwargs)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/worker/worker.py", line 183, in execute_model
    self.cache_swap(*block_swapping_info)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/worker/worker.py", line 139, in cache_swap
    self.cache_engine.swap_in(blocks_to_swap_in)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/worker/cache_engine.py", line 131, in swap_in
    self._swap(self.cpu_cache, self.gpu_cache, src_to_dst)
  File "/home/ma-user/anaconda3/envs/py39/lib/python3.9/site-packages/vllm/worker/cache_engine.py", line 123, in _swap
    cache_ops.swap_blocks(src_key_cache, dst_key_cache, src_to_dst)
RuntimeError: t == DeviceType::CUDA INTERNAL ASSERT FAILED at "/opt/hostedtoolcache/Python/3.9.18/x64/lib/python3.9/site-packages/torch/include/c10/cuda/impl/CUDAGuardImpl.h":25, please report a bug to PyTorch.
```