We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 953af4f commit 4e6c35a Copy full SHA for 4e6c35a
vllm/model_executor/models/mixtral.py
@@ -54,16 +54,6 @@
54
from vllm.utils import print_warning_once
55
56
57
-def is_sm80(device_id=0):
58
- if not torch.cuda.is_available():
59
- return False
60
- device_properties = torch.cuda.get_device_properties(device_id)
61
- return (device_properties.major == 8 and device_properties.minor == 0)
62
-
63
-if is_sm80():
64
- from vllm.model_executor.layers.fused_moe import ampere_fp8_fused_moe
65
- fused_moe = ampere_fp8_fused_moe
66
67
logger = logging.get_logger(__name__)
68
69
0 commit comments