Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 2 additions & 3 deletions vllm/model_executor/layers/quantization/fp8.py
Original file line number Diff line number Diff line change
Expand Up @@ -62,10 +62,9 @@ def __init__(
weight_block_size: Optional[list[int]] = None,
) -> None:
super().__init__()

self.is_checkpoint_fp8_serialized = is_checkpoint_fp8_serialized
if is_checkpoint_fp8_serialized:
logger.warning("Detected fp8 checkpoint. Please note that the "
"format is experimental and subject to change.")

if activation_scheme not in ACTIVATION_SCHEMES:
raise ValueError(
f"Unsupported activation scheme {activation_scheme}")
Expand Down
5 changes: 1 addition & 4 deletions vllm/platforms/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -217,11 +217,8 @@ def resolve_current_platform_cls_qualname() -> str:
platform_cls_qualname = func()
if platform_cls_qualname is not None:
activated_plugins.append(name)
logger.info("Platform plugin %s loaded.", name)
logger.warning(
"Platform plugin %s function's return value is None", name)
except Exception:
logger.exception("Failed to load platform plugin %s", name)
pass

activated_builtin_plugins = list(
set(activated_plugins) & set(builtin_platform_plugins.keys()))
Expand Down
22 changes: 13 additions & 9 deletions vllm/plugins/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

import logging
import os
from typing import Callable
from typing import Any, Callable

import torch

Expand All @@ -14,7 +14,7 @@
plugins_loaded = False


def load_plugins_by_group(group: str) -> dict[str, Callable]:
def load_plugins_by_group(group: str) -> dict[str, Callable[[], Any]]:
import sys
if sys.version_info < (3, 10):
from importlib_metadata import entry_points
Expand All @@ -27,23 +27,27 @@ def load_plugins_by_group(group: str) -> dict[str, Callable]:
if len(discovered_plugins) == 0:
logger.debug("No plugins for group %s found.", group)
return {}

logger.info("Available plugins for group %s:", group)
for plugin in discovered_plugins:
logger.info("name=%s, value=%s", plugin.name, plugin.value)
logger.info("- %s -> %s", plugin.name, plugin.value)

if allowed_plugins is None:
logger.info("all available plugins for group %s will be loaded.",
group)
logger.info("set environment variable VLLM_PLUGINS to control"
" which plugins to load.")
plugins = {}
logger.info("All plugins in this group will be loaded. "
"Set `VLLM_PLUGINS` to control which plugins to load.")

plugins = dict[str, Callable[[], Any]]()
for plugin in discovered_plugins:
if allowed_plugins is None or plugin.name in allowed_plugins:
if allowed_plugins is not None:
logger.info("Loading plugin %s", plugin.name)

try:
func = plugin.load()
plugins[plugin.name] = func
logger.info("plugin %s loaded.", plugin.name)
except Exception:
logger.exception("Failed to load plugin %s", plugin.name)

return plugins


Expand Down