mirror of
https://github.com/vllm-project/vllm.git
synced 2025-10-20 14:53:52 +08:00
[Misc] Add deprecation warning for beam search (#6402)
This commit is contained in:
@ -41,6 +41,7 @@ if TYPE_CHECKING:
|
||||
NVCC_THREADS: Optional[str] = None
|
||||
VLLM_USE_PRECOMPILED: bool = False
|
||||
VLLM_INSTALL_PUNICA_KERNELS: bool = False
|
||||
VLLM_NO_DEPRECATION_WARNING: bool = False
|
||||
CMAKE_BUILD_TYPE: Optional[str] = None
|
||||
VERBOSE: bool = False
|
||||
|
||||
@ -251,6 +252,10 @@ environment_variables: Dict[str, Callable[[], Any]] = {
|
||||
lambda: os.getenv("VLLM_XLA_CACHE_PATH", "~/.vllm/xla_cache/"),
|
||||
"VLLM_FUSED_MOE_CHUNK_SIZE":
|
||||
lambda: int(os.getenv("VLLM_FUSED_MOE_CHUNK_SIZE", "65536")),
|
||||
|
||||
# If set to a non-zero integer (e.g. 1), vLLM will skip the deprecation warnings.
|
||||
"VLLM_NO_DEPRECATION_WARNING":
|
||||
lambda: bool(int(os.getenv("VLLM_NO_DEPRECATION_WARNING", "0"))),
|
||||
}
|
||||
|
||||
# end-env-vars-definition
|
||||
|
@ -8,6 +8,11 @@ import torch
|
||||
from pydantic import Field
|
||||
from typing_extensions import Annotated
|
||||
|
||||
import vllm.envs as envs
|
||||
from vllm.logger import init_logger
|
||||
|
||||
logger = init_logger(__name__)
|
||||
|
||||
_SAMPLING_EPS = 1e-5
|
||||
|
||||
|
||||
@ -184,6 +189,13 @@ class SamplingParams:
|
||||
|
||||
self._verify_args()
|
||||
if self.use_beam_search:
|
||||
if not envs.VLLM_NO_DEPRECATION_WARNING:
|
||||
logger.warning(
|
||||
"[IMPORTANT] We plan to discontinue the support for beam "
|
||||
"search in the next major release. Please refer to "
|
||||
"https://github.com/vllm-project/vllm/issues/6226 for "
|
||||
"more information. Set VLLM_NO_DEPRECATION_WARNING=1 to "
|
||||
"suppress this warning.")
|
||||
self._verify_beam_search()
|
||||
else:
|
||||
self._verify_non_beam_search()
|
||||
|
Reference in New Issue
Block a user