[V1] Guard Against Main Thread Usage (#14972)

Signed-off-by: rshaw@neuralmagic.com <robertgshaw2@gmail.com>
2025-10-20 23:03:52 +08:00 · 2025-03-17 16:23:02 -04:00
parent 5ac1a8e6e4
commit 16e9064f84
1 changed files with 6 additions and 0 deletions
--- a/vllm/engine/arg_utils.py
+++ b/vllm/engine/arg_utils.py
@@ -3,6 +3,7 @@
 import argparse
 import dataclasses
 import json
 import threading
 from dataclasses import dataclass
 from typing import (TYPE_CHECKING, Any, Dict, List, Literal, Mapping, Optional,
                    Tuple, Type, Union, cast, get_args)
@@ -1576,6 +1577,11 @@ class EngineArgs:
        #############################################################
        # Experimental Features - allow users to opt in.
        # Signal handlers require running in the main thread.
        if (threading.current_thread() != threading.main_thread()
                and _warn_or_fallback("Engine in background thread")):
            return False
        # LoRA is supported on V1, but off by default for now.
        if self.enable_lora and _warn_or_fallback("LORA"):
            return False