Fix minor style (#4460)

This commit is contained in:
Lianmin Zheng
2025-03-15 21:51:12 -07:00
committed by GitHub
parent 158430473e
commit 2c4f5ccac1
3 changed files with 7 additions and 4 deletions

View File

@@ -340,6 +340,7 @@ class MHATokenToKVPool(KVCache):
cache_v = cache_v.view(self.store_dtype)
if self.capture_mode and cache_k.shape[0] < 4:
# Overlap the copy of K and V cache for small batch size
current_stream = self.device_module.current_stream()
self.alt_stream.wait_stream(current_stream)
with self.device_module.stream(self.alt_stream):

View File

@@ -481,6 +481,7 @@ def suppress_other_loggers():
logging.getLogger("vllm.distributed.device_communicators.shm_broadcast").setLevel(
logging.WARN
)
logging.getLogger("vllm.config").setLevel(logging.ERROR)
warnings.filterwarnings(
"ignore", category=UserWarning, message="The given NumPy array is not writable"
@@ -527,10 +528,11 @@ def kill_process_tree(parent_pid, include_parent: bool = True, skip_pid: int = N
pass
if include_parent:
if parent_pid == os.getpid():
sys.exit(0)
try:
if parent_pid == os.getpid():
itself.kill()
sys.exit(0)
itself.kill()
# Sometimes processes cannot be killed with SIGKILL (e.g., PID=1 launched by Kubernetes),