[CI] fix port conflicts (#5789)

This commit is contained in:
Lianmin Zheng
2025-04-27 05:17:44 -07:00
committed by GitHub
parent 3c4e0ee64d
commit 35ca04d2fa
7 changed files with 55 additions and 51 deletions

View File

@@ -977,6 +977,7 @@ async def benchmark(
profile: bool,
pd_seperated: bool = False,
flush_cache: bool = False,
+warmup_requests: int = 1,
):
if backend in ASYNC_REQUEST_FUNCS:
request_func = ASYNC_REQUEST_FUNCS[backend]
@@ -993,10 +994,8 @@ async def benchmark(
async with semaphore:
return await request_func(request_func_input=request_func_input, pbar=pbar)
-if not hasattr(args, "warmup_requests"):
-args.warmup_requests = 1
# Warmup
-print(f"Starting warmup with {args.warmup_requests} sequences...")
+print(f"Starting warmup with {warmup_requests} sequences...")
# Use the first request for all warmup iterations
test_prompt, test_prompt_len, test_output_len = input_requests[0]
@@ -1018,7 +1017,7 @@ async def benchmark(
# Run warmup requests
warmup_tasks = []
-for _ in range(args.warmup_requests):
+for _ in range(warmup_requests):
warmup_tasks.append(
asyncio.create_task(request_func(request_func_input=test_input))
)
@@ -1026,9 +1025,7 @@ async def benchmark(
warmup_outputs = await asyncio.gather(*warmup_tasks)
# Check if at least one warmup request succeeded
-if args.warmup_requests > 0 and not any(
-output.success for output in warmup_outputs
-):
+if warmup_requests > 0 and not any(output.success for output in warmup_outputs):
raise ValueError(
"Warmup failed - Please make sure benchmark arguments "
f"are correctly specified. Error: {warmup_outputs[0].error}"

View File

@@ -281,7 +281,9 @@ async def generate_from_file_request(file: UploadFile, request: Request):
)
try:
-ret = await _global_state.generate_request(obj, request).__anext__()
+ret = await _global_state.tokenizer_manager.generate_request(
+obj, request
+).__anext__()
return ret
except ValueError as e:
logger.error(f"Error: {e}")

View File

@@ -8,7 +8,6 @@ import random
import subprocess
import threading
import time
-import traceback
import unittest
from concurrent.futures import ThreadPoolExecutor
from dataclasses import dataclass