Fix weight update for data parallelism (#2050)

This commit is contained in:
Lianmin Zheng
2024-11-16 00:30:39 -08:00
committed by GitHub
parent 2ffe0a7363
commit 2f2e07439c
2 changed files with 6 additions and 3 deletions

View File

@@ -231,15 +231,16 @@ def throughput_test(
input_requests = get_dataset(bench_args, tokenizer)
warmup_requests = sample_random_requests(
-input_len=20,
-output_len=4,
-num_prompts=2,
+input_len=256,
+output_len=16,
+num_prompts=16,
range_ratio=0.8,
tokenizer=tokenizer,
dataset_path=bench_args.dataset_path,
)
# Warm up
logging.info("\nWarmup...")
throughput_test_once(
backend_name=bench_args.backend,
backend=backend,
@@ -247,6 +248,7 @@ def throughput_test(
ignore_eos=not bench_args.disable_ignore_eos,
)
logging.info("\nBenchmark...")
result = throughput_test_once(
backend_name=bench_args.backend,
backend=backend,

View File

@@ -83,6 +83,7 @@ class DataParallelController:
self.workers = []
for dp_rank in range(server_args.dp_size):
tmp_port_args = PortArgs.init_new(server_args)
tmp_port_args.tokenizer_ipc_name = port_args.tokenizer_ipc_name
tmp_port_args.detokenizer_ipc_name = port_args.detokenizer_ipc_name
send_to = self.launch_tensor_parallel_group(