Tune params (#696)

This commit is contained in:
Ying Sheng
2024-07-22 03:19:24 -07:00
committed by GitHub
parent d198791fe8
commit c3f1aac811

View File

@@ -70,15 +70,15 @@ class ServerArgs:
             self.tokenizer_path = self.model_path
         if self.mem_fraction_static is None:
             if self.tp_size >= 16:
-                self.mem_fraction_static = 0.74
+                self.mem_fraction_static = 0.80
             elif self.tp_size >= 8:
-                self.mem_fraction_static = 0.78
+                self.mem_fraction_static = 0.84
             elif self.tp_size >= 4:
-                self.mem_fraction_static = 0.82
+                self.mem_fraction_static = 0.86
             elif self.tp_size >= 2:
-                self.mem_fraction_static = 0.85
-            else:
                 self.mem_fraction_static = 0.88
+            else:
+                self.mem_fraction_static = 0.89
         if isinstance(self.additional_ports, int):
             self.additional_ports = [self.additional_ports]
         elif self.additional_ports is None: