Update install commands (#583)

This commit is contained in:
Lianmin Zheng
2024-07-03 02:07:34 -07:00
parent 9380f50ff9
commit c7709d3abe
3 changed files with 17 additions and 14 deletions

View File

@@ -291,11 +291,6 @@ class ServerArgs:
action="store_true",
help="Disable flashinfer inference kernels",
)
parser.add_argument(
"--attention-reduce-in-fp32",
action="store_true",
help="Cast the intermidiate attention results to fp32 to avoid possible crashes related to fp16.",
)
parser.add_argument(
"--disable-radix-cache",
action="store_true",
@@ -311,6 +306,12 @@ class ServerArgs:
action="store_true",
help="Disable disk cache to avoid possible crashes related to file system or high concurrency.",
)
parser.add_argument(
    "--attention-reduce-in-fp32",
    action="store_true",
    # Adjacent string literals are joined with no separator, so the first
    # fragment must end with a space to keep the two sentences apart.
    help="Cast the intermediate attention results to fp32 to avoid possible crashes related to fp16. "
    "This only affects Triton attention kernels.",
)
@classmethod
def from_cli_args(cls, args: argparse.Namespace):