[Fix] Fix OOM in llava base class (#1249)

This commit is contained in:
Lianmin Zheng
2024-08-28 08:38:50 -07:00
parent c411f32e1c
commit 0a97d7962d
3 changed files with 30 additions and 25 deletions

View File

@@ -1,7 +1,7 @@
"""
Usage:
-python3 -m sglang.launch_server --model-path lmms-lab/llava-onevision-qwen2-72b-ov --port=30000 --tp-size=8 --chat-template=chatml-llava --chunked-prefill-size=16384
+python3 -m sglang.launch_server --model-path lmms-lab/llava-onevision-qwen2-72b-ov --port=30000 --tp-size=8 --chat-template=chatml-llava
python3 http_llava_onevision_test.py
"""