[Doc]Fix tutorial doc expression (#319)
Fix tutorial doc expression Signed-off-by: wangli <wangli858794774@gmail.com>
This commit is contained in:
@@ -30,10 +30,10 @@ docker run --rm \
|
|||||||
Setup environment variables:
|
Setup environment variables:
|
||||||
|
|
||||||
```bash
|
```bash
|
||||||
# Use Modelscope mirror to speed up model download
|
# Load model from ModelScope to speed up download
|
||||||
export VLLM_USE_MODELSCOPE=True
|
export VLLM_USE_MODELSCOPE=True
|
||||||
|
|
||||||
# To avoid NPU out of memory, set `max_split_size_mb` to any value lower than you need to allocate for Qwen2.5-7B-Instruct
|
# Set `max_split_size_mb` to reduce memory fragmentation and avoid out of memory
|
||||||
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@@ -29,10 +29,10 @@ docker run --rm \
|
|||||||
Setup environment variables:
|
Setup environment variables:
|
||||||
|
|
||||||
```bash
|
```bash
|
||||||
# Use Modelscope mirror to speed up model download
|
# Load model from ModelScope to speed up download
|
||||||
export VLLM_USE_MODELSCOPE=True
|
export VLLM_USE_MODELSCOPE=True
|
||||||
|
|
||||||
# To avoid NPU out of memory, set `max_split_size_mb` to any value lower than you need to allocate for Qwen2.5-7B-Instruct
|
# Set `max_split_size_mb` to reduce memory fragmentation and avoid out of memory
|
||||||
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
@@ -29,10 +29,10 @@ docker run --rm \
|
|||||||
Setup environment variables:
|
Setup environment variables:
|
||||||
|
|
||||||
```bash
|
```bash
|
||||||
# Use Modelscope mirror to speed up model download
|
# Load model from ModelScope to speed up download
|
||||||
export VLLM_USE_MODELSCOPE=True
|
export VLLM_USE_MODELSCOPE=True
|
||||||
|
|
||||||
# To avoid NPU out of memory, set `max_split_size_mb` to any value lower than you need to allocate for Qwen2.5-7B-Instruct
|
# Set `max_split_size_mb` to reduce memory fragmentation and avoid out of memory
|
||||||
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
export PYTORCH_NPU_ALLOC_CONF=max_split_size_mb:256
|
||||||
```
|
```
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user