[Doc] fix VLLM_USE_V1 value in graph mode docs (#1226)
os.environ["VLLM_USE_V1"] must be assigned a str value, not a value of any other type.  Signed-off-by: 22dimensions <waitingwind@foxmail.com>
This commit is contained in:
@@ -23,7 +23,7 @@ import os
|
|||||||
|
|
||||||
from vllm import LLM
|
from vllm import LLM
|
||||||
|
|
||||||
os.environ["VLLM_USE_V1"] = 1
|
os.environ["VLLM_USE_V1"] = "1"
|
||||||
|
|
||||||
model = LLM(model="Qwen/Qwen2-7B-Instruct")
|
model = LLM(model="Qwen/Qwen2-7B-Instruct")
|
||||||
outputs = model.generate("Hello, how are you?")
|
outputs = model.generate("Hello, how are you?")
|
||||||
@@ -45,7 +45,7 @@ offline example:
|
|||||||
import os
|
import os
|
||||||
from vllm import LLM
|
from vllm import LLM
|
||||||
|
|
||||||
os.environ["VLLM_USE_V1"] = 1
|
os.environ["VLLM_USE_V1"] = "1"
|
||||||
|
|
||||||
# TorchAirGraph currently only works without chunked-prefill
|
# TorchAirGraph currently only works without chunked-prefill
|
||||||
model = LLM(model="deepseek-ai/DeepSeek-R1-0528", additional_config={"torchair_graph_config": {"enabled": True},"ascend_scheduler_config": {"enabled": True,}})
|
model = LLM(model="deepseek-ai/DeepSeek-R1-0528", additional_config={"torchair_graph_config": {"enabled": True},"ascend_scheduler_config": {"enabled": True,}})
|
||||||
@@ -70,7 +70,7 @@ offline example:
|
|||||||
import os
|
import os
|
||||||
from vllm import LLM
|
from vllm import LLM
|
||||||
|
|
||||||
os.environ["VLLM_USE_V1"] = 1
|
os.environ["VLLM_USE_V1"] = "1"
|
||||||
|
|
||||||
model = LLM(model="someother_model_weight", enforce_eager=True)
|
model = LLM(model="someother_model_weight", enforce_eager=True)
|
||||||
outputs = model.generate("Hello, how are you?")
|
outputs = model.generate("Hello, how are you?")
|
||||||
|
|||||||
Reference in New Issue
Block a user