---
# Launch settings for a single `vllm serve` process.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm the layout (especially `env`) against the consumer's schema.

# Accelerator request: device model and how many of them.
gpu_type: Iluvatar_bi-150
gpu_num: 1

# Process argv, one token per list item. Numeric arguments stay quoted so
# they are loaded as strings rather than as YAML ints/floats.
command:
  - vllm
  - serve
  # Model location passed to `vllm serve`.
  - /model
  # Name under which the model is exposed through the API.
  - --served-model-name
  - llm
  # Maximum context length in tokens.
  - --max-model-len
  - '4096'
  # Fraction of device memory vLLM is allowed to use.
  - --gpu-memory-utilization
  - '0.9'
  # Run in eager mode only (no graph capture).
  - --enforce-eager
  # Allows custom model code shipped with the checkpoint to be executed;
  # only use with checkpoints you trust.
  - --trust-remote-code
  # Tensor-parallel size. Presumably should track `gpu_num` — TODO confirm.
  - -tp
  - '1'

# Extra environment variables for the process, as name/value pairs.
# NOTE(review): ENV_NAME / ENV_VALUE look like template placeholders —
# replace or remove before use.
env:
  - name: ENV_NAME
    value: ENV_VALUE