diff --git a/computility-run.yaml b/computility-run.yaml
new file mode 100644
--- /dev/null
+++ b/computility-run.yaml
@@ -0,0 +1,27 @@
+# Run configuration: starts `vllm serve` for the model located at /model.
+# NOTE(review): presumably this should match the tensor-parallel size (-tp) below — confirm.
+gpu_num: 1
+command:
+  - vllm
+  - serve
+  - /model
+  # Name under which the model is exposed to API clients.
+  - --served-model-name
+  - llm
+  # Maximum context length (prompt plus generated tokens).
+  - --max-model-len
+  - '4096'
+  # Fraction of GPU memory vLLM is allowed to use.
+  - --gpu-memory-utilization
+  - '0.9'
+  # Run in eager mode (no CUDA graph capture).
+  - --enforce-eager
+  # Allow custom model code shipped with the checkpoint to execute.
+  - --trust-remote-code
+  # Tensor-parallel size.
+  - -tp
+  - '1'
+env:
+  # NOTE(review): looks like a template placeholder — replace or remove before real use.
+  - name: ENV_NAME
+    value: ENV_VALUE