Update runner docs (#879)
This commit is contained in:
5
.github/workflows/pr-e2e-test.yml
vendored
5
.github/workflows/pr-e2e-test.yml
vendored
@@ -19,6 +19,9 @@ jobs:
|
|||||||
pr-e2e-test:
|
pr-e2e-test:
|
||||||
runs-on: self-hosted
|
runs-on: self-hosted
|
||||||
|
|
||||||
|
env:
|
||||||
|
HF_TOKEN : ${{ secrets.HF_TOKEN }}
|
||||||
|
|
||||||
steps:
|
steps:
|
||||||
- name: Checkout code
|
- name: Checkout code
|
||||||
uses: actions/checkout@v3
|
uses: actions/checkout@v3
|
||||||
@@ -35,7 +38,7 @@ jobs:
|
|||||||
- name: Benchmark Serving
|
- name: Benchmark Serving
|
||||||
run: |
|
run: |
|
||||||
cd /data/zhyncs/venv && source ./bin/activate && cd -
|
cd /data/zhyncs/venv && source ./bin/activate && cd -
|
||||||
python3 -m sglang.launch_server --model /data/zhyncs/Meta-Llama-3.1-8B-Instruct --port 8413 --disable-radix-cache &
|
python3 -m sglang.launch_server --model meta-llama/Meta-Llama-3.1-8B-Instruct --port 8413 --disable-radix-cache &
|
||||||
|
|
||||||
echo "Waiting for server to start..."
|
echo "Waiting for server to start..."
|
||||||
for i in {1..120}; do
|
for i in {1..120}; do
|
||||||
|
|||||||
@@ -15,6 +15,7 @@ add `/lib/systemd/system/runner.service`
|
|||||||
StartLimitIntervalSec=0
|
StartLimitIntervalSec=0
|
||||||
[Service]
|
[Service]
|
||||||
Environment="CUDA_VISIBLE_DEVICES=7"
|
Environment="CUDA_VISIBLE_DEVICES=7"
|
||||||
|
Environment="XDG_CACHE_HOME=/data/.cache"
|
||||||
Restart=always
|
Restart=always
|
||||||
RestartSec=1
|
RestartSec=1
|
||||||
ExecStart=/data/zhyncs/actions-runner/run.sh
|
ExecStart=/data/zhyncs/actions-runner/run.sh
|
||||||
|
|||||||
Reference in New Issue
Block a user