[rust] cache-aware DP - approx tree (#1934)
This commit is contained in:
12
rust/py_src/main.py
Normal file
12
rust/py_src/main.py
Normal file
@@ -0,0 +1,12 @@
|
||||
from sglang_router import PolicyType, Router
|
||||
|
||||
# Example launcher: build a Router over two local workers with the
# ApproxTree policy and start it.

# Worker endpoints handed to the router (two servers on localhost).
worker_endpoints = [
    "http://localhost:30000",
    "http://localhost:30001",
]

# Tokenizer file passed to the router via ``tokenizer_path``.
# NOTE(review): this is a machine-specific absolute path -- confirm it
# exists on the host before running this script.
tokenizer_file = "/shared/public/elr-models/meta-llama/Meta-Llama-3.1-8B-Instruct/07eb05b21d191a58c577b4a45982fe0c049d0693/tokenizer.json"

router = Router(
    worker_urls=worker_endpoints,
    policy=PolicyType.ApproxTree,
    tokenizer_path=tokenizer_file,
)

# NOTE(review): runs at import time (no ``__main__`` guard) and presumably
# blocks while the router serves requests -- confirm against Router.start.
router.start()
|
||||
Reference in New Issue
Block a user