Add health endpoint to SGLang runtime server (#90)

This commit is contained in:
isaac-vidas
2024-01-23 22:00:28 -05:00
committed by GitHub
parent 7358fa64f7
commit 3de54a1b55

View File

@@ -17,7 +17,7 @@ import requests
import uvicorn
import uvloop
from fastapi import FastAPI, Request
from fastapi.responses import StreamingResponse
from fastapi.responses import Response, StreamingResponse
from sglang.backend.runtime_endpoint import RuntimeEndpoint
from sglang.srt.conversation import (
Conversation,
@@ -57,6 +57,12 @@ tokenizer_manager = None
# Module-level chat template name; starts as None (unset) at import time.
# NOTE(review): presumably assigned during server startup — confirm against the launch code.
chat_template_name = None
@app.get("/health")
async def health() -> Response:
    """Health check endpoint.

    Returns:
        A response with HTTP status 200 and no content supplied.
    """
    ok_response = Response(status_code=200)
    return ok_response
@app.get("/get_model_info")
async def get_model_info():
result = {