Commit 7e90a2d1 (unverified) · authored by Fluder-Paradyne · committed by GitHub
Browse files

Add `/health` Endpoint for both Servers (#1540)

parent 5687d584
......@@ -17,6 +17,12 @@ app = FastAPI()
# Module-level engine handle; it is None at import time.
# NOTE(review): presumably assigned during server startup, outside this excerpt — confirm.
engine = None
@app.get("/health")
async def health() -> Response:
    """Answer a health probe.

    Returns:
        A ``Response`` built with status code 200 and no explicit body.
    """
    ok_response = Response(status_code=200)
    return ok_response
@app.post("/generate")
async def generate(request: Request) -> Response:
"""Generate completion for the request.
......
......@@ -13,7 +13,7 @@ import uvicorn
from fastapi import Request
from fastapi.exceptions import RequestValidationError
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import JSONResponse, StreamingResponse
from fastapi.responses import JSONResponse, StreamingResponse, Response
from packaging import version
from vllm.engine.arg_utils import AsyncEngineArgs
......@@ -145,6 +145,12 @@ async def check_length(
return input_ids, None
@app.get("/health")
async def health() -> Response:
    """Answer a health probe.

    Returns:
        A ``Response`` built with status code 200 and no explicit body.
    """
    ok_response = Response(status_code=200)
    return ok_response
@app.get("/v1/models")
async def show_available_models():
"""Show available models. Right now we only have one model."""
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment