"vscode:/vscode.git/clone" did not exist on "3d7f524aeb8532a9b03784a0fa4c10fae08ae720"
Unverified Commit 7e90a2d1 authored by Fluder-Paradyne's avatar Fluder-Paradyne Committed by GitHub
Browse files

Add `/health` Endpoint for both Servers (#1540)

parent 5687d584
...@@ -17,6 +17,12 @@ app = FastAPI() ...@@ -17,6 +17,12 @@ app = FastAPI()
engine = None engine = None
@app.get("/health")
async def health() -> Response:
    """Health check.

    Registered as the handler for ``GET /health``. It takes no parameters
    and does no work other than building the reply.

    Returns:
        A ``Response`` constructed with ``status_code=200``.
    """
    return Response(status_code=200)
@app.post("/generate") @app.post("/generate")
async def generate(request: Request) -> Response: async def generate(request: Request) -> Response:
"""Generate completion for the request. """Generate completion for the request.
......
...@@ -13,7 +13,7 @@ import uvicorn ...@@ -13,7 +13,7 @@ import uvicorn
from fastapi import Request from fastapi import Request
from fastapi.exceptions import RequestValidationError from fastapi.exceptions import RequestValidationError
from fastapi.middleware.cors import CORSMiddleware from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import JSONResponse, StreamingResponse from fastapi.responses import JSONResponse, StreamingResponse, Response
from packaging import version from packaging import version
from vllm.engine.arg_utils import AsyncEngineArgs from vllm.engine.arg_utils import AsyncEngineArgs
...@@ -145,6 +145,12 @@ async def check_length( ...@@ -145,6 +145,12 @@ async def check_length(
return input_ids, None return input_ids, None
@app.get("/health")
async def health() -> Response:
    """Health check.

    Registered as the handler for ``GET /health``. It takes no parameters
    and does no work other than building the reply.

    Returns:
        A ``Response`` constructed with ``status_code=200``.
    """
    return Response(status_code=200)
@app.get("/v1/models") @app.get("/v1/models")
async def show_available_models(): async def show_available_models():
"""Show available models. Right now we only have one model.""" """Show available models. Right now we only have one model."""
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment