Commit 50dbd6c9 (unverified), authored by Stanislav Kirillov, committed by GitHub
Browse files

[bugfix] Fix critical bug when reporting for all paths where...


[bugfix] Fix critical bug when reporting for all paths where handler.create_error_response is used (#34516)
Signed-off-by: Stanislav Kirillov <stas@nebius.com>
Co-authored-by: Stanislav Kirillov <stas@nebius.com>
Co-authored-by: Cyrus Leung <tlleungac@connect.ust.hk>
parent 98bcc6ca
...@@ -57,7 +57,7 @@ async def create_chat_completion(request: ChatCompletionRequest, raw_request: Re ...@@ -57,7 +57,7 @@ async def create_chat_completion(request: ChatCompletionRequest, raw_request: Re
try: try:
generator = await handler.create_chat_completion(request, raw_request) generator = await handler.create_chat_completion(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
...@@ -96,7 +96,7 @@ async def render_chat_completion(request: ChatCompletionRequest, raw_request: Re ...@@ -96,7 +96,7 @@ async def render_chat_completion(request: ChatCompletionRequest, raw_request: Re
try: try:
result = await handler.render_chat_request(request) result = await handler.render_chat_request(request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) result = handler.create_error_response(e)
if isinstance(result, ErrorResponse): if isinstance(result, ErrorResponse):
return JSONResponse(content=result.model_dump(), status_code=result.error.code) return JSONResponse(content=result.model_dump(), status_code=result.error.code)
......
...@@ -57,7 +57,7 @@ async def create_completion(request: CompletionRequest, raw_request: Request): ...@@ -57,7 +57,7 @@ async def create_completion(request: CompletionRequest, raw_request: Request):
try: try:
generator = await handler.create_completion(request, raw_request) generator = await handler.create_completion(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
...@@ -94,7 +94,7 @@ async def render_completion(request: CompletionRequest, raw_request: Request): ...@@ -94,7 +94,7 @@ async def render_completion(request: CompletionRequest, raw_request: Request):
try: try:
result = await handler.render_completion_request(request) result = await handler.render_completion_request(request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) result = handler.create_error_response(e)
if isinstance(result, ErrorResponse): if isinstance(result, ErrorResponse):
return JSONResponse(content=result.model_dump(), status_code=result.error.code) return JSONResponse(content=result.model_dump(), status_code=result.error.code)
......
...@@ -66,7 +66,7 @@ async def create_responses(request: ResponsesRequest, raw_request: Request): ...@@ -66,7 +66,7 @@ async def create_responses(request: ResponsesRequest, raw_request: Request):
try: try:
generator = await handler.create_responses(request, raw_request) generator = await handler.create_responses(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
...@@ -102,7 +102,7 @@ async def retrieve_responses( ...@@ -102,7 +102,7 @@ async def retrieve_responses(
stream=stream, stream=stream,
) )
except Exception as e: except Exception as e:
return handler.create_error_response(e) response = handler.create_error_response(e)
if isinstance(response, ErrorResponse): if isinstance(response, ErrorResponse):
return JSONResponse( return JSONResponse(
...@@ -128,7 +128,7 @@ async def cancel_responses(response_id: str, raw_request: Request): ...@@ -128,7 +128,7 @@ async def cancel_responses(response_id: str, raw_request: Request):
try: try:
response = await handler.cancel_responses(response_id) response = await handler.cancel_responses(response_id)
except Exception as e: except Exception as e:
return handler.create_error_response(e) response = handler.create_error_response(e)
if isinstance(response, ErrorResponse): if isinstance(response, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -35,7 +35,7 @@ async def create_classify(request: ClassificationRequest, raw_request: Request): ...@@ -35,7 +35,7 @@ async def create_classify(request: ClassificationRequest, raw_request: Request):
try: try:
generator = await handler.create_classify(request, raw_request) generator = await handler.create_classify(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -64,7 +64,7 @@ async def create_embedding( ...@@ -64,7 +64,7 @@ async def create_embedding(
try: try:
generator = await handler.create_embedding(request, raw_request) generator = await handler.create_embedding(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -44,7 +44,7 @@ async def create_pooling(request: PoolingRequest, raw_request: Request): ...@@ -44,7 +44,7 @@ async def create_pooling(request: PoolingRequest, raw_request: Request):
try: try:
generator = await handler.create_pooling(request, raw_request) generator = await handler.create_pooling(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -52,7 +52,7 @@ async def create_score(request: ScoreRequest, raw_request: Request): ...@@ -52,7 +52,7 @@ async def create_score(request: ScoreRequest, raw_request: Request):
try: try:
generator = await handler.create_score(request, raw_request) generator = await handler.create_score(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
...@@ -103,7 +103,7 @@ async def do_rerank(request: RerankRequest, raw_request: Request): ...@@ -103,7 +103,7 @@ async def do_rerank(request: RerankRequest, raw_request: Request):
try: try:
generator = await handler.do_rerank(request, raw_request) generator = await handler.do_rerank(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -67,7 +67,7 @@ async def generate(request: GenerateRequest, raw_request: Request): ...@@ -67,7 +67,7 @@ async def generate(request: GenerateRequest, raw_request: Request):
try: try:
generator = await handler.serve_tokens(request, raw_request) generator = await handler.serve_tokens(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
...@@ -52,7 +52,7 @@ async def tokenize(request: TokenizeRequest, raw_request: Request): ...@@ -52,7 +52,7 @@ async def tokenize(request: TokenizeRequest, raw_request: Request):
try: try:
generator = await handler.create_tokenize(request, raw_request) generator = await handler.create_tokenize(request, raw_request)
except Exception as e: except Exception as e:
return handler.create_error_response(e) generator = handler.create_error_response(e)
if isinstance(generator, ErrorResponse): if isinstance(generator, ErrorResponse):
return JSONResponse( return JSONResponse(
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment