Unverified Commit 67d115db authored by jack, committed by GitHub
Browse files

[Bugfix][Frontend] Disable embedding API for chat models (#7504)


Co-authored-by: jack <jack@alex>
parent d3d9cb6e
...@@ -71,7 +71,7 @@ class OpenAIServingEmbedding(OpenAIServing): ...@@ -71,7 +71,7 @@ class OpenAIServingEmbedding(OpenAIServing):
lora_modules=None, lora_modules=None,
prompt_adapters=None, prompt_adapters=None,
request_logger=request_logger) request_logger=request_logger)
self._check_embedding_mode(model_config.embedding_mode) self._enabled = self._check_embedding_mode(model_config.embedding_mode)
async def create_embedding( async def create_embedding(
self, self,
...@@ -83,6 +83,8 @@ class OpenAIServingEmbedding(OpenAIServing): ...@@ -83,6 +83,8 @@ class OpenAIServingEmbedding(OpenAIServing):
See https://platform.openai.com/docs/api-reference/embeddings/create See https://platform.openai.com/docs/api-reference/embeddings/create
for the API specification. This API mimics the OpenAI Embedding API. for the API specification. This API mimics the OpenAI Embedding API.
""" """
if not self._enabled:
return self.create_error_response("Embedding API disabled")
error_check_ret = await self._check_model(request) error_check_ret = await self._check_model(request)
if error_check_ret is not None: if error_check_ret is not None:
return error_check_ret return error_check_ret
...@@ -179,3 +181,4 @@ class OpenAIServingEmbedding(OpenAIServing): ...@@ -179,3 +181,4 @@ class OpenAIServingEmbedding(OpenAIServing):
"embedding_mode is False. Embedding API will not work.") "embedding_mode is False. Embedding API will not work.")
else: else:
logger.info("Activating the server engine with embedding enabled.") logger.info("Activating the server engine with embedding enabled.")
return embedding_mode
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment