"vscode:/vscode.git/clone" did not exist on "44c88653fca622bac4fd8380462b4b0ab1971ccd"
Unverified Commit 24d0ef89 authored by Nicolò Lucchesi's avatar Nicolò Lucchesi Committed by GitHub
Browse files

[Misc] Replace TODO in serving transcription (#18895)


Signed-off-by: NickLucche <nlucches@redhat.com>
parent 7fcfd954
...@@ -278,7 +278,9 @@ class OpenAIServingTranscription(OpenAIServing): ...@@ -278,7 +278,9 @@ class OpenAIServingTranscription(OpenAIServing):
result_generator: Optional[AsyncGenerator[RequestOutput, None]] = None result_generator: Optional[AsyncGenerator[RequestOutput, None]] = None
try: try:
# TODO(rob): subtract len of tokenized prompt. # Unlike most decoder-only models, whisper generation length is not
# constrained by the size of the input audio, which is mapped to a
# fixed-size log-mel-spectrogram.
default_max_tokens = self.model_config.max_model_len default_max_tokens = self.model_config.max_model_len
sampling_params = request.to_sampling_params( sampling_params = request.to_sampling_params(
default_max_tokens, self.default_sampling_params) default_max_tokens, self.default_sampling_params)
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment