Unverified commit b71fcd49, authored by Sergei Skvortsov, committed by GitHub
Browse files

[Misc] Add penalties sampling parameters to serve tool (#25974)


Signed-off-by: Sergei Skvortsov <sergeyskv@nebius.com>
Co-authored-by: Sergei Skvortsov <sergeyskv@nebius.com>
parent 75003f34
@@ -1077,6 +1077,27 @@ def add_cli_args(parser: argparse.ArgumentParser):
"openai-compatible backends. If not specified, default to greedy " "openai-compatible backends. If not specified, default to greedy "
"decoding (i.e. temperature==0.0).", "decoding (i.e. temperature==0.0).",
) )
sampling_group.add_argument(
"--frequency-penalty",
type=float,
default=None,
help="Frequency penalty sampling parameter. Only has effect on "
"openai-compatible backends.",
)
sampling_group.add_argument(
"--presence-penalty",
type=float,
default=None,
help="Presence penalty sampling parameter. Only has effect on "
"openai-compatible backends.",
)
sampling_group.add_argument(
"--repetition-penalty",
type=float,
default=None,
help="Repetition penalty sampling parameter. Only has effect on "
"openai-compatible backends.",
)
parser.add_argument( parser.add_argument(
'--tokenizer-mode', '--tokenizer-mode',
@@ -1211,6 +1232,9 @@ async def main_async(args: argparse.Namespace) -> dict[str, Any]:
"top_k": args.top_k, "top_k": args.top_k,
"min_p": args.min_p, "min_p": args.min_p,
"temperature": args.temperature, "temperature": args.temperature,
"frequency_penalty": args.frequency_penalty,
"presence_penalty": args.presence_penalty,
"repetition_penalty": args.repetition_penalty,
}.items() if v is not None }.items() if v is not None
} }
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment