[Misc] Fix sampling from sonnet for long context case (#9235)

94bf9ae4 · Andy Dai · GitHub · f990bab2 · 94bf9ae4
Unverified Commit 94bf9ae4 authored Oct 10, 2024 by Andy Dai Committed by GitHub Oct 11, 2024
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 4 deletions

benchmarks/benchmark_serving.py benchmarks/benchmark_serving.py +4 -4

No files found.
--- a/benchmarks/benchmark_serving.py
+++ b/benchmarks/benchmark_serving.py
@@ -176,9 +176,9 @@ def sample_sonnet_requests(
    # Sample the rest of lines per request.
    sampled_requests: List[Tuple[str, int, int]] = []
    for _ in range(num_requests):
-        sampled_lines = "".join(
-            prefix_lines +
-            random.sample(poem_lines, num_input_lines - num_prefix_lines))
+        num_lines_needed = num_input_lines - num_prefix_lines
+        sampled_lines = "".join(prefix_lines +
+                                random.choices(poem_lines, k=num_lines_needed))

        prompt = f"{base_prompt}{sampled_lines}"
        message = [
@@ -536,7 +536,7 @@ async def benchmark(
        # E.g., "Time to First Token"
        metric_header: str,
    ):
-        # This function print and add statistics of the specified
+        # This function prints and adds statistics of the specified
        # metric.
        if metric_attribute_name not in selected_percentile_metrics:
            return