fix: add `seed` to the bench_serving cache key and remove redundant function definitions. (#12680)

b88fab31 · yinghui · GitHub · 36942660 · b88fab31 · b88fab31
Unverified Commit b88fab31 authored Nov 04, 2025 by yinghui Committed by GitHub Nov 04, 2025
Show whitespace changes
Inline Side-by-side

Showing 2 changed files with 1 addition and 22 deletions

benchmark/hicache/data_processing.py benchmark/hicache/data_processing.py +0 -21

python/sglang/bench_serving.py python/sglang/bench_serving.py +1 -1

No files found.
--- a/benchmark/hicache/data_processing.py
+++ b/benchmark/hicache/data_processing.py
@@ -2,7 +2,6 @@ import json
 import os
 import pickle
 import random
-from pathlib import Path
 from typing import List, Optional, Tuple, Union
 import numpy as np
@@ -426,26 +425,6 @@ def sample_random_requests(
    return input_requests
-def gen_prompt(tokenizer, token_num):
-    """Generate a random prompt of specified token length using tokenizer vocabulary."""
-    all_available_tokens = list(tokenizer.get_vocab().values())
-    selected_tokens = random.choices(all_available_tokens, k=token_num)
-    return tokenizer.decode(selected_tokens)
-def get_gen_prefix_cache_path(args, tokenizer):
-    """Create cache directory under ~/.cache/sglang/benchmark"""
-    cache_dir = Path.home() / ".cache" / "sglang" / "benchmark"
-    # Create a unique cache filename based on the generation parameters
-    cache_key = (
-        f"gsp_prefix_{args.gsp_num_groups}_{args.gsp_prompts_per_group}_"
-        f"{args.gsp_system_prompt_len}_{args.gsp_question_len}_{args.gsp_output_len}_"
-        f"{tokenizer.__class__.__name__}.pkl"
-    )
-    return cache_dir / cache_key
 def sample_generated_shared_prefix_requests(
    num_groups: int,
    prompts_per_group: int,

--- a/python/sglang/bench_serving.py
+++ b/python/sglang/bench_serving.py
@@ -1507,7 +1507,7 @@ def get_gen_prefix_cache_path(args, tokenizer):
    # Create a unique cache filename based on the generation parameters
    cache_key = (
-        f"gen_shared_prefix_{args.gsp_num_groups}_{args.gsp_prompts_per_group}_"
+        f"gen_shared_prefix_{args.seed}_{args.gsp_num_groups}_{args.gsp_prompts_per_group}_"
        f"{args.gsp_system_prompt_len}_{args.gsp_question_len}_{args.gsp_output_len}_"
        f"{tokenizer.__class__.__name__}.pkl"
    )