Commit 2825dacd authored by lizhigong
Browse files

calibration benchmark for zero overhead schedule

parent 2c3f0e14
......@@ -3,6 +3,7 @@
import argparse
import dataclasses
import json
import os
import random
import time
from pathlib import Path
......@@ -214,8 +215,9 @@ def run_vllm(
use_tqdm=False)
use_beam_search = False
print("sleep 1")
time.sleep(1)
if os.environ.get('VLLM_ZERO_OVERHEAD') == '1':
print("sleep 1")
time.sleep(1) # ZERO_OVERHEAD : sleep and wait the last step in warmup
if not use_beam_search:
if args.profile:
profile_dir = args.profile_result_dir
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment