Commit 2825dacd authored by lizhigong's avatar lizhigong
Browse files

Calibrate the benchmark for zero-overhead scheduling

parent 2c3f0e14
...@@ -3,6 +3,7 @@ ...@@ -3,6 +3,7 @@
import argparse import argparse
import dataclasses import dataclasses
import json import json
import os
import random import random
import time import time
from pathlib import Path from pathlib import Path
...@@ -214,8 +215,9 @@ def run_vllm( ...@@ -214,8 +215,9 @@ def run_vllm(
use_tqdm=False) use_tqdm=False)
use_beam_search = False use_beam_search = False
print("sleep 1") if os.environ.get('VLLM_ZERO_OVERHEAD') == '1':
time.sleep(1) print("sleep 1")
time.sleep(1) # ZERO_OVERHEAD : sleep and wait the last step in warmup
if not use_beam_search: if not use_beam_search:
if args.profile: if args.profile:
profile_dir = args.profile_result_dir profile_dir = args.profile_result_dir
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment