Minor Optimizations in Schedule Batch (#8724)

Co-authored-by: Suruchi Shah <surshah@linkedin.com>

Minor Optimizations in Schedule Batch (#8724)
Co-authored-by: Suruchi Shah <surshah@linkedin.com>
f352b793 · Lianmin Zheng · GitHub · 6642e3a2 · f352b793
Unverified commit f352b793, authored Aug 08, 2025 by Lianmin Zheng and committed by GitHub on Aug 08, 2025.
Hide whitespace changes
Inline Side-by-side

Showing with 4 additions and 3 deletions

python/sglang/srt/managers/schedule_batch.py python/sglang/srt/managers/schedule_batch.py +4 -3

No files found.
--- a/python/sglang/srt/managers/schedule_batch.py
+++ b/python/sglang/srt/managers/schedule_batch.py
@@ -37,6 +37,7 @@ import logging
 import threading
 from enum import Enum, auto
 from http import HTTPStatus
+from itertools import chain
 from typing import TYPE_CHECKING, Any, List, Optional, Set, Tuple, Union
 
 import numpy as np
@@ -1145,9 +1146,9 @@ class ScheduleBatch(ScheduleBatchDisaggregationDecodeMixin):
        req_pool_indices_tensor = torch.tensor(req_pool_indices, dtype=torch.int64).to(
            self.device, non_blocking=True
        )
-        input_ids_tensor = torch.tensor(sum(input_ids, []), dtype=torch.int64).to(
-            self.device, non_blocking=True
-        )
+        input_ids_tensor = torch.tensor(
+            list(chain.from_iterable(input_ids)), dtype=torch.int64
+        ).to(self.device, non_blocking=True)
        seq_lens_tensor = torch.tensor(seq_lens, dtype=torch.int64).to(
            self.device, non_blocking=True
        )