[Auto Sync] Update parallel_state.py, few_shot_gsm8k.py (20250903) (#9986)

Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Leon Gao <leon.gao19@gmail.com>

[Auto Sync] Update parallel_state.py, few_shot_gsm8k.py (20250903) (#9986)
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Leon Gao <leon.gao19@gmail.com>
397448eb · Lianmin Zheng · GitHub · 66d5d042 · 397448eb · 397448eb
Unverified commit 397448eb, authored Sep 03, 2025 by Lianmin Zheng; committed by GitHub on Sep 03, 2025
Showing 2 changed files with 9 additions and 11 deletions

python/sglang/srt/distributed/parallel_state.py python/sglang/srt/distributed/parallel_state.py +8 -11

python/sglang/test/few_shot_gsm8k.py python/sglang/test/few_shot_gsm8k.py +1 -0

No files found.
--- a/python/sglang/srt/distributed/parallel_state.py
+++ b/python/sglang/srt/distributed/parallel_state.py
@@ -879,17 +879,16 @@ class GroupCoordinator:
        size_tensor = torch.tensor(
            [object_tensor.numel()],
            dtype=torch.long,
-            device=torch.cuda.current_device(),
+            device="cpu",
        )
        # Send object size
-        torch.distributed.send(
+        torch.distributed.send(size_tensor, dst=self.ranks[dst], group=self.cpu_group)
-            size_tensor, dst=self.ranks[dst], group=self.device_group
-        )
        # Send object
        torch.distributed.send(
-            object_tensor, dst=self.ranks[dst], group=self.device_group
+            object_tensor,
+            dst=self.ranks[dst],
+            group=self.device_group,
        )
        return None
@@ -904,13 +903,11 @@ class GroupCoordinator:
            src != self.rank_in_group
        ), "Invalid source rank. Source rank is the same as the current rank."
-        size_tensor = torch.empty(
+        size_tensor = torch.empty(1, dtype=torch.long, device="cpu")
-            1, dtype=torch.long, device=torch.cuda.current_device()
-        )
        # Receive object size
        rank_size = torch.distributed.recv(
-            size_tensor, src=self.ranks[src], group=self.device_group
+            size_tensor, src=self.ranks[src], group=self.cpu_group
        )
        # Tensor to receive serialized objects into.
@@ -928,7 +925,7 @@ class GroupCoordinator:
            rank_object == rank_size
        ), "Received object sender rank does not match the size sender rank."
-        obj = pickle.loads(object_tensor.cpu().numpy().tobytes())
+        obj = pickle.loads(object_tensor.cpu().numpy())
        return obj

--- a/python/sglang/test/few_shot_gsm8k.py
+++ b/python/sglang/test/few_shot_gsm8k.py
@@ -129,6 +129,7 @@ def run_eval(args):
    return {
        "accuracy": acc,
+        "invalid": invalid,
        "latency": latency,
        "output_throughput": output_throughput,
    }