TP/quantization/weight loading refactor part 1 - Simplify parallel linear logic (#1181)

ba0bfd40 · Zhuohan Li · GitHub · 84e4e37d · ba0bfd40
Unverified Commit ba0bfd40 authored Oct 02, 2023 by Zhuohan Li Committed by GitHub Oct 02, 2023
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 0 additions and 6 deletions

vllm/model_executor/utils.py vllm/model_executor/utils.py +0 -6

No files found.
--- a/vllm/model_executor/utils.py
+++ b/vllm/model_executor/utils.py
@@ -4,9 +4,6 @@ import random
 import numpy as np
 import torch

-from vllm.model_executor.parallel_utils.parallel_state import model_parallel_is_initialized
-from vllm.model_executor.parallel_utils.tensor_parallel import model_parallel_cuda_manual_seed
-

 def set_random_seed(seed: int) -> None:
    random.seed(seed)
@@ -14,6 +11,3 @@ def set_random_seed(seed: int) -> None:
    torch.manual_seed(seed)
    if torch.cuda.is_available():
        torch.cuda.manual_seed_all(seed)
-
-    if model_parallel_is_initialized():
-        model_parallel_cuda_manual_seed(seed)