setup_rocm.py 2.43 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# Copyright 2025 SGLang Team. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

16
import platform
17
18
19
20
21
22
23
import sys
from pathlib import Path

from setuptools import find_packages, setup
from torch.utils.cpp_extension import BuildExtension, CUDAExtension

# Directory that contains this build script; pyproject.toml and the header
# directories are located relative to it.
root = Path(__file__).parent.resolve()
# Lower-cased machine name reported by the platform module; it is interpolated
# into the library search path given to the linker.
arch = platform.machine().lower()
25
26
27
28
29
30
31
32
33


def _get_version():
    with open(root / "pyproject.toml") as f:
        for line in f:
            if line.startswith("version"):
                return line.split("=")[1].strip().strip('"')


34
# Value substituted into the -DOPERATOR_NAMESPACE=... define in hipcc_flags.
operator_namespace = "sgl_kernel"
35
# Header search paths handed to the extension build; both are resolved
# against the directory of this script.
include_dirs = [
    root / "include",
    root / "csrc",
]

# Source files compiled into the extension module, given as relative paths.
sources = [
    "csrc/allreduce/custom_all_reduce.hip",
    "csrc/moe/moe_align_kernel.cu",
    "csrc/moe/moe_topk_softmax_kernels.cu",
    "csrc/torch_extension_rocm.cc",
    "csrc/speculative/eagle_utils.cu",
]

# Options supplied under the "cxx" key of extra_compile_args.
cxx_flags = ["-O3"]
# Libraries the extension is linked against.
libraries = ["hiprtc", "amdhip64", "c10", "torch", "torch_python"]
# Linker options: a runtime search path expressed relative to $ORIGIN that
# points at torch/lib, plus an architecture-specific library directory.
extra_link_args = [
    "-Wl,-rpath,$ORIGIN/../../torch/lib",
    f"-L/usr/lib/{arch}-linux-gnu",
]
51
52
53
54
55
56
57
58
59
60
61
62
63
64

# Flags supplied under the "nvcc" key of extra_compile_args. The groups below
# are concatenated in order, so the resulting flag sequence is fixed.
hipcc_flags = (
    # Preprocessor defines: NDEBUG and the operator namespace.
    ["-DNDEBUG", f"-DOPERATOR_NAMESPACE={operator_namespace}"]
    # Optimisation level, -fPIC passed via -Xcompiler, and the C++ standard.
    + ["-O3", "-Xcompiler", "-fPIC", "-std=c++17"]
    # Platform define and the GPU architecture that is targeted.
    + ["-D__HIP_PLATFORM_AMD__=1", "--amdgpu-target=gfx942"]
    # Feature defines; presumably gate BF16/FP8 code paths in csrc - confirm.
    + ["-DENABLE_BF16", "-DENABLE_FP8"]
)

65
66
67
68
69
70
71
72
73
74
75
# The single native extension built by this script, importable as
# sgl_kernel.common_ops.
ext_modules = [
    CUDAExtension(
        name="sgl_kernel.common_ops",
        sources=sources,
        include_dirs=include_dirs,
        extra_compile_args={
            # hipcc_flags are passed under the "nvcc" key, cxx_flags under
            # the "cxx" key.
            "nvcc": hipcc_flags,
            "cxx": cxx_flags,
        },
        libraries=libraries,
        extra_link_args=extra_link_args,
        # NOTE(review): the bdist_wheel options passed to setup() request a
        # "cp39" limited-API tag while this extension is declared with
        # py_limited_api=False - confirm that the combination is intended.
        py_limited_api=False,
    ),
]

80
81
82
# Package definition: the Python packages live under python/, the version is
# read from pyproject.toml, and the native extension is built through
# BuildExtension with ninja enabled.
setup(
    name="sgl-kernel",
    version=_get_version(),
    packages=find_packages(where="python"),
    package_dir={"": "python"},
    ext_modules=ext_modules,
    cmdclass={"build_ext": BuildExtension.with_options(use_ninja=True)},
    # NOTE(review): this requests a "cp39" limited-API wheel tag although the
    # extension in ext_modules is declared with py_limited_api=False -
    # confirm that the combination is intended.
    options={"bdist_wheel": {"py_limited_api": "cp39"}},
)