# setup_rocm.py
# Copyright 2025 SGLang Team. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

import sys
from pathlib import Path

from setuptools import find_packages, setup
from torch.utils.cpp_extension import BuildExtension, CUDAExtension

# Absolute path of the directory that contains this script; the other paths
# in this file (pyproject.toml, include/, csrc/) are built from it.
root = Path(__file__).parent.resolve()


def _get_version():
    """Return the ``version`` value declared in ``pyproject.toml``.

    The ``pyproject.toml`` located in ``root`` is scanned line by line and
    the first ``version = ...`` assignment wins.

    Returns:
        The version string with surrounding quotes removed, or ``None`` when
        the file contains no ``version`` key.

    Raises:
        OSError: If ``pyproject.toml`` cannot be opened.
    """
    with open(root / "pyproject.toml", encoding="utf-8") as f:
        for line in f:
            key, sep, value = line.partition("=")
            # Require an exact key match so that keys which merely start
            # with "version" (e.g. "version_file") are not picked up.
            if not sep or key.strip() != "version":
                continue
            # Drop a trailing inline comment before unquoting; TOML allows
            # both double- and single-quoted strings.
            value = value.split("#", 1)[0].strip()
            return value.strip("\"'")
    # No version key found: keep the historical "return None" behaviour.
    return None


# Value substituted into the -DOPERATOR_NAMESPACE compile definition.
operator_namespace = "sgl_kernel"

# Header search paths, anchored at the directory of this script.
include_dirs = [
    root / "include",
    root / "csrc",
]

# Source files compiled into the extension, given as relative paths.
sources = [
    "csrc/allreduce/custom_all_reduce.hip",
    "csrc/moe/moe_align_kernel.cu",
    "csrc/moe/moe_topk_softmax_kernels.cu",
    "csrc/torch_extension_rocm.cc",
    "csrc/speculative/eagle_utils.cu",
]

# Libraries the extension is linked against, and the extra linker arguments:
# an rpath entry relative to $ORIGIN pointing at torch/lib, plus an
# additional library search directory.
libraries = ["hiprtc", "amdhip64", "c10", "torch", "torch_python"]
extra_link_args = [
    "-Wl,-rpath,$ORIGIN/../../torch/lib",
    "-L/usr/lib/x86_64-linux-gnu",
]

# Flags passed under the "cxx" key of extra_compile_args.
cxx_flags = ["-O3"]

# Flags passed under the "nvcc" key of extra_compile_args.
hipcc_flags = [
    # Preprocessor definitions shared by every translation unit.
    "-DNDEBUG",
    f"-DOPERATOR_NAMESPACE={operator_namespace}",
    # Optimisation level, host-compiler pass-through and language standard.
    "-O3",
    "-Xcompiler",
    "-fPIC",
    "-std=c++17",
    # HIP platform selection and the single GPU architecture built for.
    "-D__HIP_PLATFORM_AMD__=1",
    "--amdgpu-target=gfx942",
    # Feature switches.
    "-DENABLE_BF16",
    "-DENABLE_FP8",
]

# Compiler flags keyed the way CUDAExtension expects them; the "nvcc" entry
# carries the hipcc flag list defined in this file.
_compile_args = {
    "nvcc": hipcc_flags,
    "cxx": cxx_flags,
}

# The single native module of the package, importable as sgl_kernel.common_ops.
_common_ops = CUDAExtension(
    name="sgl_kernel.common_ops",
    sources=sources,
    include_dirs=include_dirs,
    extra_compile_args=_compile_args,
    libraries=libraries,
    extra_link_args=extra_link_args,
    py_limited_api=True,
)

ext_modules = [_common_ops]

# Package definition: pure-Python packages are discovered under "python/",
# the native extension is built through torch's BuildExtension with ninja
# enabled, and wheels are tagged for the cp39 limited API.
setup(
    name="sgl-kernel",
    version=_get_version(),
    packages=find_packages(where="python"),
    package_dir={"": "python"},
    ext_modules=ext_modules,
    cmdclass={"build_ext": BuildExtension.with_options(use_ninja=True)},
    options={"bdist_wheel": {"py_limited_api": "cp39"}},
)