Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
SIYIXNI
vllm
Commits
fd58b73a
"vscode:/vscode.git/clone" did not exist on "db7c80bf76c7bfcaee92a2f177c0db92745eb38f"
Unverified
Commit
fd58b73a
authored
Nov 09, 2023
by
Woosuk Kwon
Committed by
GitHub
Nov 09, 2023
Browse files
Build CUDA11.8 wheels for release (#1596)
parent
8efe23f1
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
with
14 additions
and
3 deletions
+14
-3
.github/workflows/publish.yml
.github/workflows/publish.yml
+1
-1
setup.py
setup.py
+13
-2
No files found.
.github/workflows/publish.yml
View file @
fd58b73a
...
...
@@ -50,7 +50,7 @@ jobs:
os
:
[
'
ubuntu-20.04'
]
python-version
:
[
'
3.8'
,
'
3.9'
,
'
3.10'
,
'
3.11'
]
pytorch-version
:
[
'
2.1.0'
]
cuda-version
:
[
'
12.1'
]
cuda-version
:
[
'
11.8'
,
'
12.1'
]
steps
:
-
name
:
Checkout
...
...
setup.py
View file @
fd58b73a
...
...
@@ -12,6 +12,8 @@ from torch.utils.cpp_extension import BuildExtension, CUDAExtension, CUDA_HOME
ROOT_DIR
=
os
.
path
.
dirname
(
__file__
)
MAIN_CUDA_VERSION
=
"12.1"
# Supported NVIDIA GPU architectures.
SUPPORTED_ARCHS
=
{
"7.0"
,
"7.5"
,
"8.0"
,
"8.6"
,
"8.9"
,
"9.0"
}
...
...
@@ -225,7 +227,7 @@ def get_path(*filepath) -> str:
return
os
.
path
.
join
(
ROOT_DIR
,
*
filepath
)
def
find_version
(
filepath
:
str
):
def
find_version
(
filepath
:
str
)
->
str
:
"""Extract version information from the given filepath.
Adapted from https://github.com/ray-project/ray/blob/0b190ee1160eeca9796bc091e07eaebf4c85b511/python/setup.py
...
...
@@ -238,6 +240,15 @@ def find_version(filepath: str):
raise
RuntimeError
(
"Unable to find version string."
)
def
get_vllm_version
()
->
str
:
version
=
find_version
(
get_path
(
"vllm"
,
"__init__.py"
))
cuda_version
=
str
(
nvcc_cuda_version
)
if
cuda_version
!=
MAIN_CUDA_VERSION
:
cuda_version_str
=
cuda_version
.
replace
(
"."
,
""
)[:
3
]
version
+=
f
"+cu
{
cuda_version_str
}
"
return
version
def
read_readme
()
->
str
:
"""Read the README file if present."""
p
=
get_path
(
"README.md"
)
...
...
@@ -256,7 +267,7 @@ def get_requirements() -> List[str]:
setuptools
.
setup
(
name
=
"vllm"
,
version
=
find_version
(
get_path
(
"vllm"
,
"__init__.py"
)
),
version
=
get_vllm_version
(
),
author
=
"vLLM Team"
,
license
=
"Apache 2.0"
,
description
=
(
"A high-throughput and memory-efficient inference and "
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment