Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
ktransformers
Commits
022b8938
Unverified
Commit
022b8938
authored
Aug 30, 2024
by
UnicornChan
Committed by
GitHub
Aug 30, 2024
Browse files
Merge pull request #67 from UnicornChan/main
[fix] fix bugs about Qwen2-57B, install requirement, DockerFile
parents
351698c3
49cce0c4
Changes
5
Hide whitespace changes
Inline
Side-by-side
Showing
5 changed files
with
21 additions
and
16 deletions
+21
-16
.github/workflows/package_wheel_release.yml
.github/workflows/package_wheel_release.yml
+5
-4
.github/workflows/package_wheel_test.yml
.github/workflows/package_wheel_test.yml
+13
-4
Dockerfile
Dockerfile
+2
-1
ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml
...mers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml
+0
-7
pyproject.toml
pyproject.toml
+1
-0
No files found.
.github/workflows/package_wheel_release.yml
View file @
022b8938
...
...
@@ -28,7 +28,6 @@ jobs:
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.1.1', torch: '2.4.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'FANCY', torch_cu: '121'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.1.1', torch: '2.4.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'AVX512', torch_cu: '121'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.1.1', torch: '2.4.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'AVX2', torch_cu: '121'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.5.1', torch: '2.3.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'FANCY', torch_cu: '124'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.2.2', torch: '2.3.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'FANCY', torch_cu: '121'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.2.2', torch: '2.3.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'AVX512', torch_cu: '121'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.2.2', torch: '2.3.0', cudaarch: '8.0;8.6;8.7;8.9;9.0+PTX', instruct: 'AVX2', torch_cu: '121'}
...
...
@@ -187,8 +186,10 @@ jobs:
}
}
if ($IsWindows) {
$env:CUDA_PATH = "$env:CUDA_PATH/Library"
$env:CUDA_HOME = $env:CUDA_PATH
if (Test-Path -Path "$env:CUDA_PATH/Library/bin/nvcc.exe"){
$env:CUDA_PATH = "$env:CUDA_PATH/Library"
$env:CUDA_HOME = $env:CUDA_PATH
}
$env:PATH = "$env:CUDA_PATH/bin;" + $env:PATH
$directory = "$env:CUDA_PATH/lib/x64/"
if (-not (Test-Path -Path $directory)) {
...
...
@@ -197,7 +198,7 @@ jobs:
}
cp $env:CUDA_PATH/lib/*.lib $env:CUDA_PATH/lib/x64/
$env:INCLUDE =$env:CUDA_PATH + "/include/targets/x64;" + $env:INCLUDE
$env:INCLUDE =$env:CONDA_PREFIX + "/include;" + $env:INCLUDE
}
python -m pip install torch==${{ matrix.torch }} torchvision torchaudio --index-url https://download.pytorch.org/whl/cu${{ matrix.torch_cu }}
python -m pip install cpufeature build wheel ninja packaging setuptools
...
...
.github/workflows/package_wheel_test.yml
View file @
022b8938
name: Build Wheels
name: Build Wheels Tests
on:
  workflow_dispatch:
    inputs:
...
...
@@ -16,8 +16,10 @@ jobs:
      matrix:
        include:
          # Ubuntu
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.5.1', torch: '2.4.0', cudaarch: '8.9;9.0+PTX', instruct: 'FANCY', torch_cu: '124'}
          - {os: ubuntu-20.04, pyver: '3.12', cuda: '12.2.2', torch: '2.3.0', cudaarch: '8.9;9.0+PTX', instruct: 'FANCY', torch_cu: '121'}
          - {os: windows-2022, pyver: '3.11', cuda: '12.5.1', torch: '2.4.0', cudaarch: '8.9;9.0+PTX', instruct: 'AVX2', torch_cu: '124'}
          - {os: windows-2022, pyver: '3.12', cuda: '12.1.1', torch: '2.3.0', cudaarch: '8.9;9.0+PTX', instruct: 'AVX2', torch_cu: '121'}
    defaults:
      run:
...
...
@@ -96,12 +98,19 @@ jobs:
}
}
if ($IsWindows) {
$env:CUDA_PATH = "$env:CUDA_PATH/Library"
$env:CUDA_HOME = $env:CUDA_PATH
if (Test-Path -Path "$env:CUDA_PATH/Library/bin/nvcc.exe"){
$env:CUDA_PATH = "$env:CUDA_PATH/Library"
$env:CUDA_HOME = $env:CUDA_PATH
}
$env:PATH = "$env:CUDA_PATH/bin;" + $env:PATH
$directory = "$env:CUDA_PATH/lib/x64/"
if (-not (Test-Path -Path $directory)) {
New-Item -ItemType Directory -Path $directory
Write-Output "Directory '$directory' created."
}
cp $env:CUDA_PATH/lib/*.lib $env:CUDA_PATH/lib/x64/
$env:INCLUDE =$env:CUDA_PATH + "/include/targets/x64;" + $env:INCLUDE
$env:INCLUDE =$env:CONDA_PREFIX + "/include;" + $env:INCLUDE
}
python -m pip install torch==${{ matrix.torch }} torchvision torchaudio --index-url https://download.pytorch.org/whl/cu${{ matrix.torch_cu }}
python -m pip install cpufeature build wheel ninja packaging setuptools
...
...
Dockerfile
View file @
022b8938
...
...
@@ -12,6 +12,7 @@ EOF
FROM pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server
WORKDIR /workspace
ENV CUDA_HOME /usr/local/cuda
COPY --from=web_compile /home/ktransformers /workspace/ktransformers
RUN <<EOF
apt update -y && apt install -y --no-install-recommends \
...
...
@@ -27,7 +28,7 @@ git submodule init &&
git submodule update &&
pip install ninja pyproject numpy cpufeature &&
pip install flash-attn &&
CPU_INSTRUCT=NATIVE KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9" pip install . --no-build-isolation --verbose &&
CPU_INSTRUCT=NATIVE KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9;9.0+PTX" pip install . --no-build-isolation --verbose &&
pip cache purge
EOF
...
...
ktransformers/optimize/optimize_rules/Qwen2-57B-A14B-Instruct.yaml
View file @
022b8938
- match:
    name: "^model\\.layers\\..*\\."
  replace:
    class: "default"
    kwargs:
      generate_device: "cuda"
      prefill_device: "cuda"
- match:
    class: ktransformers.models.modeling_qwen2_moe.Qwen2MoeRotaryEmbedding
  replace:
...
...
pyproject.toml
View file @
022b8938
...
...
@@ -18,6 +18,7 @@ dependencies = [
    "torch >= 2.3.0",
    "transformers == 4.43.2",
    "fastapi >= 0.111.0",
    "uvicorn >= 0.30.1",
    "langchain >= 0.2.0",
    "blessed >= 1.20.0",
    "accelerate >= 0.31.0",
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment