Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
wqshmzh
ktransformers
Commits
1dd84b4a
"tools/vscode:/vscode.git/clone" did not exist on "e7c25c06df676a19e841897d3db7779aa24f4d88"
Unverified
Commit
1dd84b4a
authored
Feb 20, 2025
by
ZiWei Yuan
Committed by
GitHub
Feb 20, 2025
Browse files
Merge pull request #550 from kvcache-ai/docker_dev
Docker dev
parents
64a00651
ed74f91a
Changes
4
Hide whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
95 additions
and
50 deletions
+95
-50
.github/workflows/docker-image
.github/workflows/docker-image
+0
-47
.github/workflows/docker-image.yml
.github/workflows/docker-image.yml
+90
-0
Dockerfile
Dockerfile
+4
-2
ktransformers/tests/mmlu_pro_test.py
ktransformers/tests/mmlu_pro_test.py
+1
-1
No files found.
.github/workflows/docker-image
deleted
100644 → 0
View file @
64a00651
# Publishes a multi-platform ktransformers image to Docker Hub each time a
# GitHub release is published.
name: DockerHub CI

on:
  release:
    types:
      - published

env:
  # Target repository on Docker Hub: <DOCKERHUB_USERNAME>/ktransformers.
  DOCKERHUB_REPO: ${{ secrets.DOCKERHUB_USERNAME }}/ktransformers

jobs:
  build:
    runs-on: ubuntu-latest
    steps:
      # Relocate Docker's data directory to /mnt/docker and leave a symlink at
      # the old path (presumably to gain disk space on the runner -- confirm).
      - name: Move Docker data directory
        run: |
          sudo systemctl stop docker
          sudo mkdir -p /mnt/docker
          sudo rsync -avz /var/lib/docker/ /mnt/docker
          sudo rm -rf /var/lib/docker
          sudo ln -s /mnt/docker /var/lib/docker
          sudo systemctl start docker

      - name: Set up QEMU
        uses: docker/setup-qemu-action@v3

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3

      - name: Login to Docker Hub
        uses: docker/login-action@v3
        with:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_TOKEN }}

      # One build covering both platforms, pushed under `latest` and under the
      # tag name of the release that triggered the run.
      - name: Build and push
        uses: docker/build-push-action@v6
        with:
          push: true
          platforms: |
            linux/amd64
            linux/arm64
          tags: |
            ${{ env.DOCKERHUB_REPO }}:latest
            ${{ env.DOCKERHUB_REPO }}:${{ github.event.release.tag_name }}
.github/workflows/docker-image.yml
0 → 100644
View file @
1dd84b4a
# Builds the ktransformers Docker image and publishes it to Docker Hub each
# time a GitHub release is published. The `test` job must succeed first; the
# `docker_task` job then pushes one image per entry of its build matrix.
name: DockerHub CI

on:
  release:
    types: [published]
  # push:
  #   branches:
  #     - main

env:
  # Target repository on Docker Hub: <DOCKERHUB_USERNAME>/ktransformers.
  DOCKERHUB_REPO: ${{ secrets.DOCKERHUB_USERNAME }}/ktransformers

jobs:
  # Gate: run the compose-based test service when the repository ships a
  # docker-compose.test.yml, otherwise just check that the Dockerfile builds.
  test:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      - name: Run tests
        # Uses the Compose v2 plugin (`docker compose`) instead of the
        # standalone v1 `docker-compose` binary.
        run: |
          if [ -f docker-compose.test.yml ]; then
            docker compose --file docker-compose.test.yml build
            docker compose --file docker-compose.test.yml run sut
          else
            docker build . --file Dockerfile
          fi

  docker_task:
    needs: test
    # The platform is part of the name because the NATIVE variant is built for
    # two platforms and would otherwise show up as two identically named jobs.
    name: ${{ matrix.instruct }} (${{ matrix.platform }})
    runs-on: ubuntu-latest
    strategy:
      fail-fast: false
      matrix:
        # instruct:   value passed to the Dockerfile as CPU_INSTRUCT.
        # platform:   single target platform of the build.
        # tag_suffix: appended to every pushed tag. Each job pushes a
        #             single-platform image, so two entries sharing an
        #             `instruct` value must not share a tag or the later push
        #             overwrites the earlier one. amd64 keeps the plain tag.
        include:
          # for amd64
          - instruct: "FANCY"
            platform: "linux/amd64"
            tag_suffix: ""
          - instruct: "AVX512"
            platform: "linux/amd64"
            tag_suffix: ""
          - instruct: "AVX2"
            platform: "linux/amd64"
            tag_suffix: ""
          - instruct: "NATIVE"
            platform: "linux/amd64"
            tag_suffix: ""
          # for arm64
          - instruct: "NATIVE"
            platform: "linux/arm64"
            tag_suffix: "-arm64"
    steps:
      # Relocate Docker's data directory to /mnt/docker and leave a symlink at
      # the old path (presumably to gain disk space on the runner -- confirm).
      - name: Move Docker data directory
        run: |
          sudo systemctl stop docker
          sudo mkdir -p /mnt/docker
          sudo rsync -avz /var/lib/docker/ /mnt/docker
          sudo rm -rf /var/lib/docker
          sudo ln -s /mnt/docker /var/lib/docker
          sudo systemctl start docker

      - name: Set up QEMU
        uses: docker/setup-qemu-action@v3

      - name: Set up Docker Buildx
        uses: docker/setup-buildx-action@v3

      - name: Login to Docker Hub
        uses: docker/login-action@v3
        with:
          username: ${{ secrets.DOCKERHUB_USERNAME }}
          password: ${{ secrets.DOCKERHUB_TOKEN }}

      # Single build step for every matrix entry; the platform comes from the
      # matrix instead of being duplicated in per-platform conditional steps.
      - name: Build and push (${{ matrix.platform }})
        uses: docker/build-push-action@v6
        with:
          push: true
          platforms: ${{ matrix.platform }}
          tags: |
            ${{ env.DOCKERHUB_REPO }}:latest-${{ matrix.instruct }}${{ matrix.tag_suffix }}
            ${{ env.DOCKERHUB_REPO }}:${{ github.event.release.tag_name }}-${{ matrix.instruct }}${{ matrix.tag_suffix }}
          build-args: |
            CPU_INSTRUCT=${{ matrix.instruct }}
\ No newline at end of file
Dockerfile
View file @
1dd84b4a
...
@@ -11,6 +11,7 @@ EOF
...
@@ -11,6 +11,7 @@ EOF
FROM
pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server
FROM
pytorch/pytorch:2.3.1-cuda12.1-cudnn8-devel as compile_server
ARG
CPU_INSTRUCT=NATIVE
WORKDIR
/workspace
WORKDIR
/workspace
ENV
CUDA_HOME /usr/local/cuda
ENV
CUDA_HOME /usr/local/cuda
COPY
--from=web_compile /home/ktransformers /workspace/ktransformers
COPY
--from=web_compile /home/ktransformers /workspace/ktransformers
...
@@ -28,8 +29,9 @@ git submodule init &&
...
@@ -28,8 +29,9 @@ git submodule init &&
git submodule update &&
git submodule update &&
pip install ninja pyproject numpy cpufeature &&
pip install ninja pyproject numpy cpufeature &&
pip install flash-attn &&
pip install flash-attn &&
CPU_INSTRUCT=NATIVE KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9;9.0+PTX" pip install . --no-build-isolation --verbose &&
CPU_INSTRUCT=${CPU_INSTRUCT} KTRANSFORMERS_FORCE_BUILD=TRUE TORCH_CUDA_ARCH_LIST="8.0;8.6;8.7;8.9;9.0+PTX" pip install . --no-build-isolation --verbose &&
pip cache purge
pip cache purge &&
cp /usr/lib/x86_64-linux-gnu/libstdc++.so.6 /opt/conda/lib/
EOF
EOF
ENTRYPOINT
["tail", "-f", "/dev/null"]
ENTRYPOINT
["tail", "-f", "/dev/null"]
\ No newline at end of file
ktransformers/tests/mmlu_pro_test.py
View file @
1dd84b4a
...
@@ -176,7 +176,7 @@ if __name__ == "__main__":
...
@@ -176,7 +176,7 @@ if __name__ == "__main__":
parser
.
add_argument
(
"--result"
,
type
=
str
,
default
=
"./mmlu_pro.json"
,
help
=
"Path to save the result JSON file"
)
parser
.
add_argument
(
"--result"
,
type
=
str
,
default
=
"./mmlu_pro.json"
,
help
=
"Path to save the result JSON file"
)
parser
.
add_argument
(
"--log"
,
type
=
str
,
default
=
"./mmlu_pro.log"
,
help
=
"Path to save the log file"
)
parser
.
add_argument
(
"--log"
,
type
=
str
,
default
=
"./mmlu_pro.log"
,
help
=
"Path to save the log file"
)
parser
.
add_argument
(
"--model"
,
type
=
str
,
default
=
"Pro/deepseek-ai/DeepSeek-V3"
,
help
=
"Model name or path"
)
parser
.
add_argument
(
"--model"
,
type
=
str
,
default
=
"Pro/deepseek-ai/DeepSeek-V3"
,
help
=
"Model name or path"
)
parser
.
add_argument
(
"--api_url"
,
type
=
str
,
default
=
"http://localhost:1
0002
/v1/chat/completions"
,
help
=
"API URL"
)
parser
.
add_argument
(
"--api_url"
,
type
=
str
,
default
=
"http://localhost:1
5488
/v1/chat/completions"
,
help
=
"API URL"
)
# parser.add_argument("--api_url", type=str, default="https://api.siliconflow.cn/v1/chat/completions", help="API URL")
# parser.add_argument("--api_url", type=str, default="https://api.siliconflow.cn/v1/chat/completions", help="API URL")
args
=
parser
.
parse_args
()
args
=
parser
.
parse_args
()
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment