Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
Lmdeploy
Commits
3253240a
"...vllm_benchmark_throughput.git" did not exist on "e25b094622a2e5b3c72c808175e52059ea0600cc"
Commit
3253240a
authored
Jan 12, 2024
by
xiabo
Browse files
对应官方最新版本0.1.0主要增加page Attention
修改测试用例
parent
a8ce8d27
Changes
23
Expand all
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
522 additions
and
518 deletions
+522
-518
tests/csrc/unittests/CMakeLists.txt
tests/csrc/unittests/CMakeLists.txt
+20
-16
tests/csrc/unittests/test_gemm.cu
tests/csrc/unittests/test_gemm.cu
+498
-498
tests/csrc/unittests/test_sampling_kernels.cu
tests/csrc/unittests/test_sampling_kernels.cu
+4
-4
No files found.
tests/csrc/unittests/CMakeLists.txt
View file @
3253240a
...
@@ -17,11 +17,13 @@
...
@@ -17,11 +17,13 @@
include
(
FetchContent
)
include
(
FetchContent
)
FetchContent_Declare
(
FetchContent_Declare
(
googletest
googletest
GIT_REPOSITORY https://github.com/google/googletest.git
URL ../../../3rdparty/googletest-release-1.12.1
GIT_TAG release-1.12.1
#GIT_REPOSITORY https://github.com/google/googletest.git
#GIT_TAG release-1.12.1
)
)
find_package
(
CUDAToolkit REQUIRED
)
# find_package(CUDAToolkit REQUIRED)
find_package
(
CUDA REQUIRED
)
if
(
NOT MSVC
)
if
(
NOT MSVC
)
add_definitions
(
-DTORCH_CUDA=1
)
add_definitions
(
-DTORCH_CUDA=1
)
...
@@ -31,12 +33,14 @@ endif()
...
@@ -31,12 +33,14 @@ endif()
set
(
gtest_force_shared_crt ON CACHE BOOL
""
FORCE
)
set
(
gtest_force_shared_crt ON CACHE BOOL
""
FORCE
)
FetchContent_MakeAvailable
(
googletest
)
FetchContent_MakeAvailable
(
googletest
)
include_directories
(
../../../3rdparty/googletest-release-1.12.1/googletest/include
)
add_executable
(
unittest
add_executable
(
unittest
test_attention_kernels.cu
test_attention_kernels.cu
test_logprob_kernels.cu
test_logprob_kernels.cu
test_penalty_kernels.cu
test_penalty_kernels.cu
test_sampling_kernels.cu
test_sampling_kernels.cu
test_sampling_layer.cu
#
test_sampling_layer.cu
test_tensor.cu
)
test_tensor.cu
)
# automatic discovery of unit tests
# automatic discovery of unit tests
...
@@ -46,38 +50,38 @@ target_compile_features(unittest PRIVATE cxx_std_14)
...
@@ -46,38 +50,38 @@ target_compile_features(unittest PRIVATE cxx_std_14)
# Sorted by alphabetical order of test name.
# Sorted by alphabetical order of test name.
target_link_libraries
(
# Libs for test_attention_kernels
target_link_libraries
(
# Libs for test_attention_kernels
unittest PUBLIC
unittest PUBLIC
CUDA::
cudart
CUDA::
curand
cudart curand
gpt_kernels gtest memory_utils tensor unfused_attention_kernels cuda_utils logger
)
gpt_kernels gtest memory_utils tensor unfused_attention_kernels cuda_utils logger
)
target_link_libraries
(
# Libs for test_logprob_kernels
target_link_libraries
(
# Libs for test_logprob_kernels
unittest PUBLIC
unittest PUBLIC
CUDA::
cudart
cudart
logprob_kernels memory_utils cuda_utils logger
)
logprob_kernels memory_utils cuda_utils logger
)
target_link_libraries
(
# Libs for test_penalty_kernels
target_link_libraries
(
# Libs for test_penalty_kernels
unittest PUBLIC
unittest PUBLIC
CUDA::
cublas
CUDA::cublasLt CUDA::
cudart
cublas
cudart
sampling_penalty_kernels memory_utils cuda_utils logger
)
sampling_penalty_kernels memory_utils cuda_utils logger
)
target_link_libraries
(
# Libs for test_sampling_kernel
target_link_libraries
(
# Libs for test_sampling_kernel
unittest PUBLIC
unittest PUBLIC
CUDA::
cudart
cudart
sampling_topk_kernels sampling_topp_kernels memory_utils tensor cuda_utils logger
)
sampling_topk_kernels sampling_topp_kernels memory_utils tensor cuda_utils logger
)
target_link_libraries
(
# Libs for test_sampling_layer
target_link_libraries
(
# Libs for test_sampling_layer
unittest PUBLIC
unittest PUBLIC
CUDA::
cublas
CUDA::cublasLt CUDA::
cudart
cublas
cudart
cublasMMWrapper memory_utils
cublasMMWrapper memory_utils
DynamicDecodeLayer TopKSamplingLayer TopPSamplingLayer tensor cuda_utils logger
)
DynamicDecodeLayer TopKSamplingLayer TopPSamplingLayer tensor cuda_utils logger
)
target_link_libraries
(
# Libs for test_tensor
target_link_libraries
(
# Libs for test_tensor
unittest PUBLIC tensor cuda_utils logger
)
unittest PUBLIC
-lrocblas
tensor cuda_utils logger
)
remove_definitions
(
-DTORCH_CUDA=1
)
remove_definitions
(
-DTORCH_CUDA=1
)
add_executable
(
test_gemm test_gemm.cu
)
add_executable
(
test_gemm test_gemm.cu
)
target_link_libraries
(
test_gemm PUBLIC
CUDA::
cublas
CUDA::
cudart
CUDA::
curand gemm cublasMMWrapper tensor cuda_utils logger
)
target_link_libraries
(
test_gemm PUBLIC
-lrocblas
cublas cudart curand gemm cublasMMWrapper tensor cuda_utils logger
)
add_executable
(
test_gpt_kernels test_gpt_kernels.cu
)
add_executable
(
test_gpt_kernels test_gpt_kernels.cu
)
target_link_libraries
(
test_gpt_kernels PUBLIC
target_link_libraries
(
test_gpt_kernels PUBLIC
gpt_kernels memory_utils tensor cuda_utils logger
)
gpt_kernels memory_utils tensor cuda_utils logger
)
add_executable
(
test_context_attention_layer test_context_attention_layer.cu
)
#
add_executable(test_context_attention_layer test_context_attention_layer.cu)
target_link_libraries
(
test_context_attention_layer PUBLIC
#
target_link_libraries(test_context_attention_layer PUBLIC
Llama
CUDA::
cublas
CUDA::cublasLt CUDA::
cudart
#
Llama cublas
cudart
unfused_attention_kernels
#
unfused_attention_kernels
memory_utils tensor cublasMMWrapper cuda_utils logger
)
#
memory_utils tensor cublasMMWrapper cuda_utils logger)
tests/csrc/unittests/test_gemm.cu
View file @
3253240a
This diff is collapsed.
Click to expand it.
tests/csrc/unittests/test_sampling_kernels.cu
View file @
3253240a
...
@@ -446,10 +446,10 @@ TYPED_TEST(TopKSamplingKernelTest, BatchCorrectnessLargeK63)
...
@@ -446,10 +446,10 @@ TYPED_TEST(TopKSamplingKernelTest, BatchCorrectnessLargeK63)
this
->
runBatchTest
({
8
,
4000
,
1
,
63
,
1.0
f
,
8
});
this
->
runBatchTest
({
8
,
4000
,
1
,
63
,
1.0
f
,
8
});
};
};
TYPED_TEST
(
TopKSamplingKernelTest
,
BatchCorrectnessLargeK1024
)
//
TYPED_TEST(TopKSamplingKernelTest, BatchCorrectnessLargeK1024)
{
//
{
this
->
runBatchTest
({
8
,
4000
,
1
,
1024
,
0.0
f
,
8
});
//
this->runBatchTest({8, 4000, 1, 1024, 0.0f, 8});
};
//
};
TYPED_TEST
(
TopKSamplingKernelTest
,
BatchCorrectnessTopKTopP
)
TYPED_TEST
(
TopKSamplingKernelTest
,
BatchCorrectnessTopKTopP
)
{
{
...
...
Prev
1
2
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment