Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
jerrrrry
infinicore
Commits
dce99862
Unverified
Commit
dce99862
authored
Mar 06, 2026
by
thatPepe
Committed by
GitHub
Mar 06, 2026
Browse files
Merge pull request #1053 from InfiniTensor/issue/1033xmake
Issue/1033 patch aten and fa adaptations
parents
8d99a8f5
d6e44e84
Changes
102
Show whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
125 additions
and
114 deletions
+125
-114
src/infiniop/ops/attention/operator.cc
src/infiniop/ops/attention/operator.cc
+21
-21
src/infiniop/ops/causal_softmax/operator.cc
src/infiniop/ops/causal_softmax/operator.cc
+4
-4
src/infiniop/ops/clip/operator.cc
src/infiniop/ops/clip/operator.cc
+4
-4
src/infiniop/ops/conv/operator.cc
src/infiniop/ops/conv/operator.cc
+13
-13
src/infiniop/ops/dequantize_awq/operator.cc
src/infiniop/ops/dequantize_awq/operator.cc
+5
-5
src/infiniop/ops/embedding/operator.cc
src/infiniop/ops/embedding/operator.cc
+3
-3
src/infiniop/ops/flash_attention/operator.cc
src/infiniop/ops/flash_attention/operator.cc
+4
-4
src/infiniop/ops/gelu/operator.cc
src/infiniop/ops/gelu/operator.cc
+4
-4
src/infiniop/ops/gemm/operator.cc
src/infiniop/ops/gemm/operator.cc
+4
-4
src/infiniop/ops/kv_caching/operator.cc
src/infiniop/ops/kv_caching/operator.cc
+4
-4
src/infiniop/ops/layer_norm/operator.cc
src/infiniop/ops/layer_norm/operator.cc
+4
-4
src/infiniop/ops/logsoftmax/operator.cc
src/infiniop/ops/logsoftmax/operator.cc
+4
-4
src/infiniop/ops/lp_norm/operator.cc
src/infiniop/ops/lp_norm/operator.cc
+4
-4
src/infiniop/ops/mul/operator.cc
src/infiniop/ops/mul/operator.cc
+4
-4
src/infiniop/ops/ones/operator.cc
src/infiniop/ops/ones/operator.cc
+4
-4
src/infiniop/ops/paged_attention/operator.cc
src/infiniop/ops/paged_attention/operator.cc
+4
-4
src/infiniop/ops/paged_attention_prefill/operator.cc
src/infiniop/ops/paged_attention_prefill/operator.cc
+4
-4
src/infiniop/ops/paged_caching/operator.cc
src/infiniop/ops/paged_caching/operator.cc
+4
-4
src/infiniop/ops/quant/per_channel_quant_int8/operator.cc
src/infiniop/ops/quant/per_channel_quant_int8/operator.cc
+16
-16
src/infiniop/ops/random_sample/nvidia/random_sample_kernel.cuh
...nfiniop/ops/random_sample/nvidia/random_sample_kernel.cuh
+11
-0
No files found.
src/infiniop/ops/attention/operator.cc
View file @
dce99862
...
...
@@ -31,7 +31,7 @@ struct InfiniopAttentionDescriptor {
float
qk_alpha
;
};
__C
__export
infiniStatus_t
infiniopCreateAttentionDescriptor
(
infiniopHandle_t
handle
,
__
INFINI_
C
__export
infiniStatus_t
infiniopCreateAttentionDescriptor
(
infiniopHandle_t
handle
,
infiniopAttentionDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
out_desc
,
infiniopTensorDescriptor_t
q_desc
,
...
...
@@ -218,12 +218,12 @@ __C __export infiniStatus_t infiniopCreateAttentionDescriptor(infiniopHandle_t h
return
INFINI_STATUS_SUCCESS
;
}
__C
__export
infiniStatus_t
infiniopGetAttentionWorkspaceSize
(
infiniopAttentionDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
__export
infiniStatus_t
infiniopGetAttentionWorkspaceSize
(
infiniopAttentionDescriptor_t
desc
,
size_t
*
size
)
{
*
size
=
((
InfiniopAttentionDescriptor
*
)
desc
)
->
workspace_size
;
return
INFINI_STATUS_SUCCESS
;
}
__C
__export
infiniStatus_t
infiniopAttention
(
infiniopAttentionDescriptor_t
desc_
,
__
INFINI_
C
__export
infiniStatus_t
infiniopAttention
(
infiniopAttentionDescriptor_t
desc_
,
void
*
workspace_
,
size_t
workspace_size_
,
void
*
out
,
...
...
@@ -274,7 +274,7 @@ __C __export infiniStatus_t infiniopAttention(infiniopAttentionDescriptor_t desc
return
INFINI_STATUS_SUCCESS
;
}
__C
__export
infiniStatus_t
infiniopDestroyAttentionDescriptor
(
infiniopAttentionDescriptor_t
desc_
)
{
__
INFINI_
C
__export
infiniStatus_t
infiniopDestroyAttentionDescriptor
(
infiniopAttentionDescriptor_t
desc_
)
{
auto
desc
=
(
InfiniopAttentionDescriptor
*
)
desc_
;
if
(
desc
->
rearrange_desc_q
)
{
CHECK_STATUS
(
infiniopDestroyRearrangeDescriptor
(
desc
->
rearrange_desc_q
));
...
...
src/infiniop/ops/causal_softmax/operator.cc
View file @
dce99862
...
...
@@ -24,7 +24,7 @@
#include "moore/causal_softmax_moore.h"
#endif
__C
infiniStatus_t
infiniopCreateCausalSoftmaxDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateCausalSoftmaxDescriptor
(
infiniopHandle_t
handle
,
infiniopCausalSoftmaxDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
y_desc
,
...
...
@@ -78,7 +78,7 @@ __C infiniStatus_t infiniopCreateCausalSoftmaxDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetCausalSoftmaxWorkspaceSize
(
infiniopCausalSoftmaxDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetCausalSoftmaxWorkspaceSize
(
infiniopCausalSoftmaxDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -125,7 +125,7 @@ __C infiniStatus_t infiniopGetCausalSoftmaxWorkspaceSize(infiniopCausalSoftmaxDe
#undef GET
}
__C
infiniStatus_t
infiniopCausalSoftmax
(
__
INFINI_
C
infiniStatus_t
infiniopCausalSoftmax
(
infiniopCausalSoftmaxDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
y
,
...
...
@@ -177,7 +177,7 @@ __C infiniStatus_t infiniopCausalSoftmax(
#undef CALCULATE
}
__C
infiniStatus_t
infiniopDestroyCausalSoftmaxDescriptor
(
infiniopCausalSoftmaxDescriptor_t
desc
)
{
__
INFINI_
C
infiniStatus_t
infiniopDestroyCausalSoftmaxDescriptor
(
infiniopCausalSoftmaxDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
case CASE: \
...
...
src/infiniop/ops/clip/operator.cc
View file @
dce99862
...
...
@@ -15,7 +15,7 @@
#include "kunlun/clip_kunlun.h"
#endif
__C
infiniStatus_t
infiniopCreateClipDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateClipDescriptor
(
infiniopHandle_t
handle
,
infiniopClipDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
y
,
...
...
@@ -62,7 +62,7 @@ __C infiniStatus_t infiniopCreateClipDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetClipWorkspaceSize
(
infiniopClipDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetClipWorkspaceSize
(
infiniopClipDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -98,7 +98,7 @@ __C infiniStatus_t infiniopGetClipWorkspaceSize(infiniopClipDescriptor_t desc, s
#undef GET
}
__C
infiniStatus_t
infiniopClip
(
__
INFINI_
C
infiniStatus_t
infiniopClip
(
infiniopClipDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -144,7 +144,7 @@ __C infiniStatus_t infiniopClip(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyClipDescriptor
(
infiniopClipDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/conv/operator.cc
View file @
dce99862
...
...
@@ -9,7 +9,7 @@
#include "nvidia/conv_nvidia.cuh"
#endif
__C
__export
infiniStatus_t
infiniopCreateConvDescriptor
(
infiniopHandle_t
handle
,
__
INFINI_
C
__export
infiniStatus_t
infiniopCreateConvDescriptor
(
infiniopHandle_t
handle
,
infiniopConvDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
y_desc
,
infiniopTensorDescriptor_t
x_desc
,
...
...
@@ -55,7 +55,7 @@ __C __export infiniStatus_t infiniopCreateConvDescriptor(infiniopHandle_t handle
#undef CREATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopGetConvWorkspaceSize
(
infiniopConvDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -90,7 +90,7 @@ infiniopGetConvWorkspaceSize(
#undef GET
}
__C
infiniStatus_t
infiniopConv
(
__
INFINI_
C
infiniStatus_t
infiniopConv
(
infiniopConvDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -131,7 +131,7 @@ __C infiniStatus_t infiniopConv(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyConvDescriptor
(
infiniopConvDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
case CASE: \
...
...
src/infiniop/ops/dequantize_awq/operator.cc
View file @
dce99862
...
...
@@ -12,7 +12,7 @@
#include "iluvatar/dequantize_w42f16_iluvatar.cuh"
#endif
__C
infiniStatus_t
infiniopCreateDequantizeAWQDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateDequantizeAWQDescriptor
(
infiniopHandle_t
handle
,
infiniopDequantizeAWQDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
out_desc
,
...
...
@@ -54,7 +54,7 @@ __C infiniStatus_t infiniopCreateDequantizeAWQDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetDequantizeAWQWorkspaceSize
(
infiniopDequantizeAWQDescriptor_t
desc
,
__
INFINI_
C
infiniStatus_t
infiniopGetDequantizeAWQWorkspaceSize
(
infiniopDequantizeAWQDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -84,7 +84,7 @@ __C infiniStatus_t infiniopGetDequantizeAWQWorkspaceSize(infiniopDequantizeAWQDe
#undef GET
}
__C
infiniStatus_t
infiniopDequantizeAWQ
(
__
INFINI_
C
infiniStatus_t
infiniopDequantizeAWQ
(
infiniopDequantizeAWQDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -123,7 +123,7 @@ __C infiniStatus_t infiniopDequantizeAWQ(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyDequantizeAWQDescriptor
(
infiniopDequantizeAWQDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/embedding/operator.cc
View file @
dce99862
...
...
@@ -15,7 +15,7 @@
#include "moore/embedding_moore.h"
#endif
__C
infiniStatus_t
infiniopCreateEmbeddingDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateEmbeddingDescriptor
(
infiniopHandle_t
handle
,
infiniopEmbeddingDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
output_desc
,
...
...
@@ -65,7 +65,7 @@ __C infiniStatus_t infiniopCreateEmbeddingDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopEmbedding
(
__
INFINI_
C
infiniStatus_t
infiniopEmbedding
(
infiniopEmbeddingDescriptor_t
desc
,
void
*
output
,
const
void
*
input
,
...
...
@@ -111,7 +111,7 @@ __C infiniStatus_t infiniopEmbedding(
#undef CALCULATE
}
__C
infiniStatus_t
infiniopDestroyEmbeddingDescriptor
(
infiniopEmbeddingDescriptor_t
desc
)
{
__
INFINI_
C
infiniStatus_t
infiniopDestroyEmbeddingDescriptor
(
infiniopEmbeddingDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
case CASE: \
...
...
src/infiniop/ops/flash_attention/operator.cc
View file @
dce99862
...
...
@@ -8,7 +8,7 @@
#endif
#endif
__C
infiniStatus_t
infiniopCreateFlashAttentionDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateFlashAttentionDescriptor
(
infiniopHandle_t
handle
,
infiniopFlashAttentionDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
out_desc
,
...
...
@@ -45,7 +45,7 @@ __C infiniStatus_t infiniopCreateFlashAttentionDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetFlashAttentionWorkspaceSize
(
__
INFINI_
C
infiniStatus_t
infiniopGetFlashAttentionWorkspaceSize
(
infiniopFlashAttentionDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -69,7 +69,7 @@ __C infiniStatus_t infiniopGetFlashAttentionWorkspaceSize(
#undef GET_SIZE
}
__C
infiniStatus_t
infiniopFlashAttention
(
__
INFINI_
C
infiniStatus_t
infiniopFlashAttention
(
infiniopFlashAttentionDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -99,7 +99,7 @@ __C infiniStatus_t infiniopFlashAttention(
#undef CALCULATE
}
__C
infiniStatus_t
infiniopDestroyFlashAttentionDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopDestroyFlashAttentionDescriptor
(
infiniopFlashAttentionDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
...
...
src/infiniop/ops/gelu/operator.cc
View file @
dce99862
...
...
@@ -15,7 +15,7 @@
#include "kunlun/gelu_kunlun.h"
#endif
__C
infiniStatus_t
infiniopCreateGeluDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateGeluDescriptor
(
infiniopHandle_t
handle
,
infiniopGeluDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
output_desc
,
...
...
@@ -60,7 +60,7 @@ __C infiniStatus_t infiniopCreateGeluDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetGeluWorkspaceSize
(
infiniopGeluDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetGeluWorkspaceSize
(
infiniopGeluDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -98,7 +98,7 @@ __C infiniStatus_t infiniopGetGeluWorkspaceSize(infiniopGeluDescriptor_t desc, s
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
}
__C
infiniStatus_t
infiniopGelu
(
__
INFINI_
C
infiniStatus_t
infiniopGelu
(
infiniopGeluDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -142,7 +142,7 @@ __C infiniStatus_t infiniopGelu(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyGeluDescriptor
(
infiniopGeluDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/gemm/operator.cc
View file @
dce99862
...
...
@@ -24,7 +24,7 @@
#include "kunlun/gemm_kunlun.h"
#endif
__C
infiniStatus_t
infiniopCreateGemmDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateGemmDescriptor
(
infiniopHandle_t
handle
,
infiniopGemmDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
c_desc
,
...
...
@@ -84,7 +84,7 @@ __C infiniStatus_t infiniopCreateGemmDescriptor(
#undef CREATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopGetGemmWorkspaceSize
(
infiniopGemmDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -137,7 +137,7 @@ infiniopGetGemmWorkspaceSize(
#undef GET
}
__C
infiniStatus_t
infiniopGemm
(
__
INFINI_
C
infiniStatus_t
infiniopGemm
(
infiniopGemmDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
c
,
...
...
@@ -198,7 +198,7 @@ __C infiniStatus_t infiniopGemm(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyGemmDescriptor
(
infiniopGemmDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/kv_caching/operator.cc
View file @
dce99862
...
...
@@ -9,7 +9,7 @@
#include "metax/kv_caching_metax.h"
#endif
__C
infiniStatus_t
infiniopCreateKVCachingDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateKVCachingDescriptor
(
infiniopHandle_t
handle
,
infiniopKVCachingDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
k_cache
,
...
...
@@ -57,7 +57,7 @@ __C infiniStatus_t infiniopCreateKVCachingDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetKVCachingWorkspaceSize
(
__
INFINI_
C
infiniStatus_t
infiniopGetKVCachingWorkspaceSize
(
infiniopKVCachingDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -95,7 +95,7 @@ __C infiniStatus_t infiniopGetKVCachingWorkspaceSize(
#undef GET_SIZE
}
__C
infiniStatus_t
infiniopKVCaching
(
__
INFINI_
C
infiniStatus_t
infiniopKVCaching
(
infiniopKVCachingDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -139,7 +139,7 @@ __C infiniStatus_t infiniopKVCaching(
#undef CALCULATE
}
__C
infiniStatus_t
infiniopDestroyKVCachingDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopDestroyKVCachingDescriptor
(
infiniopKVCachingDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/layer_norm/operator.cc
View file @
dce99862
...
...
@@ -12,7 +12,7 @@
#include "metax/layer_norm_metax.h"
#endif
__C
infiniStatus_t
infiniopCreateLayerNormDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateLayerNormDescriptor
(
infiniopHandle_t
handle
,
infiniopLayerNormDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
output_desc
,
...
...
@@ -63,7 +63,7 @@ __C infiniStatus_t infiniopCreateLayerNormDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetLayerNormWorkspaceSize
(
infiniopLayerNormDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetLayerNormWorkspaceSize
(
infiniopLayerNormDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
*size = reinterpret_cast<op::layer_norm::NAMESPACE::Descriptor *>(desc)->workspaceSize(); \
...
...
@@ -96,7 +96,7 @@ __C infiniStatus_t infiniopGetLayerNormWorkspaceSize(infiniopLayerNormDescriptor
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
}
__C
infiniStatus_t
infiniopLayerNorm
(
__
INFINI_
C
infiniStatus_t
infiniopLayerNorm
(
infiniopLayerNormDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -149,7 +149,7 @@ __C infiniStatus_t infiniopLayerNorm(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyLayerNormDescriptor
(
infiniopLayerNormDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/logsoftmax/operator.cc
View file @
dce99862
...
...
@@ -15,7 +15,7 @@
// #include "ascend/logsoftmax_ascend.h"
#endif
__C
infiniStatus_t
infiniopCreateLogSoftmaxDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateLogSoftmaxDescriptor
(
infiniopHandle_t
handle
,
infiniopLogSoftmaxDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
y_desc
,
...
...
@@ -56,7 +56,7 @@ __C infiniStatus_t infiniopCreateLogSoftmaxDescriptor(
}
}
__C
infiniStatus_t
infiniopGetLogSoftmaxWorkspaceSize
(
infiniopLogSoftmaxDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetLogSoftmaxWorkspaceSize
(
infiniopLogSoftmaxDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -90,7 +90,7 @@ __C infiniStatus_t infiniopGetLogSoftmaxWorkspaceSize(infiniopLogSoftmaxDescript
}
}
__C
infiniStatus_t
infiniopLogSoftmax
(
__
INFINI_
C
infiniStatus_t
infiniopLogSoftmax
(
infiniopLogSoftmaxDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
y
,
...
...
@@ -129,7 +129,7 @@ __C infiniStatus_t infiniopLogSoftmax(
}
}
__C
infiniStatus_t
infiniopDestroyLogSoftmaxDescriptor
(
infiniopLogSoftmaxDescriptor_t
desc
)
{
__
INFINI_
C
infiniStatus_t
infiniopDestroyLogSoftmaxDescriptor
(
infiniopLogSoftmaxDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
case CASE: \
...
...
src/infiniop/ops/lp_norm/operator.cc
View file @
dce99862
...
...
@@ -6,7 +6,7 @@
#include "nvidia/lp_norm_nvidia.cuh"
#endif
__C
infiniStatus_t
infiniopCreateLPNormDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateLPNormDescriptor
(
infiniopHandle_t
handle
,
infiniopLPNormDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
output_desc
,
...
...
@@ -47,7 +47,7 @@ __C infiniStatus_t infiniopCreateLPNormDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetLPNormWorkspaceSize
(
infiniopLPNormDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetLPNormWorkspaceSize
(
infiniopLPNormDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
*size = reinterpret_cast<op::lp_norm::NAMESPACE::Descriptor *>(desc)->workspaceSize(); \
...
...
@@ -75,7 +75,7 @@ __C infiniStatus_t infiniopGetLPNormWorkspaceSize(infiniopLPNormDescriptor_t des
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
}
__C
infiniStatus_t
infiniopLPNorm
(
__
INFINI_
C
infiniStatus_t
infiniopLPNorm
(
infiniopLPNormDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -114,7 +114,7 @@ __C infiniStatus_t infiniopLPNorm(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyLPNormDescriptor
(
infiniopLPNormDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/mul/operator.cc
View file @
dce99862
...
...
@@ -18,7 +18,7 @@
#include "moore/mul_moore.h"
#endif
__C
infiniStatus_t
infiniopCreateMulDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateMulDescriptor
(
infiniopHandle_t
handle
,
infiniopMulDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
c_desc
,
...
...
@@ -68,7 +68,7 @@ __C infiniStatus_t infiniopCreateMulDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetMulWorkspaceSize
(
infiniopMulDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetMulWorkspaceSize
(
infiniopMulDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -109,7 +109,7 @@ __C infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, siz
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
}
__C
infiniStatus_t
infiniopMul
(
__
INFINI_
C
infiniStatus_t
infiniopMul
(
infiniopMulDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -157,7 +157,7 @@ __C infiniStatus_t infiniopMul(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyMulDescriptor
(
infiniopMulDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/ones/operator.cc
View file @
dce99862
...
...
@@ -15,7 +15,7 @@
#include "moore/ones_moore.h"
#endif
__C
infiniStatus_t
infiniopCreateOnesDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreateOnesDescriptor
(
infiniopHandle_t
handle
,
infiniopOnesDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
y_desc
,
...
...
@@ -60,7 +60,7 @@ __C infiniStatus_t infiniopCreateOnesDescriptor(
#undef CREATE
}
__C
infiniStatus_t
infiniopGetOnesWorkspaceSize
(
infiniopOnesDescriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetOnesWorkspaceSize
(
infiniopOnesDescriptor_t
desc
,
size_t
*
size
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -98,7 +98,7 @@ __C infiniStatus_t infiniopGetOnesWorkspaceSize(infiniopOnesDescriptor_t desc, s
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
}
__C
infiniStatus_t
infiniopOnes
(
__
INFINI_
C
infiniStatus_t
infiniopOnes
(
infiniopOnesDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
...
...
@@ -142,7 +142,7 @@ __C infiniStatus_t infiniopOnes(
#undef CALCULATE
}
__C
infiniStatus_t
__
INFINI_
C
infiniStatus_t
infiniopDestroyOnesDescriptor
(
infiniopOnesDescriptor_t
desc
)
{
#define DELETE(CASE, NAMESPACE) \
...
...
src/infiniop/ops/paged_attention/operator.cc
View file @
dce99862
...
...
@@ -12,7 +12,7 @@
#include "metax/paged_attention_metax.h"
#endif
__C
infiniStatus_t
infiniopCreatePagedAttentionDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreatePagedAttentionDescriptor
(
infiniopHandle_t
handle
,
infiniopPagedAttentionDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
out_desc
,
...
...
@@ -54,7 +54,7 @@ __C infiniStatus_t infiniopCreatePagedAttentionDescriptor(
}
}
__C
infiniStatus_t
infiniopGetPagedAttentionWorkspaceSize
(
__
INFINI_
C
infiniStatus_t
infiniopGetPagedAttentionWorkspaceSize
(
infiniopPagedAttentionDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -84,7 +84,7 @@ __C infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
}
}
__C
infiniStatus_t
infiniopPagedAttention
(
__
INFINI_
C
infiniStatus_t
infiniopPagedAttention
(
infiniopPagedAttentionDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
out
,
const
void
*
q
,
const
void
*
k_cache
,
const
void
*
v_cache
,
...
...
@@ -118,7 +118,7 @@ __C infiniStatus_t infiniopPagedAttention(
}
}
__C
infiniStatus_t
infiniopDestroyPagedAttentionDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopDestroyPagedAttentionDescriptor
(
infiniopPagedAttentionDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
...
...
src/infiniop/ops/paged_attention_prefill/operator.cc
View file @
dce99862
...
...
@@ -12,7 +12,7 @@
#include "moore/paged_attention_prefill_moore.h"
#endif
__C
infiniStatus_t
infiniopCreatePagedAttentionPrefillDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreatePagedAttentionPrefillDescriptor
(
infiniopHandle_t
handle
,
infiniopPagedAttentionPrefillDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
out_desc
,
...
...
@@ -56,7 +56,7 @@ __C infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
}
}
__C
infiniStatus_t
infiniopGetPagedAttentionPrefillWorkspaceSize
(
__
INFINI_
C
infiniStatus_t
infiniopGetPagedAttentionPrefillWorkspaceSize
(
infiniopPagedAttentionPrefillDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -86,7 +86,7 @@ __C infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
}
}
__C
infiniStatus_t
infiniopPagedAttentionPrefill
(
__
INFINI_
C
infiniStatus_t
infiniopPagedAttentionPrefill
(
infiniopPagedAttentionPrefillDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
out
,
const
void
*
q
,
const
void
*
k_cache
,
const
void
*
v_cache
,
...
...
@@ -123,7 +123,7 @@ __C infiniStatus_t infiniopPagedAttentionPrefill(
}
}
__C
infiniStatus_t
infiniopDestroyPagedAttentionPrefillDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopDestroyPagedAttentionPrefillDescriptor
(
infiniopPagedAttentionPrefillDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
...
...
src/infiniop/ops/paged_caching/operator.cc
View file @
dce99862
...
...
@@ -12,7 +12,7 @@
#include "moore/paged_caching_moore.h"
#endif
__C
infiniStatus_t
infiniopCreatePagedCachingDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopCreatePagedCachingDescriptor
(
infiniopHandle_t
handle
,
infiniopPagedCachingDescriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
k_cache_desc
,
...
...
@@ -49,7 +49,7 @@ __C infiniStatus_t infiniopCreatePagedCachingDescriptor(
}
}
__C
infiniStatus_t
infiniopGetPagedCachingWorkspaceSize
(
__
INFINI_
C
infiniStatus_t
infiniopGetPagedCachingWorkspaceSize
(
infiniopPagedCachingDescriptor_t
desc
,
size_t
*
size
)
{
...
...
@@ -79,7 +79,7 @@ __C infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
}
}
__C
infiniStatus_t
infiniopPagedCaching
(
__
INFINI_
C
infiniStatus_t
infiniopPagedCaching
(
infiniopPagedCachingDescriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
k_cache
,
void
*
v_cache
,
...
...
@@ -113,7 +113,7 @@ __C infiniStatus_t infiniopPagedCaching(
}
}
__C
infiniStatus_t
infiniopDestroyPagedCachingDescriptor
(
__
INFINI_
C
infiniStatus_t
infiniopDestroyPagedCachingDescriptor
(
infiniopPagedCachingDescriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
...
...
src/infiniop/ops/quant/per_channel_quant_int8/operator.cc
View file @
dce99862
...
...
@@ -9,7 +9,7 @@
#include "moore/per_channel_quant_int8_moore.h"
#endif
__C
infiniStatus_t
infiniopCreatePerChannelQuantI8Descriptor
(
infiniopHandle_t
handle
,
__
INFINI_
C
infiniStatus_t
infiniopCreatePerChannelQuantI8Descriptor
(
infiniopHandle_t
handle
,
infiniopPerChannelQuantI8Descriptor_t
*
desc_ptr
,
infiniopTensorDescriptor_t
x_packed_desc
,
infiniopTensorDescriptor_t
x_scale_desc
,
...
...
@@ -40,7 +40,7 @@ __C infiniStatus_t infiniopCreatePerChannelQuantI8Descriptor(infiniopHandle_t ha
#undef CREATE
}
__C
infiniStatus_t
infiniopGetPerChannelQuantI8WorkspaceSize
(
infiniopPerChannelQuantI8Descriptor_t
desc
,
size_t
*
size
)
{
__
INFINI_
C
infiniStatus_t
infiniopGetPerChannelQuantI8WorkspaceSize
(
infiniopPerChannelQuantI8Descriptor_t
desc
,
size_t
*
size
)
{
switch
(
desc
->
device_type
)
{
#define GET(CASE, NAMESPACE) \
case CASE: \
...
...
@@ -61,7 +61,7 @@ __C infiniStatus_t infiniopGetPerChannelQuantI8WorkspaceSize(infiniopPerChannelQ
#undef GET
}
__C
infiniStatus_t
infiniopPerChannelQuantI8
(
infiniopPerChannelQuantI8Descriptor_t
desc
,
__
INFINI_
C
infiniStatus_t
infiniopPerChannelQuantI8
(
infiniopPerChannelQuantI8Descriptor_t
desc
,
void
*
workspace
,
size_t
workspace_size
,
void
*
x_packed
,
...
...
@@ -90,7 +90,7 @@ __C infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8Descriptor
#undef QUANT
}
__C
infiniStatus_t
infiniopDestroyPerChannelQuantI8Descriptor
(
infiniopPerChannelQuantI8Descriptor_t
desc
)
{
__
INFINI_
C
infiniStatus_t
infiniopDestroyPerChannelQuantI8Descriptor
(
infiniopPerChannelQuantI8Descriptor_t
desc
)
{
#define DESTROY(CASE, NAMESPACE) \
case CASE: \
delete reinterpret_cast<op::per_channel_quant_int8::NAMESPACE::Descriptor *>(desc); \
...
...
src/infiniop/ops/random_sample/nvidia/random_sample_kernel.cuh
View file @
dce99862
...
...
@@ -16,10 +16,21 @@ static cudaError argMax_(
void
*
workspace_ptr
,
size_t
&
workspace_len
,
cudaStream_t
stream
)
{
#if CUDART_VERSION >= 11000 && !defined(ENABLE_QY_API) && !defined(ENABLE_HYGON_API)
// New interface: separate value and index outputs
T
*
max_value
=
&
kv_pair
->
value
;
int
*
max_index
=
&
kv_pair
->
key
;
return
cub
::
DeviceReduce
::
ArgMax
(
workspace_ptr
,
workspace_len
,
logits
,
max_value
,
max_index
,
n
,
stream
);
#else
// Old interface
return
cub
::
DeviceReduce
::
ArgMax
(
workspace_ptr
,
workspace_len
,
logits
,
kv_pair
,
n
,
stream
);
#endif
}
template
<
class
Tval
,
class
Tidx
>
...
...
Prev
1
2
3
4
5
6
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment