Unverified commit dce99862, authored by thatPepe, committed by GitHub
Browse files

Merge pull request #1053 from InfiniTensor/issue/1033xmake

Issue/1033 patch aten and fa adaptations
parents 8d99a8f5 d6e44e84
......@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopKVCachingDescriptor_t;
__C __export infiniStatus_t infiniopCreateKVCachingDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateKVCachingDescriptor(
infiniopHandle_t handle,
infiniopKVCachingDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t k_cache,
......@@ -14,9 +14,9 @@ __C __export infiniStatus_t infiniopCreateKVCachingDescriptor(
infiniopTensorDescriptor_t v,
infiniopTensorDescriptor_t past_kv_lengths);
__C __export infiniStatus_t infiniopGetKVCachingWorkspaceSize(infiniopKVCachingDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetKVCachingWorkspaceSize(infiniopKVCachingDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *k_cache,
......@@ -26,6 +26,6 @@ __C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc
const void *past_kv_lengths,
void *stream);
__C __export infiniStatus_t infiniopDestroyKVCachingDescriptor(infiniopKVCachingDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyKVCachingDescriptor(infiniopKVCachingDescriptor_t desc);
#endif
......@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopLayerNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateLayerNormDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateLayerNormDescriptor(
infiniopHandle_t handle,
infiniopLayerNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output_desc,
......@@ -16,9 +16,9 @@ __C __export infiniStatus_t infiniopCreateLayerNormDescriptor(
infiniopTensorDescriptor_t bias_desc,
float eps);
__C __export infiniStatus_t infiniopGetLayerNormWorkspaceSize(infiniopLayerNormDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetLayerNormWorkspaceSize(infiniopLayerNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
......@@ -29,6 +29,6 @@ __C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc
const void *bias,
void *stream);
__C __export infiniStatus_t infiniopDestroyLayerNormDescriptor(infiniopLayerNormDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyLayerNormDescriptor(infiniopLayerNormDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopLogSoftmaxDescriptor_t;
__C __export infiniStatus_t infiniopCreateLogSoftmaxDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateLogSoftmaxDescriptor(infiniopHandle_t handle,
infiniopLogSoftmaxDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc,
infiniopTensorDescriptor_t x_desc);
__C __export infiniStatus_t infiniopGetLogSoftmaxWorkspaceSize(infiniopLogSoftmaxDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetLogSoftmaxWorkspaceSize(infiniopLogSoftmaxDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLogSoftmax(infiniopLogSoftmaxDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopLogSoftmax(infiniopLogSoftmaxDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *y,
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroyLogSoftmaxDescriptor(infiniopLogSoftmaxDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyLogSoftmaxDescriptor(infiniopLogSoftmaxDescriptor_t desc);
#endif
......@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopLPNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateLPNormDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateLPNormDescriptor(
infiniopHandle_t handle,
infiniopLPNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output_desc,
......@@ -14,15 +14,15 @@ __C __export infiniStatus_t infiniopCreateLPNormDescriptor(
int p,
float eps);
__C __export infiniStatus_t infiniopGetLPNormWorkspaceSize(infiniopLPNormDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetLPNormWorkspaceSize(infiniopLPNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLPNorm(infiniopLPNormDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopLPNorm(infiniopLPNormDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *input,
void *stream);
__C __export infiniStatus_t infiniopDestroyLPNormDescriptor(infiniopLPNormDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyLPNormDescriptor(infiniopLPNormDescriptor_t desc);
#endif
......@@ -5,15 +5,15 @@
typedef struct InfiniopDescriptor *infiniopMulDescriptor_t;
__C __export infiniStatus_t infiniopCreateMulDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateMulDescriptor(infiniopHandle_t handle,
infiniopMulDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t c,
infiniopTensorDescriptor_t a,
infiniopTensorDescriptor_t b);
__C __export infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *c,
......@@ -21,6 +21,6 @@ __C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc,
const void *b,
void *stream);
__C __export infiniStatus_t infiniopDestroyMulDescriptor(infiniopMulDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyMulDescriptor(infiniopMulDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopOnesDescriptor_t;
__C __export infiniStatus_t infiniopCreateOnesDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateOnesDescriptor(infiniopHandle_t handle,
infiniopOnesDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetOnesWorkspaceSize(infiniopOnesDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetOnesWorkspaceSize(infiniopOnesDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopOnes(infiniopOnesDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopOnes(infiniopOnesDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *y,
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroyOnesDescriptor(infiniopOnesDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyOnesDescriptor(infiniopOnesDescriptor_t desc);
#endif
......@@ -30,7 +30,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionDescriptor_t;
* @param scale The attention scaling factor (typically 1/sqrt(head_size)).
* @return infiniStatus_t Status code.
*/
__C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor(
infiniopHandle_t handle,
infiniopPagedAttentionDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t out_desc,
......@@ -49,7 +49,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor(
* @param size A pointer to store the required workspace size in bytes.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
__INFINI_C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
infiniopPagedAttentionDescriptor_t desc, size_t *size);
/**
......@@ -68,7 +68,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
* @param stream The CUDA stream for the operation. Can be NULL.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopPagedAttention(
__INFINI_C __export infiniStatus_t infiniopPagedAttention(
infiniopPagedAttentionDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -87,7 +87,7 @@ __C __export infiniStatus_t infiniopPagedAttention(
* @param desc The descriptor to be destroyed.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopDestroyPagedAttentionDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroyPagedAttentionDescriptor(
infiniopPagedAttentionDescriptor_t desc);
#endif // __INFINIOP_PAGED_ATTENTION_API_H__
......@@ -29,7 +29,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionPrefillDescriptor_t;
* @param scale The attention scaling factor (typically 1.0 / sqrt(head_size)).
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
infiniopHandle_t handle,
infiniopPagedAttentionPrefillDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t out_desc,
......@@ -45,7 +45,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
/**
* @brief Retrieves the workspace size required for the Paged Attention Prefill operation.
*/
__C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
__INFINI_C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
infiniopPagedAttentionPrefillDescriptor_t desc, size_t *size);
/**
......@@ -64,7 +64,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
* @param stream The device stream (e.g., cudaStream_t) for the operation.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopPagedAttentionPrefill(
__INFINI_C __export infiniStatus_t infiniopPagedAttentionPrefill(
infiniopPagedAttentionPrefillDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -81,7 +81,7 @@ __C __export infiniStatus_t infiniopPagedAttentionPrefill(
/**
* @brief Destroys a Paged Attention Prefill descriptor.
*/
__C __export infiniStatus_t infiniopDestroyPagedAttentionPrefillDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroyPagedAttentionPrefillDescriptor(
infiniopPagedAttentionPrefillDescriptor_t desc);
#endif // __INFINIOP_PAGED_ATTENTION_PREFILL_API_H__
......@@ -21,7 +21,7 @@ typedef struct InfiniopDescriptor *infiniopPagedCachingDescriptor_t;
* @param slot_mapping_desc Descriptor for the slot mapping tensor.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopCreatePagedCachingDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreatePagedCachingDescriptor(
infiniopHandle_t handle,
infiniopPagedCachingDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t k_cache_desc,
......@@ -37,7 +37,7 @@ __C __export infiniStatus_t infiniopCreatePagedCachingDescriptor(
* @param size A pointer to store the required workspace size in bytes (typically 0).
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
__INFINI_C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
infiniopPagedCachingDescriptor_t desc, size_t *size);
/**
......@@ -54,7 +54,7 @@ __C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
* @param stream The CUDA stream for the operation. Can be NULL.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopPagedCaching(
__INFINI_C __export infiniStatus_t infiniopPagedCaching(
infiniopPagedCachingDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -71,7 +71,7 @@ __C __export infiniStatus_t infiniopPagedCaching(
* @param desc The descriptor to be destroyed.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopDestroyPagedCachingDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroyPagedCachingDescriptor(
infiniopPagedCachingDescriptor_t desc);
#endif // __INFINIOP_PAGED_CACHING_API_H__
......@@ -5,16 +5,16 @@
/* Descriptor handle type used by the PerChannelQuantI8 operator API.
 * The `struct` keyword is required: in C a struct tag is not a type name by
 * itself, so the bare `InfiniopDescriptor` spelling only compiles as C++.
 * This form matches the other infiniop descriptor typedefs. */
typedef struct InfiniopDescriptor *infiniopPerChannelQuantI8Descriptor_t;
__C __export infiniStatus_t infiniopCreatePerChannelQuantI8Descriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreatePerChannelQuantI8Descriptor(infiniopHandle_t handle,
infiniopPerChannelQuantI8Descriptor_t *desc_ptr,
infiniopTensorDescriptor_t x_packed_desc,
infiniopTensorDescriptor_t x_scale_desc,
infiniopTensorDescriptor_t x_zero_desc,
infiniopTensorDescriptor_t x_desc);
__C __export infiniStatus_t infiniopGetPerChannelQuantI8WorkspaceSize(infiniopPerChannelQuantI8Descriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetPerChannelQuantI8WorkspaceSize(infiniopPerChannelQuantI8Descriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8Descriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8Descriptor_t desc,
void *workspace,
size_t workspace_size,
void *x_packed,
......@@ -23,6 +23,6 @@ __C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8D
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroyPerChannelQuantI8Descriptor(infiniopPerChannelQuantI8Descriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyPerChannelQuantI8Descriptor(infiniopPerChannelQuantI8Descriptor_t desc);
#endif
......@@ -5,23 +5,23 @@
typedef struct InfiniopDescriptor *infiniopRandomSampleDescriptor_t;
__C __export infiniStatus_t infiniopCreateRandomSampleDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateRandomSampleDescriptor(
infiniopHandle_t handle,
infiniopRandomSampleDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t result,
infiniopTensorDescriptor_t probs);
__C __export infiniStatus_t infiniopGetRandomSampleWorkspaceSize(
__INFINI_C __export infiniStatus_t infiniopGetRandomSampleWorkspaceSize(
infiniopRandomSampleDescriptor_t desc,
size_t *size);
__C __export infiniStatus_t infiniopCreateRandomSampleBatchDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateRandomSampleBatchDescriptor(
infiniopHandle_t handle,
infiniopRandomSampleDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t result,
infiniopTensorDescriptor_t probs);
__C __export infiniStatus_t infiniopRandomSample(
__INFINI_C __export infiniStatus_t infiniopRandomSample(
infiniopRandomSampleDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -33,7 +33,7 @@ __C __export infiniStatus_t infiniopRandomSample(
float temperature,
void *stream);
__C __export infiniStatus_t infiniopRandomSampleBatch(
__INFINI_C __export infiniStatus_t infiniopRandomSampleBatch(
infiniopRandomSampleDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -46,7 +46,7 @@ __C __export infiniStatus_t infiniopRandomSampleBatch(
int batch_size,
void *stream);
__C __export infiniStatus_t infiniopDestroyRandomSampleDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroyRandomSampleDescriptor(
infiniopRandomSampleDescriptor_t desc);
#endif
......@@ -5,19 +5,19 @@
typedef struct InfiniopDescriptor *infiniopRearrangeDescriptor_t;
__C __export infiniStatus_t infiniopCreateRearrangeDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateRearrangeDescriptor(
infiniopHandle_t handle,
infiniopRearrangeDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t dst,
infiniopTensorDescriptor_t src);
__C __export infiniStatus_t infiniopRearrange(
__INFINI_C __export infiniStatus_t infiniopRearrange(
infiniopRearrangeDescriptor_t desc,
void *dst,
const void *src,
void *stream);
__C __export infiniStatus_t infiniopDestroyRearrangeDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroyRearrangeDescriptor(
infiniopRearrangeDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopReluDescriptor_t;
__C __export infiniStatus_t infiniopCreateReluDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateReluDescriptor(infiniopHandle_t handle,
infiniopReluDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetReluWorkspaceSize(infiniopReluDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetReluWorkspaceSize(infiniopReluDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRelu(infiniopReluDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopRelu(infiniopReluDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *y,
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroyReluDescriptor(infiniopReluDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyReluDescriptor(infiniopReluDescriptor_t desc);
#endif
......@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopRMSNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateRMSNormDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateRMSNormDescriptor(
infiniopHandle_t handle,
infiniopRMSNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc,
......@@ -13,11 +13,11 @@ __C __export infiniStatus_t infiniopCreateRMSNormDescriptor(
infiniopTensorDescriptor_t w_desc,
float epsilon);
__C __export infiniStatus_t infiniopGetRMSNormWorkspaceSize(infiniopRMSNormDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetRMSNormWorkspaceSize(infiniopRMSNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRMSNorm(infiniopRMSNormDescriptor_t desc, void *workspace, size_t workspace_size,
__INFINI_C __export infiniStatus_t infiniopRMSNorm(infiniopRMSNormDescriptor_t desc, void *workspace, size_t workspace_size,
void *y, const void *x, const void *w, void *stream);
__C __export infiniStatus_t infiniopDestroyRMSNormDescriptor(infiniopRMSNormDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyRMSNormDescriptor(infiniopRMSNormDescriptor_t desc);
#endif
......@@ -12,7 +12,7 @@ typedef enum {
typedef struct InfiniopDescriptor *infiniopRoPEDescriptor_t;
__C __export infiniStatus_t infiniopCreateRoPEDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateRoPEDescriptor(
infiniopHandle_t handle,
infiniopRoPEDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y,
......@@ -22,9 +22,9 @@ __C __export infiniStatus_t infiniopCreateRoPEDescriptor(
infiniopTensorDescriptor_t cos_table,
infiniopRoPEAlgo_t algo);
__C __export infiniStatus_t infiniopGetRoPEWorkspaceSize(infiniopRoPEDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetRoPEWorkspaceSize(infiniopRoPEDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRoPE(
__INFINI_C __export infiniStatus_t infiniopRoPE(
infiniopRoPEDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -35,6 +35,6 @@ __C __export infiniStatus_t infiniopRoPE(
void const *cos_table,
void *stream);
__C __export infiniStatus_t infiniopDestroyRoPEDescriptor(infiniopRoPEDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroyRoPEDescriptor(infiniopRoPEDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSigmoidDescriptor_t;
__C __export infiniStatus_t infiniopCreateSigmoidDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateSigmoidDescriptor(infiniopHandle_t handle,
infiniopSigmoidDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetSigmoidWorkspaceSize(infiniopSigmoidDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetSigmoidWorkspaceSize(infiniopSigmoidDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSigmoid(infiniopSigmoidDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopSigmoid(infiniopSigmoidDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *y,
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroySigmoidDescriptor(infiniopSigmoidDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroySigmoidDescriptor(infiniopSigmoidDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSiluDescriptor_t;
__C __export infiniStatus_t infiniopCreateSiluDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateSiluDescriptor(infiniopHandle_t handle,
infiniopSiluDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t intput);
__C __export infiniStatus_t infiniopGetSiluWorkspaceSize(infiniopSiluDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetSiluWorkspaceSize(infiniopSiluDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSilu(infiniopSiluDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopSilu(infiniopSiluDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *output,
const void *intput,
void *stream);
__C __export infiniStatus_t infiniopDestroySiluDescriptor(infiniopSiluDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroySiluDescriptor(infiniopSiluDescriptor_t desc);
#endif
......@@ -22,7 +22,7 @@ typedef struct InfiniopDescriptor *infiniopSiluAndMulDescriptor_t;
* @param input Descriptor for the input tensor. Shape [..., 2*d].
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor(
infiniopHandle_t handle,
infiniopSiluAndMulDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output,
......@@ -34,7 +34,7 @@ __C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor(
* @param size Pointer to store the required workspace size in bytes.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize(
__INFINI_C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize(
infiniopSiluAndMulDescriptor_t desc,
size_t *size);
......@@ -52,7 +52,7 @@ __C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize(
* @param stream Pointer to the execution stream (e.g., CUDA stream). Can be NULL for default stream.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopSiluAndMul(
__INFINI_C __export infiniStatus_t infiniopSiluAndMul(
infiniopSiluAndMulDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -65,7 +65,7 @@ __C __export infiniStatus_t infiniopSiluAndMul(
* @param desc The descriptor to destroy.
* @return infiniStatus_t Status code of the operation.
*/
__C __export infiniStatus_t infiniopDestroySiluAndMulDescriptor(
__INFINI_C __export infiniStatus_t infiniopDestroySiluAndMulDescriptor(
infiniopSiluAndMulDescriptor_t desc);
#endif // __INFINIOP_SILU_AND_MUL_API_H__
......@@ -5,16 +5,16 @@
typedef struct InfiniopDescriptor *infiniopSoftmaxDescriptor_t;
__C __export infiniStatus_t infiniopCreateSoftmaxDescriptor(
__INFINI_C __export infiniStatus_t infiniopCreateSoftmaxDescriptor(
infiniopHandle_t handle,
infiniopSoftmaxDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc,
infiniopTensorDescriptor_t x_desc,
int axis);
__C __export infiniStatus_t infiniopGetSoftmaxWorkspaceSize(infiniopSoftmaxDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetSoftmaxWorkspaceSize(infiniopSoftmaxDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSoftmax(
__INFINI_C __export infiniStatus_t infiniopSoftmax(
infiniopSoftmaxDescriptor_t desc,
void *workspace,
size_t workspace_size,
......@@ -22,6 +22,6 @@ __C __export infiniStatus_t infiniopSoftmax(
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroySoftmaxDescriptor(infiniopSoftmaxDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroySoftmaxDescriptor(infiniopSoftmaxDescriptor_t desc);
#endif
......@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSoftplusDescriptor_t;
__C __export infiniStatus_t infiniopCreateSoftplusDescriptor(infiniopHandle_t handle,
__INFINI_C __export infiniStatus_t infiniopCreateSoftplusDescriptor(infiniopHandle_t handle,
infiniopSoftplusDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetSoftplusWorkspaceSize(infiniopSoftplusDescriptor_t desc, size_t *size);
__INFINI_C __export infiniStatus_t infiniopGetSoftplusWorkspaceSize(infiniopSoftplusDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSoftplus(infiniopSoftplusDescriptor_t desc,
__INFINI_C __export infiniStatus_t infiniopSoftplus(infiniopSoftplusDescriptor_t desc,
void *workspace,
size_t workspace_size,
void *y,
const void *x,
void *stream);
__C __export infiniStatus_t infiniopDestroySoftplusDescriptor(infiniopSoftplusDescriptor_t desc);
__INFINI_C __export infiniStatus_t infiniopDestroySoftplusDescriptor(infiniopSoftplusDescriptor_t desc);
#endif
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment