"docs/vscode:/vscode.git/clone" did not exist on "c0777e6565a5ab58db699de75cd122ef9b8de847"
Unverified Commit dce99862 authored by thatPepe's avatar thatPepe Committed by GitHub
Browse files

Merge pull request #1053 from InfiniTensor/issue/1033xmake

Issue/1033 patch aten and fa adaptations
parents 8d99a8f5 d6e44e84
...@@ -5,7 +5,7 @@ ...@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopKVCachingDescriptor_t; typedef struct InfiniopDescriptor *infiniopKVCachingDescriptor_t;
__C __export infiniStatus_t infiniopCreateKVCachingDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateKVCachingDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopKVCachingDescriptor_t *desc_ptr, infiniopKVCachingDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t k_cache, infiniopTensorDescriptor_t k_cache,
...@@ -14,9 +14,9 @@ __C __export infiniStatus_t infiniopCreateKVCachingDescriptor( ...@@ -14,9 +14,9 @@ __C __export infiniStatus_t infiniopCreateKVCachingDescriptor(
infiniopTensorDescriptor_t v, infiniopTensorDescriptor_t v,
infiniopTensorDescriptor_t past_kv_lengths); infiniopTensorDescriptor_t past_kv_lengths);
__C __export infiniStatus_t infiniopGetKVCachingWorkspaceSize(infiniopKVCachingDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetKVCachingWorkspaceSize(infiniopKVCachingDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *k_cache, void *k_cache,
...@@ -26,6 +26,6 @@ __C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc ...@@ -26,6 +26,6 @@ __C __export infiniStatus_t infiniopKVCaching(infiniopKVCachingDescriptor_t desc
const void *past_kv_lengths, const void *past_kv_lengths,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyKVCachingDescriptor(infiniopKVCachingDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyKVCachingDescriptor(infiniopKVCachingDescriptor_t desc);
#endif #endif
...@@ -5,7 +5,7 @@ ...@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopLayerNormDescriptor_t; typedef struct InfiniopDescriptor *infiniopLayerNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateLayerNormDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateLayerNormDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopLayerNormDescriptor_t *desc_ptr, infiniopLayerNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output_desc, infiniopTensorDescriptor_t output_desc,
...@@ -16,9 +16,9 @@ __C __export infiniStatus_t infiniopCreateLayerNormDescriptor( ...@@ -16,9 +16,9 @@ __C __export infiniStatus_t infiniopCreateLayerNormDescriptor(
infiniopTensorDescriptor_t bias_desc, infiniopTensorDescriptor_t bias_desc,
float eps); float eps);
__C __export infiniStatus_t infiniopGetLayerNormWorkspaceSize(infiniopLayerNormDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetLayerNormWorkspaceSize(infiniopLayerNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *output, void *output,
...@@ -29,6 +29,6 @@ __C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc ...@@ -29,6 +29,6 @@ __C __export infiniStatus_t infiniopLayerNorm(infiniopLayerNormDescriptor_t desc
const void *bias, const void *bias,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyLayerNormDescriptor(infiniopLayerNormDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyLayerNormDescriptor(infiniopLayerNormDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopLogSoftmaxDescriptor_t; typedef struct InfiniopDescriptor *infiniopLogSoftmaxDescriptor_t;
__C __export infiniStatus_t infiniopCreateLogSoftmaxDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateLogSoftmaxDescriptor(infiniopHandle_t handle,
infiniopLogSoftmaxDescriptor_t *desc_ptr, infiniopLogSoftmaxDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc, infiniopTensorDescriptor_t y_desc,
infiniopTensorDescriptor_t x_desc); infiniopTensorDescriptor_t x_desc);
__C __export infiniStatus_t infiniopGetLogSoftmaxWorkspaceSize(infiniopLogSoftmaxDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetLogSoftmaxWorkspaceSize(infiniopLogSoftmaxDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLogSoftmax(infiniopLogSoftmaxDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopLogSoftmax(infiniopLogSoftmaxDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *y, void *y,
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyLogSoftmaxDescriptor(infiniopLogSoftmaxDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyLogSoftmaxDescriptor(infiniopLogSoftmaxDescriptor_t desc);
#endif #endif
...@@ -5,7 +5,7 @@ ...@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopLPNormDescriptor_t; typedef struct InfiniopDescriptor *infiniopLPNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateLPNormDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateLPNormDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopLPNormDescriptor_t *desc_ptr, infiniopLPNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output_desc, infiniopTensorDescriptor_t output_desc,
...@@ -14,15 +14,15 @@ __C __export infiniStatus_t infiniopCreateLPNormDescriptor( ...@@ -14,15 +14,15 @@ __C __export infiniStatus_t infiniopCreateLPNormDescriptor(
int p, int p,
float eps); float eps);
__C __export infiniStatus_t infiniopGetLPNormWorkspaceSize(infiniopLPNormDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetLPNormWorkspaceSize(infiniopLPNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopLPNorm(infiniopLPNormDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopLPNorm(infiniopLPNormDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *output, void *output,
const void *input, const void *input,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyLPNormDescriptor(infiniopLPNormDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyLPNormDescriptor(infiniopLPNormDescriptor_t desc);
#endif #endif
...@@ -5,15 +5,15 @@ ...@@ -5,15 +5,15 @@
typedef struct InfiniopDescriptor *infiniopMulDescriptor_t; typedef struct InfiniopDescriptor *infiniopMulDescriptor_t;
__C __export infiniStatus_t infiniopCreateMulDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateMulDescriptor(infiniopHandle_t handle,
infiniopMulDescriptor_t *desc_ptr, infiniopMulDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t c, infiniopTensorDescriptor_t c,
infiniopTensorDescriptor_t a, infiniopTensorDescriptor_t a,
infiniopTensorDescriptor_t b); infiniopTensorDescriptor_t b);
__C __export infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *c, void *c,
...@@ -21,6 +21,6 @@ __C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc, ...@@ -21,6 +21,6 @@ __C __export infiniStatus_t infiniopMul(infiniopMulDescriptor_t desc,
const void *b, const void *b,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyMulDescriptor(infiniopMulDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyMulDescriptor(infiniopMulDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopOnesDescriptor_t; typedef struct InfiniopDescriptor *infiniopOnesDescriptor_t;
__C __export infiniStatus_t infiniopCreateOnesDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateOnesDescriptor(infiniopHandle_t handle,
infiniopOnesDescriptor_t *desc_ptr, infiniopOnesDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y, infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x); infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetOnesWorkspaceSize(infiniopOnesDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetOnesWorkspaceSize(infiniopOnesDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopOnes(infiniopOnesDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopOnes(infiniopOnesDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *y, void *y,
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyOnesDescriptor(infiniopOnesDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyOnesDescriptor(infiniopOnesDescriptor_t desc);
#endif #endif
...@@ -30,7 +30,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionDescriptor_t; ...@@ -30,7 +30,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionDescriptor_t;
* @param scale The attention scaling factor (typically 1/sqrt(head_size)). * @param scale The attention scaling factor (typically 1/sqrt(head_size)).
* @return infiniStatus_t Status code. * @return infiniStatus_t Status code.
*/ */
__C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor( __INFINI_C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopPagedAttentionDescriptor_t *desc_ptr, infiniopPagedAttentionDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t out_desc, infiniopTensorDescriptor_t out_desc,
...@@ -49,7 +49,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor( ...@@ -49,7 +49,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionDescriptor(
* @param size A pointer to store the required workspace size in bytes. * @param size A pointer to store the required workspace size in bytes.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize( __INFINI_C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
infiniopPagedAttentionDescriptor_t desc, size_t *size); infiniopPagedAttentionDescriptor_t desc, size_t *size);
/** /**
...@@ -68,7 +68,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize( ...@@ -68,7 +68,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionWorkspaceSize(
* @param stream The CUDA stream for the operation. Can be NULL. * @param stream The CUDA stream for the operation. Can be NULL.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopPagedAttention( __INFINI_C __export infiniStatus_t infiniopPagedAttention(
infiniopPagedAttentionDescriptor_t desc, infiniopPagedAttentionDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -87,7 +87,7 @@ __C __export infiniStatus_t infiniopPagedAttention( ...@@ -87,7 +87,7 @@ __C __export infiniStatus_t infiniopPagedAttention(
* @param desc The descriptor to be destroyed. * @param desc The descriptor to be destroyed.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopDestroyPagedAttentionDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroyPagedAttentionDescriptor(
infiniopPagedAttentionDescriptor_t desc); infiniopPagedAttentionDescriptor_t desc);
#endif // __INFINIOP_PAGED_ATTENTION_API_H__ #endif // __INFINIOP_PAGED_ATTENTION_API_H__
...@@ -29,7 +29,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionPrefillDescriptor_t; ...@@ -29,7 +29,7 @@ typedef struct InfiniopDescriptor *infiniopPagedAttentionPrefillDescriptor_t;
* @param scale The attention scaling factor (typically 1.0 / sqrt(head_size)). * @param scale The attention scaling factor (typically 1.0 / sqrt(head_size)).
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor( __INFINI_C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopPagedAttentionPrefillDescriptor_t *desc_ptr, infiniopPagedAttentionPrefillDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t out_desc, infiniopTensorDescriptor_t out_desc,
...@@ -45,7 +45,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor( ...@@ -45,7 +45,7 @@ __C __export infiniStatus_t infiniopCreatePagedAttentionPrefillDescriptor(
/** /**
* @brief Retrieves the workspace size required for the Paged Attention Prefill operation. * @brief Retrieves the workspace size required for the Paged Attention Prefill operation.
*/ */
__C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize( __INFINI_C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
infiniopPagedAttentionPrefillDescriptor_t desc, size_t *size); infiniopPagedAttentionPrefillDescriptor_t desc, size_t *size);
/** /**
...@@ -64,7 +64,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize( ...@@ -64,7 +64,7 @@ __C __export infiniStatus_t infiniopGetPagedAttentionPrefillWorkspaceSize(
* @param stream The device stream (e.g., cudaStream_t) for the operation. * @param stream The device stream (e.g., cudaStream_t) for the operation.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopPagedAttentionPrefill( __INFINI_C __export infiniStatus_t infiniopPagedAttentionPrefill(
infiniopPagedAttentionPrefillDescriptor_t desc, infiniopPagedAttentionPrefillDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -81,7 +81,7 @@ __C __export infiniStatus_t infiniopPagedAttentionPrefill( ...@@ -81,7 +81,7 @@ __C __export infiniStatus_t infiniopPagedAttentionPrefill(
/** /**
* @brief Destroys a Paged Attention Prefill descriptor. * @brief Destroys a Paged Attention Prefill descriptor.
*/ */
__C __export infiniStatus_t infiniopDestroyPagedAttentionPrefillDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroyPagedAttentionPrefillDescriptor(
infiniopPagedAttentionPrefillDescriptor_t desc); infiniopPagedAttentionPrefillDescriptor_t desc);
#endif // __INFINIOP_PAGED_ATTENTION_PREFILL_API_H__ #endif // __INFINIOP_PAGED_ATTENTION_PREFILL_API_H__
...@@ -21,7 +21,7 @@ typedef struct InfiniopDescriptor *infiniopPagedCachingDescriptor_t; ...@@ -21,7 +21,7 @@ typedef struct InfiniopDescriptor *infiniopPagedCachingDescriptor_t;
* @param slot_mapping_desc Descriptor for the slot mapping tensor. * @param slot_mapping_desc Descriptor for the slot mapping tensor.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopCreatePagedCachingDescriptor( __INFINI_C __export infiniStatus_t infiniopCreatePagedCachingDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopPagedCachingDescriptor_t *desc_ptr, infiniopPagedCachingDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t k_cache_desc, infiniopTensorDescriptor_t k_cache_desc,
...@@ -37,7 +37,7 @@ __C __export infiniStatus_t infiniopCreatePagedCachingDescriptor( ...@@ -37,7 +37,7 @@ __C __export infiniStatus_t infiniopCreatePagedCachingDescriptor(
* @param size A pointer to store the required workspace size in bytes (typically 0). * @param size A pointer to store the required workspace size in bytes (typically 0).
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize( __INFINI_C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
infiniopPagedCachingDescriptor_t desc, size_t *size); infiniopPagedCachingDescriptor_t desc, size_t *size);
/** /**
...@@ -54,7 +54,7 @@ __C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize( ...@@ -54,7 +54,7 @@ __C __export infiniStatus_t infiniopGetPagedCachingWorkspaceSize(
* @param stream The CUDA stream for the operation. Can be NULL. * @param stream The CUDA stream for the operation. Can be NULL.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopPagedCaching( __INFINI_C __export infiniStatus_t infiniopPagedCaching(
infiniopPagedCachingDescriptor_t desc, infiniopPagedCachingDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -71,7 +71,7 @@ __C __export infiniStatus_t infiniopPagedCaching( ...@@ -71,7 +71,7 @@ __C __export infiniStatus_t infiniopPagedCaching(
* @param desc The descriptor to be destroyed. * @param desc The descriptor to be destroyed.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopDestroyPagedCachingDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroyPagedCachingDescriptor(
infiniopPagedCachingDescriptor_t desc); infiniopPagedCachingDescriptor_t desc);
#endif // __INFINIOP_PAGED_CACHING_API_H__ #endif // __INFINIOP_PAGED_CACHING_API_H__
...@@ -5,16 +5,16 @@ ...@@ -5,16 +5,16 @@
typedef InfiniopDescriptor *infiniopPerChannelQuantI8Descriptor_t; typedef InfiniopDescriptor *infiniopPerChannelQuantI8Descriptor_t;
__C __export infiniStatus_t infiniopCreatePerChannelQuantI8Descriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreatePerChannelQuantI8Descriptor(infiniopHandle_t handle,
infiniopPerChannelQuantI8Descriptor_t *desc_ptr, infiniopPerChannelQuantI8Descriptor_t *desc_ptr,
infiniopTensorDescriptor_t x_packed_desc, infiniopTensorDescriptor_t x_packed_desc,
infiniopTensorDescriptor_t x_scale_desc, infiniopTensorDescriptor_t x_scale_desc,
infiniopTensorDescriptor_t x_zero_desc, infiniopTensorDescriptor_t x_zero_desc,
infiniopTensorDescriptor_t x_desc); infiniopTensorDescriptor_t x_desc);
__C __export infiniStatus_t infiniopGetPerChannelQuantI8WorkspaceSize(infiniopPerChannelQuantI8Descriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetPerChannelQuantI8WorkspaceSize(infiniopPerChannelQuantI8Descriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8Descriptor_t desc, __INFINI_C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8Descriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *x_packed, void *x_packed,
...@@ -23,6 +23,6 @@ __C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8D ...@@ -23,6 +23,6 @@ __C __export infiniStatus_t infiniopPerChannelQuantI8(infiniopPerChannelQuantI8D
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyPerChannelQuantI8Descriptor(infiniopPerChannelQuantI8Descriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyPerChannelQuantI8Descriptor(infiniopPerChannelQuantI8Descriptor_t desc);
#endif #endif
...@@ -5,23 +5,23 @@ ...@@ -5,23 +5,23 @@
typedef struct InfiniopDescriptor *infiniopRandomSampleDescriptor_t; typedef struct InfiniopDescriptor *infiniopRandomSampleDescriptor_t;
__C __export infiniStatus_t infiniopCreateRandomSampleDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateRandomSampleDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopRandomSampleDescriptor_t *desc_ptr, infiniopRandomSampleDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t result, infiniopTensorDescriptor_t result,
infiniopTensorDescriptor_t probs); infiniopTensorDescriptor_t probs);
__C __export infiniStatus_t infiniopGetRandomSampleWorkspaceSize( __INFINI_C __export infiniStatus_t infiniopGetRandomSampleWorkspaceSize(
infiniopRandomSampleDescriptor_t desc, infiniopRandomSampleDescriptor_t desc,
size_t *size); size_t *size);
__C __export infiniStatus_t infiniopCreateRandomSampleBatchDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateRandomSampleBatchDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopRandomSampleDescriptor_t *desc_ptr, infiniopRandomSampleDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t result, infiniopTensorDescriptor_t result,
infiniopTensorDescriptor_t probs); infiniopTensorDescriptor_t probs);
__C __export infiniStatus_t infiniopRandomSample( __INFINI_C __export infiniStatus_t infiniopRandomSample(
infiniopRandomSampleDescriptor_t desc, infiniopRandomSampleDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -33,7 +33,7 @@ __C __export infiniStatus_t infiniopRandomSample( ...@@ -33,7 +33,7 @@ __C __export infiniStatus_t infiniopRandomSample(
float temperature, float temperature,
void *stream); void *stream);
__C __export infiniStatus_t infiniopRandomSampleBatch( __INFINI_C __export infiniStatus_t infiniopRandomSampleBatch(
infiniopRandomSampleDescriptor_t desc, infiniopRandomSampleDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -46,7 +46,7 @@ __C __export infiniStatus_t infiniopRandomSampleBatch( ...@@ -46,7 +46,7 @@ __C __export infiniStatus_t infiniopRandomSampleBatch(
int batch_size, int batch_size,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyRandomSampleDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroyRandomSampleDescriptor(
infiniopRandomSampleDescriptor_t desc); infiniopRandomSampleDescriptor_t desc);
#endif #endif
...@@ -5,19 +5,19 @@ ...@@ -5,19 +5,19 @@
typedef struct InfiniopDescriptor *infiniopRearrangeDescriptor_t; typedef struct InfiniopDescriptor *infiniopRearrangeDescriptor_t;
__C __export infiniStatus_t infiniopCreateRearrangeDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateRearrangeDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopRearrangeDescriptor_t *desc_ptr, infiniopRearrangeDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t dst, infiniopTensorDescriptor_t dst,
infiniopTensorDescriptor_t src); infiniopTensorDescriptor_t src);
__C __export infiniStatus_t infiniopRearrange( __INFINI_C __export infiniStatus_t infiniopRearrange(
infiniopRearrangeDescriptor_t desc, infiniopRearrangeDescriptor_t desc,
void *dst, void *dst,
const void *src, const void *src,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyRearrangeDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroyRearrangeDescriptor(
infiniopRearrangeDescriptor_t desc); infiniopRearrangeDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopReluDescriptor_t; typedef struct InfiniopDescriptor *infiniopReluDescriptor_t;
__C __export infiniStatus_t infiniopCreateReluDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateReluDescriptor(infiniopHandle_t handle,
infiniopReluDescriptor_t *desc_ptr, infiniopReluDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y, infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x); infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetReluWorkspaceSize(infiniopReluDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetReluWorkspaceSize(infiniopReluDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRelu(infiniopReluDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopRelu(infiniopReluDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *y, void *y,
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyReluDescriptor(infiniopReluDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyReluDescriptor(infiniopReluDescriptor_t desc);
#endif #endif
...@@ -5,7 +5,7 @@ ...@@ -5,7 +5,7 @@
typedef struct InfiniopDescriptor *infiniopRMSNormDescriptor_t; typedef struct InfiniopDescriptor *infiniopRMSNormDescriptor_t;
__C __export infiniStatus_t infiniopCreateRMSNormDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateRMSNormDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopRMSNormDescriptor_t *desc_ptr, infiniopRMSNormDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc, infiniopTensorDescriptor_t y_desc,
...@@ -13,11 +13,11 @@ __C __export infiniStatus_t infiniopCreateRMSNormDescriptor( ...@@ -13,11 +13,11 @@ __C __export infiniStatus_t infiniopCreateRMSNormDescriptor(
infiniopTensorDescriptor_t w_desc, infiniopTensorDescriptor_t w_desc,
float epsilon); float epsilon);
__C __export infiniStatus_t infiniopGetRMSNormWorkspaceSize(infiniopRMSNormDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetRMSNormWorkspaceSize(infiniopRMSNormDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRMSNorm(infiniopRMSNormDescriptor_t desc, void *workspace, size_t workspace_size, __INFINI_C __export infiniStatus_t infiniopRMSNorm(infiniopRMSNormDescriptor_t desc, void *workspace, size_t workspace_size,
void *y, const void *x, const void *w, void *stream); void *y, const void *x, const void *w, void *stream);
__C __export infiniStatus_t infiniopDestroyRMSNormDescriptor(infiniopRMSNormDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyRMSNormDescriptor(infiniopRMSNormDescriptor_t desc);
#endif #endif
...@@ -12,7 +12,7 @@ typedef enum { ...@@ -12,7 +12,7 @@ typedef enum {
typedef struct InfiniopDescriptor *infiniopRoPEDescriptor_t; typedef struct InfiniopDescriptor *infiniopRoPEDescriptor_t;
__C __export infiniStatus_t infiniopCreateRoPEDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateRoPEDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopRoPEDescriptor_t *desc_ptr, infiniopRoPEDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y, infiniopTensorDescriptor_t y,
...@@ -22,9 +22,9 @@ __C __export infiniStatus_t infiniopCreateRoPEDescriptor( ...@@ -22,9 +22,9 @@ __C __export infiniStatus_t infiniopCreateRoPEDescriptor(
infiniopTensorDescriptor_t cos_table, infiniopTensorDescriptor_t cos_table,
infiniopRoPEAlgo_t algo); infiniopRoPEAlgo_t algo);
__C __export infiniStatus_t infiniopGetRoPEWorkspaceSize(infiniopRoPEDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetRoPEWorkspaceSize(infiniopRoPEDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopRoPE( __INFINI_C __export infiniStatus_t infiniopRoPE(
infiniopRoPEDescriptor_t desc, infiniopRoPEDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -35,6 +35,6 @@ __C __export infiniStatus_t infiniopRoPE( ...@@ -35,6 +35,6 @@ __C __export infiniStatus_t infiniopRoPE(
void const *cos_table, void const *cos_table,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroyRoPEDescriptor(infiniopRoPEDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroyRoPEDescriptor(infiniopRoPEDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSigmoidDescriptor_t; typedef struct InfiniopDescriptor *infiniopSigmoidDescriptor_t;
__C __export infiniStatus_t infiniopCreateSigmoidDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateSigmoidDescriptor(infiniopHandle_t handle,
infiniopSigmoidDescriptor_t *desc_ptr, infiniopSigmoidDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y, infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x); infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetSigmoidWorkspaceSize(infiniopSigmoidDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetSigmoidWorkspaceSize(infiniopSigmoidDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSigmoid(infiniopSigmoidDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopSigmoid(infiniopSigmoidDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *y, void *y,
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroySigmoidDescriptor(infiniopSigmoidDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroySigmoidDescriptor(infiniopSigmoidDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSiluDescriptor_t; typedef struct InfiniopDescriptor *infiniopSiluDescriptor_t;
__C __export infiniStatus_t infiniopCreateSiluDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateSiluDescriptor(infiniopHandle_t handle,
infiniopSiluDescriptor_t *desc_ptr, infiniopSiluDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output, infiniopTensorDescriptor_t output,
infiniopTensorDescriptor_t intput); infiniopTensorDescriptor_t intput);
__C __export infiniStatus_t infiniopGetSiluWorkspaceSize(infiniopSiluDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetSiluWorkspaceSize(infiniopSiluDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSilu(infiniopSiluDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopSilu(infiniopSiluDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *output, void *output,
const void *intput, const void *intput,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroySiluDescriptor(infiniopSiluDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroySiluDescriptor(infiniopSiluDescriptor_t desc);
#endif #endif
...@@ -22,7 +22,7 @@ typedef struct InfiniopDescriptor *infiniopSiluAndMulDescriptor_t; ...@@ -22,7 +22,7 @@ typedef struct InfiniopDescriptor *infiniopSiluAndMulDescriptor_t;
* @param input Descriptor for the input tensor. Shape [..., 2*d]. * @param input Descriptor for the input tensor. Shape [..., 2*d].
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopSiluAndMulDescriptor_t *desc_ptr, infiniopSiluAndMulDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t output, infiniopTensorDescriptor_t output,
...@@ -34,7 +34,7 @@ __C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor( ...@@ -34,7 +34,7 @@ __C __export infiniStatus_t infiniopCreateSiluAndMulDescriptor(
* @param size Pointer to store the required workspace size in bytes. * @param size Pointer to store the required workspace size in bytes.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize( __INFINI_C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize(
infiniopSiluAndMulDescriptor_t desc, infiniopSiluAndMulDescriptor_t desc,
size_t *size); size_t *size);
...@@ -52,7 +52,7 @@ __C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize( ...@@ -52,7 +52,7 @@ __C __export infiniStatus_t infiniopGetSiluAndMulWorkspaceSize(
* @param stream Pointer to the execution stream (e.g., CUDA stream). Can be NULL for default stream. * @param stream Pointer to the execution stream (e.g., CUDA stream). Can be NULL for default stream.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopSiluAndMul( __INFINI_C __export infiniStatus_t infiniopSiluAndMul(
infiniopSiluAndMulDescriptor_t desc, infiniopSiluAndMulDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -65,7 +65,7 @@ __C __export infiniStatus_t infiniopSiluAndMul( ...@@ -65,7 +65,7 @@ __C __export infiniStatus_t infiniopSiluAndMul(
* @param desc The descriptor to destroy. * @param desc The descriptor to destroy.
* @return infiniStatus_t Status code of the operation. * @return infiniStatus_t Status code of the operation.
*/ */
__C __export infiniStatus_t infiniopDestroySiluAndMulDescriptor( __INFINI_C __export infiniStatus_t infiniopDestroySiluAndMulDescriptor(
infiniopSiluAndMulDescriptor_t desc); infiniopSiluAndMulDescriptor_t desc);
#endif // __INFINIOP_SILU_AND_MUL_API_H__ #endif // __INFINIOP_SILU_AND_MUL_API_H__
...@@ -5,16 +5,16 @@ ...@@ -5,16 +5,16 @@
typedef struct InfiniopDescriptor *infiniopSoftmaxDescriptor_t; typedef struct InfiniopDescriptor *infiniopSoftmaxDescriptor_t;
__C __export infiniStatus_t infiniopCreateSoftmaxDescriptor( __INFINI_C __export infiniStatus_t infiniopCreateSoftmaxDescriptor(
infiniopHandle_t handle, infiniopHandle_t handle,
infiniopSoftmaxDescriptor_t *desc_ptr, infiniopSoftmaxDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y_desc, infiniopTensorDescriptor_t y_desc,
infiniopTensorDescriptor_t x_desc, infiniopTensorDescriptor_t x_desc,
int axis); int axis);
__C __export infiniStatus_t infiniopGetSoftmaxWorkspaceSize(infiniopSoftmaxDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetSoftmaxWorkspaceSize(infiniopSoftmaxDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSoftmax( __INFINI_C __export infiniStatus_t infiniopSoftmax(
infiniopSoftmaxDescriptor_t desc, infiniopSoftmaxDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
...@@ -22,6 +22,6 @@ __C __export infiniStatus_t infiniopSoftmax( ...@@ -22,6 +22,6 @@ __C __export infiniStatus_t infiniopSoftmax(
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroySoftmaxDescriptor(infiniopSoftmaxDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroySoftmaxDescriptor(infiniopSoftmaxDescriptor_t desc);
#endif #endif
...@@ -5,20 +5,20 @@ ...@@ -5,20 +5,20 @@
typedef struct InfiniopDescriptor *infiniopSoftplusDescriptor_t; typedef struct InfiniopDescriptor *infiniopSoftplusDescriptor_t;
__C __export infiniStatus_t infiniopCreateSoftplusDescriptor(infiniopHandle_t handle, __INFINI_C __export infiniStatus_t infiniopCreateSoftplusDescriptor(infiniopHandle_t handle,
infiniopSoftplusDescriptor_t *desc_ptr, infiniopSoftplusDescriptor_t *desc_ptr,
infiniopTensorDescriptor_t y, infiniopTensorDescriptor_t y,
infiniopTensorDescriptor_t x); infiniopTensorDescriptor_t x);
__C __export infiniStatus_t infiniopGetSoftplusWorkspaceSize(infiniopSoftplusDescriptor_t desc, size_t *size); __INFINI_C __export infiniStatus_t infiniopGetSoftplusWorkspaceSize(infiniopSoftplusDescriptor_t desc, size_t *size);
__C __export infiniStatus_t infiniopSoftplus(infiniopSoftplusDescriptor_t desc, __INFINI_C __export infiniStatus_t infiniopSoftplus(infiniopSoftplusDescriptor_t desc,
void *workspace, void *workspace,
size_t workspace_size, size_t workspace_size,
void *y, void *y,
const void *x, const void *x,
void *stream); void *stream);
__C __export infiniStatus_t infiniopDestroySoftplusDescriptor(infiniopSoftplusDescriptor_t desc); __INFINI_C __export infiniStatus_t infiniopDestroySoftplusDescriptor(infiniopSoftplusDescriptor_t desc);
#endif #endif
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment