Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
jerrrrry
infinicore
Commits
f06eb359
Commit
f06eb359
authored
Jul 10, 2025
by
YdrMaster
Browse files
issue/291/refactor: 改造 +-*
Signed-off-by:
YdrMaster
<
ydrml@hotmail.com
>
parent
c235afb1
Changes
13
Show whitespace changes
Inline
Side-by-side
Showing
13 changed files
with
47 additions
and
48 deletions
+47
-48
src/infiniop/ops/add/cuda/kernel.cuh
src/infiniop/ops/add/cuda/kernel.cuh
+0
-0
src/infiniop/ops/add/nvidia/add_nvidia.cu
src/infiniop/ops/add/nvidia/add_nvidia.cu
+7
-7
src/infiniop/ops/add/nvidia/add_nvidia.cuh
src/infiniop/ops/add/nvidia/add_nvidia.cuh
+1
-1
src/infiniop/ops/add/operator.cc
src/infiniop/ops/add/operator.cc
+8
-8
src/infiniop/ops/clip/nvidia/clip_nvidia.cuh
src/infiniop/ops/clip/nvidia/clip_nvidia.cuh
+0
-1
src/infiniop/ops/mul/cuda/kernel.cuh
src/infiniop/ops/mul/cuda/kernel.cuh
+0
-0
src/infiniop/ops/mul/nvidia/mul_nvidia.cu
src/infiniop/ops/mul/nvidia/mul_nvidia.cu
+8
-8
src/infiniop/ops/mul/nvidia/mul_nvidia.cuh
src/infiniop/ops/mul/nvidia/mul_nvidia.cuh
+1
-1
src/infiniop/ops/mul/operator.cc
src/infiniop/ops/mul/operator.cc
+7
-7
src/infiniop/ops/sub/cuda/kernel.cuh
src/infiniop/ops/sub/cuda/kernel.cuh
+0
-0
src/infiniop/ops/sub/nvidia/sub_nvidia.cu
src/infiniop/ops/sub/nvidia/sub_nvidia.cu
+7
-7
src/infiniop/ops/sub/nvidia/sub_nvidia.cuh
src/infiniop/ops/sub/nvidia/sub_nvidia.cuh
+1
-1
src/infiniop/ops/sub/operator.cc
src/infiniop/ops/sub/operator.cc
+7
-7
No files found.
src/infiniop/ops/add/cuda/
add_cuda_int
ern
a
l.cuh
→
src/infiniop/ops/add/cuda/
k
ern
e
l.cuh
View file @
f06eb359
File moved
src/infiniop/ops/add/
cud
a/add_
cud
a.cu
→
src/infiniop/ops/add/
nvidi
a/add_
nvidi
a.cu
View file @
f06eb359
#include "add_
cud
a.cuh"
#include "
add_cuda_int
ern
a
l.cuh"
#include "add_
nvidi
a.cuh"
#include "
../cuda/k
ern
e
l.cuh"
namespace
op
::
add
::
cud
a
{
namespace
op
::
add
::
nvidi
a
{
Descriptor
::~
Descriptor
()
=
default
;
...
...
@@ -43,13 +43,13 @@ infiniStatus_t Descriptor::calculate(
switch
(
_dtype
)
{
case
INFINI_DTYPE_F16
:
return
_device_info
->
calculate
<
256
,
AddOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
AddOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_BF16
:
return
_device_info
->
calculate
<
256
,
AddOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
AddOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F32
:
return
_device_info
->
calculate
<
256
,
AddOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
AddOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F64
:
return
_device_info
->
calculate
<
256
,
AddOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
AddOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
default:
return
INFINI_STATUS_BAD_TENSOR_DTYPE
;
}
...
...
src/infiniop/ops/add/
cud
a/add_
cud
a.cuh
→
src/infiniop/ops/add/
nvidi
a/add_
nvidi
a.cuh
View file @
f06eb359
...
...
@@ -3,6 +3,6 @@
#include "../../../elementwise/cuda/elementwise_cuda_api.cuh"
ELEMENTWISE_DESCRIPTOR
(
add
,
cud
a
,
cuda
)
ELEMENTWISE_DESCRIPTOR
(
add
,
nvidi
a
,
cuda
)
#endif // __ADD_CUDA_API_H__
src/infiniop/ops/add/operator.cc
View file @
f06eb359
...
...
@@ -6,7 +6,7 @@
#include "cpu/add_cpu.h"
#endif
#ifdef ENABLE_NVIDIA_API
#include "
cud
a/add_
cud
a.cuh"
#include "
nvidi
a/add_
nvidi
a.cuh"
#endif
__C
infiniStatus_t
infiniopCreateAddDescriptor
(
...
...
@@ -31,7 +31,7 @@ __C infiniStatus_t infiniopCreateAddDescriptor(
CREATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CREATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CREATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -46,14 +46,14 @@ __C infiniStatus_t infiniopGetAddWorkspaceSize(infiniopAddDescriptor_t desc, siz
#define GET(CASE, NAMESPACE) \
case CASE: \
*size = reinterpret_cast<op::add::NAMESPACE::Descriptor *>(desc)->workspaceSize(); \
return INFINI_STATUS_SUCCESS
;
return INFINI_STATUS_SUCCESS
switch
(
desc
->
device_type
)
{
#ifdef ENABLE_CPU_API
GET
(
INFINI_DEVICE_CPU
,
cpu
)
GET
(
INFINI_DEVICE_CPU
,
cpu
)
;
#endif
#ifdef ENABLE_NVIDIA_API
GET
(
INFINI_DEVICE_NVIDIA
,
cud
a
)
GET
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
)
;
#endif
default:
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
...
...
@@ -83,7 +83,7 @@ __C infiniStatus_t infiniopAdd(
CALCULATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -99,7 +99,7 @@ infiniopDestroyAddDescriptor(infiniopAddDescriptor_t desc) {
#define DELETE(CASE, NAMESPACE) \
case CASE: \
delete reinterpret_cast<const op::add::NAMESPACE::Descriptor *>(desc); \
return INFINI_STATUS_SUCCESS
;
return INFINI_STATUS_SUCCESS
switch
(
desc
->
device_type
)
{
...
...
@@ -107,7 +107,7 @@ infiniopDestroyAddDescriptor(infiniopAddDescriptor_t desc) {
DELETE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
DELETE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
DELETE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
src/infiniop/ops/clip/nvidia/clip_nvidia.cuh
View file @
f06eb359
...
...
@@ -2,7 +2,6 @@
#define __CLIP_CUDA_API_H__
#include "../../../elementwise/cuda/elementwise_cuda_api.cuh"
#include "infiniop/ops/clip.h"
ELEMENTWISE_DESCRIPTOR
(
clip
,
nvidia
,
cuda
)
...
...
src/infiniop/ops/mul/cuda/
mul_cuda_int
ern
a
l.cuh
→
src/infiniop/ops/mul/cuda/
k
ern
e
l.cuh
View file @
f06eb359
File moved
src/infiniop/ops/mul/
cud
a/mul_
cud
a.cu
→
src/infiniop/ops/mul/
nvidi
a/mul_
nvidi
a.cu
View file @
f06eb359
#include "mul_
cud
a.cuh"
#include "
mul_cuda_int
ern
a
l.cuh"
#include "mul_
nvidi
a.cuh"
#include "
../cuda/k
ern
e
l.cuh"
namespace
op
::
mul
::
cud
a
{
namespace
op
::
mul
::
nvidi
a
{
Descriptor
::~
Descriptor
()
=
default
;
...
...
@@ -43,17 +43,17 @@ infiniStatus_t Descriptor::calculate(
switch
(
_dtype
)
{
case
INFINI_DTYPE_F16
:
return
_device_info
->
calculate
<
256
,
MulOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
MulOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F32
:
return
_device_info
->
calculate
<
256
,
MulOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
MulOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F64
:
return
_device_info
->
calculate
<
256
,
MulOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
MulOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_BF16
:
return
_device_info
->
calculate
<
256
,
MulOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
MulOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
default:
return
INFINI_STATUS_BAD_TENSOR_DTYPE
;
}
return
INFINI_STATUS_SUCCESS
;
}
}
// namespace op::mul::
cud
a
}
// namespace op::mul::
nvidi
a
src/infiniop/ops/mul/
cud
a/mul_
cud
a.cuh
→
src/infiniop/ops/mul/
nvidi
a/mul_
nvidi
a.cuh
View file @
f06eb359
...
...
@@ -3,6 +3,6 @@
#include "../../../elementwise/cuda/elementwise_cuda_api.cuh"
ELEMENTWISE_DESCRIPTOR
(
mul
,
cud
a
,
cuda
)
ELEMENTWISE_DESCRIPTOR
(
mul
,
nvidi
a
,
cuda
)
#endif // __MUL_CUDA_API_H__
src/infiniop/ops/mul/operator.cc
View file @
f06eb359
...
...
@@ -7,7 +7,7 @@
#endif
#ifdef ENABLE_NVIDIA_API
#include "
cud
a/mul_
cud
a.cuh"
#include "
nvidi
a/mul_
nvidi
a.cuh"
#endif
__C
infiniStatus_t
infiniopCreateMulDescriptor
(
...
...
@@ -32,7 +32,7 @@ __C infiniStatus_t infiniopCreateMulDescriptor(
CREATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CREATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CREATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -47,14 +47,14 @@ __C infiniStatus_t infiniopGetMulWorkspaceSize(infiniopMulDescriptor_t desc, siz
#define GET(CASE, NAMESPACE) \
case CASE: \
*size = reinterpret_cast<op::mul::NAMESPACE::Descriptor *>(desc)->workspaceSize(); \
return INFINI_STATUS_SUCCESS
;
return INFINI_STATUS_SUCCESS
switch
(
desc
->
device_type
)
{
#ifdef ENABLE_CPU_API
GET
(
INFINI_DEVICE_CPU
,
cpu
)
GET
(
INFINI_DEVICE_CPU
,
cpu
)
;
#endif
#ifdef ENABLE_NVIDIA_API
GET
(
INFINI_DEVICE_NVIDIA
,
cud
a
)
GET
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
)
;
#endif
default:
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
...
...
@@ -84,7 +84,7 @@ __C infiniStatus_t infiniopMul(
CALCULATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -108,7 +108,7 @@ infiniopDestroyMulDescriptor(infiniopMulDescriptor_t desc) {
DELETE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
DELETE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
DELETE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
src/infiniop/ops/sub/cuda/
sub_cuda_int
ern
a
l.cuh
→
src/infiniop/ops/sub/cuda/
k
ern
e
l.cuh
View file @
f06eb359
File moved
src/infiniop/ops/sub/
cud
a/sub_
cud
a.cu
→
src/infiniop/ops/sub/
nvidi
a/sub_
nvidi
a.cu
View file @
f06eb359
#include "sub_
cud
a.cuh"
#include "
sub_cuda_int
ern
a
l.cuh"
#include "sub_
nvidi
a.cuh"
#include "
../cuda/k
ern
e
l.cuh"
namespace
op
::
sub
::
cud
a
{
namespace
op
::
sub
::
nvidi
a
{
Descriptor
::~
Descriptor
()
=
default
;
...
...
@@ -43,13 +43,13 @@ infiniStatus_t Descriptor::calculate(
switch
(
_dtype
)
{
case
INFINI_DTYPE_F16
:
return
_device_info
->
calculate
<
256
,
SubOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
SubOp
,
half
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F32
:
return
_device_info
->
calculate
<
256
,
SubOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
SubOp
,
float
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_F64
:
return
_device_info
->
calculate
<
256
,
SubOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
SubOp
,
double
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
case
INFINI_DTYPE_BF16
:
return
_device_info
->
calculate
<
256
,
SubOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
return
_device_info
->
calculate
<
256
,
cuda
::
SubOp
,
__nv_bfloat16
>
(
_info
,
workspace
,
output
,
inputs
,
stream
);
default:
return
INFINI_STATUS_BAD_TENSOR_DTYPE
;
}
...
...
src/infiniop/ops/sub/
cud
a/sub_
cud
a.cuh
→
src/infiniop/ops/sub/
nvidi
a/sub_
nvidi
a.cuh
View file @
f06eb359
...
...
@@ -3,6 +3,6 @@
#include "../../../elementwise/cuda/elementwise_cuda_api.cuh"
ELEMENTWISE_DESCRIPTOR
(
sub
,
cud
a
,
cuda
)
ELEMENTWISE_DESCRIPTOR
(
sub
,
nvidi
a
,
cuda
)
#endif // __SUB_CUDA_API_H__
src/infiniop/ops/sub/operator.cc
View file @
f06eb359
...
...
@@ -6,7 +6,7 @@
#include "cpu/sub_cpu.h"
#endif
#ifdef ENABLE_NVIDIA_API
#include "
cud
a/sub_
cud
a.cuh"
#include "
nvidi
a/sub_
nvidi
a.cuh"
#endif
__C
infiniStatus_t
infiniopCreateSubDescriptor
(
...
...
@@ -31,7 +31,7 @@ __C infiniStatus_t infiniopCreateSubDescriptor(
CREATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CREATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CREATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -46,14 +46,14 @@ __C infiniStatus_t infiniopGetSubWorkspaceSize(infiniopSubDescriptor_t desc, siz
#define GET(CASE, NAMESPACE) \
case CASE: \
*size = reinterpret_cast<op::sub::NAMESPACE::Descriptor *>(desc)->workspaceSize(); \
return INFINI_STATUS_SUCCESS
;
return INFINI_STATUS_SUCCESS
switch
(
desc
->
device_type
)
{
#ifdef ENABLE_CPU_API
GET
(
INFINI_DEVICE_CPU
,
cpu
)
GET
(
INFINI_DEVICE_CPU
,
cpu
)
;
#endif
#ifdef ENABLE_NVIDIA_API
GET
(
INFINI_DEVICE_NVIDIA
,
cud
a
)
GET
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
)
;
#endif
default:
return
INFINI_STATUS_DEVICE_TYPE_NOT_SUPPORTED
;
...
...
@@ -83,7 +83,7 @@ __C infiniStatus_t infiniopSub(
CALCULATE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
CALCULATE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
@@ -107,7 +107,7 @@ infiniopDestroySubDescriptor(infiniopSubDescriptor_t desc) {
DELETE
(
INFINI_DEVICE_CPU
,
cpu
);
#endif
#ifdef ENABLE_NVIDIA_API
DELETE
(
INFINI_DEVICE_NVIDIA
,
cud
a
);
DELETE
(
INFINI_DEVICE_NVIDIA
,
nvidi
a
);
#endif
default:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment