Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
ColossalAI
Commits
db544194
Commit
db544194
authored
Mar 31, 2022
by
Shawn-Kong
Committed by
binmakeswell
Apr 06, 2022
Browse files
fix format (#613)
Co-authored-by:
evin K
<
evink@evins-MacBook-Air.local
>
parent
5ecef13c
Changes
1
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
11 additions
and
15 deletions
+11
-15
colossalai/kernel/cuda_native/csrc/kernels/include/kernels.h
colossalai/kernel/cuda_native/csrc/kernels/include/kernels.h
+11
-15
No files found.
colossalai/kernel/cuda_native/csrc/kernels/include/kernels.h
View file @
db544194
...
...
@@ -3,9 +3,9 @@
#include <cuda.h>
#include <cuda_fp16.h>
#include <curand_kernel.h>
#include <stdexcept>
#include <stdio.h>
#include <stdlib.h>
#include <stdexcept>
#define MAX_THREADS 1024
#define WARP_SIZE 32
...
...
@@ -132,9 +132,8 @@ __forceinline__ __host__ __device__ int flat_3dim(int id1, int id2, int id3,
}
/* Convert 4-dim tensor index into vector index */
__forceinline__
__host__
__device__
int
flat_4dim
(
int
id1
,
int
id2
,
int
id3
,
int
id4
,
int
dim2
,
int
dim3
,
int
dim4
)
{
__forceinline__
__host__
__device__
int
flat_4dim
(
int
id1
,
int
id2
,
int
id3
,
int
id4
,
int
dim2
,
int
dim3
,
int
dim4
)
{
// return id1*(dim2*dim3*dim4) + id2*(dim3*dim4) + id3*dim4 + id4;
int
res
=
id4
;
...
...
@@ -202,9 +201,9 @@ __forceinline__ __host__ __device__ int flat_6dim(int id1, int id2, int id3,
}
/* Convert vector index to 6-dim tensor index */
__forceinline__
__host__
__device__
void
decompose_6dim
(
int
src
,
int
dim1
,
int
dim2
,
int
dim3
,
int
dim4
,
int
dim5
,
int
*
id0
,
int
*
id1
,
int
*
id2
,
int
*
id3
,
int
*
id4
,
int
*
id5
)
{
__forceinline__
__host__
__device__
void
decompose_6dim
(
int
src
,
int
dim1
,
int
dim2
,
int
dim3
,
int
dim4
,
int
dim5
,
int
*
id0
,
int
*
id1
,
int
*
id2
,
int
*
id3
,
int
*
id4
,
int
*
id5
)
{
*
id5
=
src
%
dim5
;
src
/=
dim5
;
...
...
@@ -222,11 +221,9 @@ __forceinline__ __host__ __device__ void decompose_6dim(
}
/* Convert vector index to 5-dim tensor index */
__forceinline__
__host__
__device__
void
decompose_5dim
(
int
src
,
int
dim1
,
int
dim2
,
int
dim3
,
int
dim4
,
int
*
id0
,
int
*
id1
,
int
*
id2
,
int
*
id3
,
int
*
id4
)
{
__forceinline__
__host__
__device__
void
decompose_5dim
(
int
src
,
int
dim1
,
int
dim2
,
int
dim3
,
int
dim4
,
int
*
id0
,
int
*
id1
,
int
*
id2
,
int
*
id3
,
int
*
id4
)
{
*
id4
=
src
%
dim4
;
src
/=
dim4
;
...
...
@@ -256,9 +253,8 @@ __forceinline__ __host__ __device__ void decompose_4dim(int src, int dim1,
}
/* Convert vector index to 3-dim tensor index */
__forceinline__
__host__
__device__
void
decompose_3dim
(
int
src
,
int
dim1
,
int
dim2
,
int
*
id0
,
int
*
id1
,
int
*
id2
)
{
__forceinline__
__host__
__device__
void
decompose_3dim
(
int
src
,
int
dim1
,
int
dim2
,
int
*
id0
,
int
*
id1
,
int
*
id2
)
{
*
id2
=
src
%
dim2
;
src
/=
dim2
;
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment