Commit 86aaf3c1 (unverified), authored by Tong WU, committed by GitHub
Browse files

Add fast sine and cosine definitions in common.h for CUDA templates (#865)

parent 48c9a352
@@ -18,6 +18,8 @@ using int4_t = int4;
 #define hexp cutlass::fast_exp
 #define hlog cutlass::fast_log
 #define hsqrt cutlass::fast_sqrt
+#define hsin cutlass::fast_sin
+#define hcos cutlass::fast_cos
 #define htanh cutlass::fast_tanh
 #define hpow powf
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment