Unverified Commit 471cc7f8 authored by Wenhao Xie's avatar Wenhao Xie Committed by GitHub
Browse files

add bf16 exp fallback (#776)

parent 68af2159
...@@ -330,3 +330,8 @@ TL_DEVICE void __sync_thread_partial() { ...@@ -330,3 +330,8 @@ TL_DEVICE void __sync_thread_partial() {
asm volatile("bar.sync %0, %1;" : : "r"(barrier_id), "r"(thread_count)); asm volatile("bar.sync %0, %1;" : : "r"(barrier_id), "r"(thread_count));
} }
} // namespace tl } // namespace tl
namespace cutlass {

/// bfloat16 overload of `fast_exp`.
///
/// Forwards the argument to the global-namespace `hexp` and returns the
/// result as a `bfloat16_t`.
/// NOTE(review): presumably `::hexp` resolves to the CUDA bfloat16 intrinsic
/// and `bfloat16_t` converts to/from its argument/return type — confirm
/// against the headers included by this file.
///
/// @param x exponent input.
/// @return the value produced by `::hexp(x)`.
TL_DEVICE bfloat16_t fast_exp(bfloat16_t x) {
  return ::hexp(x);
}

} // namespace cutlass
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment