Commit 98a2cfcc authored by Chao Liu
Browse files

nvidia build

parent 00089cd6
......@@ -19,8 +19,6 @@ namespace ck {
enum address_space_t
{
generic = 0,
vgpr = 1,
lds = 2,
global = 3
};
......
......@@ -21,8 +21,6 @@ namespace ck {
enum address_space_t
{
generic = 0,
vgpr = generic,
lds = generic,
global = generic
};
......@@ -39,6 +37,17 @@ using index_t = int32_t;
using float2_t = float2;
using float4_t = float4;
// data type conversion
template <typename T>
struct type_convert
{
template <typename X>
__device__ T operator()(const X& x) const
{
return static_cast<T>(x);
}
};
template <class T>
__device__ void fused_multiply_accumulate(T& d, const T& s0, const T& s1)
{
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment