Commit 977fc1ed authored by Jing Zhang
Browse files

clean

parent e6230689
...@@ -610,10 +610,10 @@ int main(int argc, char* argv[]) ...@@ -610,10 +610,10 @@ int main(int argc, char* argv[])
#elif 1 #elif 1
// 1x1 filter, 14x14 image, C = 512 // 1x1 filter, 14x14 image, C = 512
constexpr index_t N = 128; constexpr index_t N = 128;
constexpr index_t C = 128; constexpr index_t C = 512;
constexpr index_t HI = 14; constexpr index_t HI = 14;
constexpr index_t WI = 14; constexpr index_t WI = 14;
constexpr index_t K = 128; constexpr index_t K = 512;
constexpr index_t Y = 1; constexpr index_t Y = 1;
constexpr index_t X = 1; constexpr index_t X = 1;
......
...@@ -13,7 +13,7 @@ extern "C" __attribute__((address_space(3))) void* __to_local(void* p)[[hc]]; ...@@ -13,7 +13,7 @@ extern "C" __attribute__((address_space(3))) void* __to_local(void* p)[[hc]];
#define data4_t vector_type<float, 4>::MemoryType #define data4_t vector_type<float, 4>::MemoryType
#define data_t float #define data_t float
template<unsigned cnt> template<unsigned cnt>
inline __device__ void vmcnt() inline __device__ void vmcnt()
{ {
#if !NO_VM_WAIT #if !NO_VM_WAIT
...@@ -111,8 +111,8 @@ inline __device__ void outerProduct1x4(const data_t& a, ...@@ -111,8 +111,8 @@ inline __device__ void outerProduct1x4(const data_t& a,
"v"(a.x),"v"(b.x),"v"(b.y),"v"(b.z),"v"(b.w) "v"(a.x),"v"(b.x),"v"(b.y),"v"(b.z),"v"(b.w)
); );
#else #else
//hijack here due to a compiler issue that cannot perform proper register //hijack here due to a compiler issue that cannot perform proper register
//mapping for float4 c //mapping for float4 c
data_t *c_p = (data_t *)&c; data_t *c_p = (data_t *)&c;
asm volatile("\n \ asm volatile("\n \
v_mac_f32 %0, %4, %5 \n \ v_mac_f32 %0, %4, %5 \n \
...@@ -430,7 +430,7 @@ inline __device__ void global_load(data4_t& r, ...@@ -430,7 +430,7 @@ inline __device__ void global_load(data4_t& r,
#endif #endif
} }
inline __device__ void inline __device__ void
ds_write_b128(const data4_t& r, void* lds, index_t offset = 0) ds_write_b128(const data4_t& r, void* lds, index_t offset = 0)
{ {
#if !NO_DS_WRITE #if !NO_DS_WRITE
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment