Commit 8185c3d3 authored by guangzlu
Browse files

fixed philox generator

parent d3577ab3
...@@ -179,7 +179,8 @@ int run(int argc, char* argv[]) ...@@ -179,7 +179,8 @@ int run(int argc, char* argv[])
b1_element_op, b1_element_op,
c_element_op, c_element_op,
0, // dropout ratio 0, // dropout ratio
{0, 64}); // dropout random seed and offset {0, 64}); // dropout random seed and offset, offset should be at least the number of
// elements on a thread
if(!gemm.IsSupportedArgument(argument)) if(!gemm.IsSupportedArgument(argument))
{ {
......
...@@ -97,24 +97,6 @@ class philox ...@@ -97,24 +97,6 @@ class philox
{ {
uint4 res; uint4 res;
// uint4 tmp;
// asm volatile("v_mov_b32 %8 1; \n"
// "v_mov_b32 %9 0; \n"
// "v_mov_b32 %10 0; \n"
// "v_mov_b32 %11 0; \n"
// "v_add_co_u32 %0, %4, %8; "
// "v_addc_co_u32 %1, %5, %9; "
// "v_addc_co_u32 %2, %6, %10; "
// "v_addc_u32 %3, %7, %11; "
// : "=v"(res.x), "=v"(res.y), "=v"(res.z), "=v"(res.w)
// : "v"(ctr.x),
// "v"(ctr.y),
// "v"(ctr.z),
// "v"(ctr.w),
// "v"(tmp.x),
// "v"(tmp.y),
// "v"(tmp.z),
// "v"(tmp.w));
res.x = ctr.x + 1; res.x = ctr.x + 1;
res.y = ctr.y; res.y = ctr.y;
res.z = ctr.z; res.z = ctr.z;
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment