Commit b6b6fc4f authored by fengzch's avatar fengzch
Browse files

fix: compile gemm_f16.cu complete

parent 03ac3784
...@@ -44,7 +44,7 @@ Tensor gemm_f16(Tensor input, // FP16 ...@@ -44,7 +44,7 @@ Tensor gemm_f16(Tensor input, // FP16
cutlass::layout::RowMajor, cutlass::layout::RowMajor,
ElementAccumulator, ElementAccumulator,
cutlass::arch::OpClassTensorOp, cutlass::arch::OpClassTensorOp,
cutlass::arch::Sm75>; cutlass::arch::Gfx928>;
// cutlass::gemm::GemmShape<128, 128, 64>, // cutlass::gemm::GemmShape<128, 128, 64>,
// cutlass::gemm::GemmShape<32, 64, 64>, cutlass::gemm::GemmShape<16, 8, 16>, // cutlass::gemm::GemmShape<32, 64, 64>, cutlass::gemm::GemmShape<16, 8, 16>,
// cutlass::epilogue::thread::LinearCombination< // cutlass::epilogue::thread::LinearCombination<
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment