Commit 083c2de9 authored by OlivierDehaene
Browse files

fix: fix quant linear autotune

parent 773aabdd
...@@ -88,7 +88,7 @@ class Autotuner(triton.KernelInterface): ...@@ -88,7 +88,7 @@ class Autotuner(triton.KernelInterface):
# In testing, using only 40 reps seems to be close enough and it appears to be what PyTorch uses # In testing, using only 40 reps seems to be close enough and it appears to be what PyTorch uses
# PyTorch also sets fast_flush to True, but I didn't see any speedup so I'll leave the default # PyTorch also sets fast_flush to True, but I didn't see any speedup so I'll leave the default
return triton.testing.do_bench( return triton.testing.do_bench(
kernel_call, percentiles=(0.5, 0.2, 0.8), rep=40 kernel_call, quantiles=(0.5, 0.2, 0.8), rep=40
) )
except triton.OutOfResources: except triton.OutOfResources:
return (float("inf"), float("inf"), float("inf")) return (float("inf"), float("inf"), float("inf"))
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment