% FlashAttention (Dao et al., 2022), cited as an arXiv preprint.
% The arXiv identifier lives in eprint/archiveprefix rather than in a fake
% `journal` value, so styles can format and hyperlink it themselves.
% NOTE(review): if a peer-reviewed version of this paper exists, prefer citing
% that venue (e.g. as @inproceedings) and keep the eprint fields as a pointer.
@misc{dao2022flashattention,
  author        = {Dao, Tri and Fu, Daniel Y. and Ermon, Stefano and Rudra, Atri and R{\'e}, Christopher},
  title         = {{FlashAttention}: Fast and Memory-Efficient Exact Attention with {IO}-Awareness},
  year          = {2022},
  eprint        = {2205.14135},
  archiveprefix = {arXiv},
  url           = {https://arxiv.org/abs/2205.14135},
}