diag_cuda.h 182 Bytes
Newer Older
rusty1s's avatar
matmul  
rusty1s committed
1
2
3
4
5
6
#pragma once

#include <torch/extension.h>

// Declaration of the CUDA entry point `non_diag_mask_cuda`. Only the prototype
// lives in this header; the definition is elsewhere (presumably the matching
// .cu translation unit — confirm).
//
// Parameters:
//   row, col - two tensors taken by value.
//              NOTE(review): presumably the row / column indices of the
//              entries of a sparse matrix — confirm against the definition.
//   M, N     - 64-bit integers.
//              NOTE(review): presumably the number of rows and columns of
//              that matrix — TODO confirm.
//   k        - 64-bit integer.
//              NOTE(review): presumably the diagonal offset being selected
//              (0 = main diagonal) — TODO confirm, including sign convention.
//
// Returns:
//   A torch::Tensor. Judging by the function name it is a mask identifying
//   non-diagonal positions, but its shape, dtype and device are not visible
//   from this header — verify in the implementation before relying on them.
torch::Tensor non_diag_mask_cuda(torch::Tensor row, torch::Tensor col,
                                 int64_t M, int64_t N, int64_t k);