gemv_cuda.h 255 Bytes
Newer Older
Casper's avatar
Casper committed
1
2
3
4
5
6
7
8
9
10
11
12
#pragma once
#include <torch/extension.h>

/// @brief Declares the GEMV forward entry point (CUDA, "decode" variant per
///        the function name). The definition is not part of this header.
///
/// NOTE(review): this header only shows the signature. Everything below about
/// what each argument means is inferred from parameter names and must be
/// confirmed against the implementation before being relied upon.
///
/// All tensors are taken by value, as written in the signature.
///
/// @param _in_feats        Input tensor; presumably the input
///                         features/activations -- TODO confirm shape and dtype.
/// @param _kernel          Tensor; presumably the (possibly packed/quantized)
///                         weights -- TODO confirm layout.
/// @param _scaling_factors Tensor; presumably scales paired with `_kernel`
///                         -- TODO confirm.
/// @param _zeros           Tensor; presumably zero points paired with
///                         `_kernel` -- TODO confirm.
/// @param m                Integer problem dimension; which axis it refers to
///                         is not visible here -- TODO confirm.
/// @param n                Integer problem dimension -- TODO confirm.
/// @param k                Integer problem dimension -- TODO confirm.
/// @param group_size       Integer group size; presumably the number of
///                         elements sharing one scale/zero entry
///                         -- TODO confirm.
/// @return A torch::Tensor; its shape and dtype cannot be determined from
///         this declaration alone.
torch::Tensor gemv_forward_cuda_decode(
    torch::Tensor _in_feats,
    torch::Tensor _kernel,
    torch::Tensor _scaling_factors,
    torch::Tensor _zeros,
    int m,
    int n,
    int k,
    int group_size);