"docs/source/en/training/unconditional_training.mdx" did not exist on "c29d81c3e37713b2298e88c6ec16c73d4d352725"
quantization.cpp 486 Bytes
Newer Older
1
2
3
4
5
6
7
8
9
#include <torch/extension.h>

// Forward declaration of the AWQ quantized GEMM entry point; the definition
// is not in this file. It is exposed to Python below under the name
// "awq_gemm" with the docstring "Quantized GEMM for AWQ".
//
// Takes four tensors and an integer and returns a tensor. Parameter roles are
// inferred from their names only -- confirm against the definition:
//   _in_feats        - presumably the input activations
//   _kernel          - presumably the quantized weights
//   _scaling_factors - presumably the quantization scales
//   _zeros           - presumably the quantization zero points
//   split_k_iters    - presumably a split-K iteration count (TODO confirm)
torch::Tensor awq_gemm(
  torch::Tensor _in_feats,
  torch::Tensor _kernel,
  torch::Tensor _scaling_factors,
  torch::Tensor _zeros,
  int split_k_iters);

chooper1's avatar
chooper1 committed
10
11
12
13
14
15
// Forward declaration of the SqueezeLLM quantized GEMM entry point; the
// definition is not in this file. It is exposed to Python below under the
// name "squeezellm_gemm" with the docstring "Quantized GEMM for SqueezeLLM".
//
// Takes four tensors and returns void.
// NOTE(review): since nothing is returned, the result is presumably written
// into one of the tensor arguments -- which one is not visible from here;
// confirm against the definition before relying on it.
void squeezellm_gemm(
  torch::Tensor vec,
  torch::Tensor mat,
  torch::Tensor mul,
  torch::Tensor lookup_table);

16
// Defines the Python extension module, whose name comes from the
// TORCH_EXTENSION_NAME macro, and registers the two quantized GEMM functions
// declared earlier in this file.
//
// Each m.def call takes the Python-visible function name, a pointer to the
// C++ function, and the docstring shown to Python callers.
PYBIND11_MODULE(TORCH_EXTENSION_NAME, m) {
  m.def("awq_gemm", &awq_gemm, "Quantized GEMM for AWQ");
  m.def("squeezellm_gemm", &squeezellm_gemm, "Quantized GEMM for SqueezeLLM");
}