"rocshmem_dir/lib/cmake/rocshmem/rocshmem-targets.cmake" did not exist on "da6ca24ef7c2594e058def142adfb8f2e31a7f85"
awq_gemm_asm.h 716 Bytes
Newer Older
Xiaowei.zhang's avatar
Xiaowei.zhang committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
#pragma once
// SPDX-License-Identifier: MIT
 
#include <torch/extension.h>
#include "aiter_enum.h"


// Declaration only; the definition is not part of this header.
// NOTE(review): the name suggests an AWQ-quantized GEMM dispatched to an
// assembly kernel -- confirm against the implementation.
//
// Every argument is taken by non-const lvalue reference, so callers must pass
// named objects (temporaries will not bind).
//
//   out    - tensor; presumably the destination of the result -- TODO confirm.
//   mat1   - tensor; presumably the first GEMM operand -- TODO confirm.
//   mat2   - tensor; presumably the second GEMM operand -- TODO confirm.
//   zero   - optional tensor; may be std::nullopt. Presumably the quantization
//            zero points -- verify against the implementation.
//   scalar - optional tensor; may be std::nullopt. Presumably the quantization
//            scales -- verify against the implementation.
void awq_gemm_asm(
    torch::Tensor& out,
    torch::Tensor& mat1,
    torch::Tensor& mat2,
    std::optional<torch::Tensor>& zero,
    std::optional<torch::Tensor>& scalar);

// Declaration only; the definition is not part of this header.
// Takes the same five tensor arguments as awq_gemm_asm, followed by two
// extra parameters.
// NOTE(review): the name suggests a tuning/benchmark variant of the AWQ GEMM
// entry point -- confirm against the implementation.
//
// Tensor, optional and string arguments are taken by non-const lvalue
// reference, so callers must pass named objects (temporaries will not bind).
//
//   out        - tensor; presumably the destination of the result -- TODO confirm.
//   mat1       - tensor; presumably the first GEMM operand -- TODO confirm.
//   mat2       - tensor; presumably the second GEMM operand -- TODO confirm.
//   zero       - optional tensor; may be std::nullopt. Presumably the
//                quantization zero points -- verify against the implementation.
//   scalar     - optional tensor; may be std::nullopt. Presumably the
//                quantization scales -- verify against the implementation.
//   solutionid - integer passed by value; presumably selects which kernel
//                solution to run -- TODO confirm valid range.
//   jsonfile   - string; presumably a path to a JSON file used by the tuning
//                flow. Whether it is read or written is not visible here.
void awq_gemm_asm_tuning(
    torch::Tensor& out,
    torch::Tensor& mat1,
    torch::Tensor& mat2,
    std::optional<torch::Tensor>& zero,
    std::optional<torch::Tensor>& scalar,
    int solutionid,
    std::string& jsonfile);