Makefile-awq 463 Bytes
Newer Older
jixx's avatar
init  
jixx committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
# Pinned commit of the huggingface/llm-awq fork that build-awq checks out.
# The fork only adds the correct stream to the AWQ kernel, which is needed
# to make CUDA graphs work.
awq_commit := bd1dc2d5254345cc76ab71894651fb821275bdd4

# Fetch a fresh clone of the llm-awq fork, discarding any previous checkout.
# Declared phony because `awq` names a command, not a file: without this, a
# file or directory called `awq` would make the rule look up to date and the
# clone would be silently skipped.
.PHONY: awq
awq:
	rm -rf llm-awq
	git clone https://github.com/huggingface/llm-awq

# Check out the pinned commit of the cloned llm-awq tree and build its
# kernels. Each recipe line runs in its own shell, hence the repeated `cd`.
# Declared phony so a stray file named `build-awq` cannot suppress the build.
.PHONY: build-awq
build-awq: awq
	cd llm-awq/ && git fetch && git checkout $(awq_commit)
	cd llm-awq/awq/kernels && python setup.py build

# Install the freshly built AWQ kernels into the current Python environment.
# The uninstall step is best effort: `|| true` keeps the recipe going when
# the package is not installed yet.
# Declared phony so a stray file named `install-awq` cannot suppress the
# install.
.PHONY: install-awq
install-awq: build-awq
	pip uninstall awq_inference_engine -y || true
	cd llm-awq/awq/kernels && python setup.py install