#!/bin/bash
# This script is intended to run inside the go generate
# working directory must be llm/llama.cpp

# First we build our default built-in library which will be linked into the CGO
# binary as a normal dependency. This default build is CPU based.
#
# Then we build a CUDA dynamic library (although statically linked with the CUDA
# library dependencies for maximum portability)
#
# Then if we detect ROCm, we build a dynamically loaded ROCm lib.  It is particularly
# important for ROCm to be a dynamic lib even if it's the only GPU library detected,
# because we can't redistribute the object files but must rely on dynamic libraries
# at runtime, which could lead the server not to start if they are not present.

# Abort on the first failing command (-e), trace each command as it runs (-x),
# and make a pipeline fail if any of its stages fails (pipefail).
set -ex -o pipefail

echo "Starting linux generate script"
# Default CUDACXX to the nvcc found at the conventional CUDA install location,
# but only when the caller has not already chosen a compiler and that nvcc is
# actually executable. The value is exported so child processes see it.
if [[ -z "${CUDACXX}" && -x /usr/local/cuda/bin/nvcc ]]; then
    export CUDACXX=/usr/local/cuda/bin/nvcc
fi
# CMake definitions shared by every build variant in this script (CPU, CUDA and
# ROCm all splice this into their own CMAKE_DEFS). Position-independent code is
# enabled; of the x86 SIMD switches only AVX is on, while AVX2, AVX512, FMA and
# F16C are off, and LLAMA_NATIVE is off.
# The value is assembled in two pieces purely to keep the lines readable; the
# resulting string is a single space-separated list.
COMMON_CMAKE_DEFS="-DCMAKE_POSITION_INDEPENDENT_CODE=on -DLLAMA_ACCELERATE=on -DLLAMA_NATIVE=off"
COMMON_CMAKE_DEFS+=" -DLLAMA_AVX=on -DLLAMA_AVX2=off -DLLAMA_AVX512=off -DLLAMA_FMA=off -DLLAMA_F16C=off"
# Load the shared helper script that sits next to this one. Both expansions are
# quoted so a checkout path containing whitespace does not get word-split.
source "$(dirname "$0")/gen_common.sh"

# The helpers below are not defined in this script — presumably they come from
# gen_common.sh (confirm there). They run in this order before any build.
init_vars
git_module_setup
apply_patches

#
# CPU first for the default library
#
# Put the shared definitions in front of whatever CMAKE_DEFS currently holds,
# then build and install into the CPU output directory. `build` and `install`
# are helpers defined outside this script's visible source.
CMAKE_DEFS="${COMMON_CMAKE_DEFS} ${CMAKE_DEFS}"
BUILD_DIR="gguf/build/linux/cpu"

build
install

# Placeholder to keep go embed happy until we start building dynamic CPU lib variants
touch "${BUILD_DIR}/lib/dummy.so"

# Build the CUDA variant only when the CUDA library directory exists at the
# conventional install location.
if [[ -d /usr/local/cuda/lib64/ ]]; then
    echo "CUDA libraries detected - building dynamic CUDA library"
    init_vars
    CMAKE_DEFS="-DLLAMA_CUBLAS=on ${COMMON_CMAKE_DEFS} ${CMAKE_DEFS}"
    BUILD_DIR="gguf/build/linux/cuda"
    CUDA_LIB_DIR=/usr/local/cuda/lib64
    build
    install
    # Produce the shared library. The three project archives are wrapped in
    # --whole-archive so every object in them is pulled in; the CUDA runtime
    # pieces are linked from their static archives, outside that wrapper.
    gcc -fPIC -g -shared -o "${BUILD_DIR}/lib/libext_server.so" \
        -Wl,--whole-archive \
        "${BUILD_DIR}/lib/libext_server.a" \
        "${BUILD_DIR}/lib/libcommon.a" \
        "${BUILD_DIR}/lib/libllama.a" \
        -Wl,--no-whole-archive \
        "${CUDA_LIB_DIR}/libcudart_static.a" \
        "${CUDA_LIB_DIR}/libcublas_static.a" \
        "${CUDA_LIB_DIR}/libcublasLt_static.a" \
        "${CUDA_LIB_DIR}/libcudadevrt.a" \
        "${CUDA_LIB_DIR}/libculibos.a" \
        -lrt -lpthread -ldl -lstdc++ -lm
fi

# When the caller has not provided ROCM_PATH, fall back to the default install
# prefix. The directory is not required to exist at this point.
if [[ -z "${ROCM_PATH}" ]]; then
    # Try the default location in case it exists
    ROCM_PATH=/opt/rocm
fi

# When the caller has not provided CLBlast_DIR, export the default CMake package
# location — but only if that directory is really there. Otherwise the variable
# is left untouched.
if [[ -z "${CLBlast_DIR}" && -d /usr/lib/cmake/CLBlast ]]; then
    # Try the default location in case it exists
    export CLBlast_DIR=/usr/lib/cmake/CLBlast
fi

# Build the ROCm variant only when the ROCm install prefix exists.
if [[ -d "${ROCM_PATH}" ]]; then
    echo "ROCm libraries detected - building dynamic ROCm library"
    init_vars
    # A single GPU architecture list feeds both AMDGPU_TARGETS and GPU_TARGETS
    # so the two definitions cannot drift apart.
    rocm_gpu_targets='gfx803;gfx900;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack+;gfx90a:xnack-;gfx1010;gfx1012;gfx1030;gfx1100;gfx1101;gfx1102'
    CMAKE_DEFS="${COMMON_CMAKE_DEFS} ${CMAKE_DEFS} -DLLAMA_HIPBLAS=on -DCMAKE_C_COMPILER=$ROCM_PATH/llvm/bin/clang -DCMAKE_CXX_COMPILER=$ROCM_PATH/llvm/bin/clang++ -DAMDGPU_TARGETS='${rocm_gpu_targets}' -DGPU_TARGETS='${rocm_gpu_targets}'"
    BUILD_DIR="gguf/build/linux/rocm"
    build
    install
    # Produce the shared library. The project archives are wrapped in
    # --whole-archive; the ROCm libraries are linked dynamically. The library
    # search path and the rpath follow ROCM_PATH, so a non-default install
    # prefix is honoured here just as it is for the compilers above.
    gcc -fPIC -g -shared -o "${BUILD_DIR}/lib/libext_server.so" \
        -Wl,--whole-archive \
        "${BUILD_DIR}/lib/libext_server.a" \
        "${BUILD_DIR}/lib/libcommon.a" \
        "${BUILD_DIR}/lib/libllama.a" \
        -Wl,--no-whole-archive \
        -lrt -lpthread -ldl -lstdc++ -lm \
        -L"${ROCM_PATH}/lib" -L/opt/amdgpu/lib/x86_64-linux-gnu/ \
        -Wl,-rpath,"${ROCM_PATH}/lib",-rpath,/opt/amdgpu/lib/x86_64-linux-gnu/ \
        -lhipblas -lrocblas -lamdhip64 -lrocsolver -lamd_comgr -lhsa-runtime64 -lrocsparse -ldrm -ldrm_amdgpu
fi

# Last step of the script: call the cleanup helper. It is not defined in the
# visible part of this script — presumably it comes from the sourced
# gen_common.sh; confirm there what it undoes.
cleanup