"server/text_generation_server/models/flash_dbrx.py" did not exist on "5a58226130fcd35774cd14d8c5ba638a4adb2bf4"
build.py 2.19 KB
Newer Older
Hang Zhang's avatar
init  
Hang Zhang committed
1
2
3
4
5
6
7
8
9
10
11
12
##+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
## Created by: Hang Zhang
## ECE Department, Rutgers University
## Email: zhang.hang@rutgers.edu
## Copyright (c) 2017
##
## This source code is licensed under the MIT-style license found in the
## LICENSE file in the root directory of this source tree 
##+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++

import os
import torch
Hang Zhang's avatar
Hang Zhang committed
13
import platform
Hang Zhang's avatar
backend  
Hang Zhang committed
14
import subprocess
Hang Zhang's avatar
init  
Hang Zhang committed
15
16
from torch.utils.ffi import create_extension

Hang Zhang's avatar
Hang Zhang committed
17
lib_path = os.path.join(os.path.dirname(torch.__file__), 'lib')
Zhang's avatar
Zhang committed
18
19
cwd = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'encoding/')
encoding_lib_path = os.path.join(cwd, "lib")
Hang Zhang's avatar
Hang Zhang committed
20

Hang Zhang's avatar
v0.1.0  
Hang Zhang committed
21
22
23
24
25
# clean the build files
clean_cmd = ['bash', 'clean.sh']
subprocess.check_call(clean_cmd)

# build CUDA library
Hang Zhang's avatar
Hang Zhang committed
26
27
os.environ['TORCH_BUILD_DIR'] = lib_path
if platform.system() == 'Darwin':
Zhang's avatar
Zhang committed
28
29
    os.environ['TH_LIBRARIES'] = os.path.join(lib_path,'libATen.dylib')
    ENCODING_LIB = os.path.join(cwd, 'lib/libENCODING.dylib')
Hang Zhang's avatar
path  
Hang Zhang committed
30

Hang Zhang's avatar
Hang Zhang committed
31
else:
Hang Zhang's avatar
v0.2.0  
Hang Zhang committed
32
    os.environ['CFLAGS'] = '-std=c99'
Zhang's avatar
Zhang committed
33
34
    os.environ['TH_LIBRARIES'] = os.path.join(lib_path,'libATen.so')
    ENCODING_LIB = os.path.join(cwd, 'lib/libENCODING.so')
Hang Zhang's avatar
Hang Zhang committed
35

Hang Zhang's avatar
backend  
Hang Zhang committed
36
build_all_cmd = ['bash', 'encoding/make.sh']
37
subprocess.check_call(build_all_cmd, env=dict(os.environ))
Hang Zhang's avatar
backend  
Hang Zhang committed
38

Hang Zhang's avatar
v0.1.0  
Hang Zhang committed
39
# build FFI
Hang Zhang's avatar
backend  
Hang Zhang committed
40
sources = ['encoding/src/encoding_lib.cpp']
Hang Zhang's avatar
v0.1.0  
Hang Zhang committed
41
42
43
headers = [
    'encoding/src/encoding_lib.h',
]
Hang Zhang's avatar
backend  
Hang Zhang committed
44
45
46
defines = [('WITH_CUDA', None)]
with_cuda = True 

Hang Zhang's avatar
Hang Zhang committed
47
include_path = [os.path.join(lib_path, 'include'),
Zhang's avatar
Zhang committed
48
49
50
                os.path.join(cwd,'kernel'),
                os.path.join(cwd,'kernel/include'),
                os.path.join(cwd,'src/')]
Hang Zhang's avatar
init  
Hang Zhang committed
51

Hang Zhang's avatar
Hang Zhang committed
52
def make_relative_rpath(path):
Hang Zhang's avatar
indent  
Hang Zhang committed
53
54
55
56
    if platform.system() == 'Darwin':
        return '-Wl,-rpath,' + path
    else:
        return '-Wl,-rpath,' + path
Hang Zhang's avatar
tested  
Hang Zhang committed
57

Hang Zhang's avatar
init  
Hang Zhang committed
58
ffi = create_extension(
Hang Zhang's avatar
indent  
Hang Zhang committed
59
60
61
62
63
64
65
    'encoding._ext.encoding_lib',
    package=True,
    headers=headers,
    sources=sources,
    define_macros=defines,
    relative_to=__file__,
    with_cuda=with_cuda,
Zhang's avatar
Zhang committed
66
    extra_compile_args=["-std=c99"],
Hang Zhang's avatar
v0.1.0  
Hang Zhang committed
67
68
69
    include_dirs = include_path,
    extra_link_args = [
        make_relative_rpath(lib_path),
Hang Zhang's avatar
path  
Hang Zhang committed
70
        make_relative_rpath(encoding_lib_path),
Hang Zhang's avatar
v0.1.0  
Hang Zhang committed
71
72
        ENCODING_LIB,
    ],
Hang Zhang's avatar
init  
Hang Zhang committed
73
74
75
76
)

if __name__ == '__main__':
    ffi.build()