pyproject.toml 2.63 KB
Newer Older
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
1
[tool.poetry]
2
name = "text-generation-server"
Nicolas Patry's avatar
Nicolas Patry committed
3
version = "2.0.5-dev0"
4
description = "Text Generation Inference Python gRPC Server"
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
5
6
authors = ["Olivier Dehaene <olivier@huggingface.co>"]

Olivier Dehaene's avatar
Olivier Dehaene committed
7
[tool.poetry.scripts]
8
text-generation-server = 'text_generation_server.cli:app'
Olivier Dehaene's avatar
Olivier Dehaene committed
9

Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
10
[tool.poetry.dependencies]
Nicolas Patry's avatar
Nicolas Patry committed
11
python = ">=3.9,<3.13"
12
protobuf = "^4.25.3"
13
14
15
16
# gRPC runtime stack. The three grpcio* packages share the same ^1.51.1
# floor; the dev-only grpcio-tools entry in this file uses the same floor.
grpcio = "^1.51.1"
grpcio-status = "^1.51.1"
grpcio-reflection = "^1.51.1"
grpc-interceptor = "^0.15.0"
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
17
typer = "^0.6.1"
abhishek thakur's avatar
abhishek thakur committed
18
accelerate = { version = "^0.29.1", optional = true }
19
bitsandbytes = { version = "^0.43.0", optional = true }
OlivierDehaene's avatar
OlivierDehaene committed
20
safetensors = "^0.4"
21
loguru = "^0.6.0"
22
23
24
# OpenTelemetry tracing packages. The gRPC instrumentation is only published
# as a pre-release (0.46b0); with a 0.x caret it stays within the 0.46 series.
# NOTE(review): the api/exporter carets allow any 1.x >= 1.25.0 -- confirm
# newer 1.x releases still resolve against the 0.46 instrumentation.
opentelemetry-api = "^1.25.0"
opentelemetry-exporter-otlp = "^1.25.0"
opentelemetry-instrumentation-grpc = "^0.46b0"
25
hf-transfer = "^0.1.2"
26
sentencepiece = "^0.1.97"
27
tokenizers = "^0.19.1"
drbh's avatar
drbh committed
28
huggingface-hub = "^0.23"
29
transformers = "^4.43"
30
einops = "^0.6.1"
31
32
texttable = { version = "^1.6.7", optional = true }
datasets = { version = "^2.14.0", optional = true }
abhishek thakur's avatar
abhishek thakur committed
33
peft = { version = "^0.10", optional = true }
34
torch = { version = "^2.4.0", optional = true }
Nicolas Patry's avatar
Nicolas Patry committed
35
scipy = "^1.11.1"
36
pillow = "^10.0.0"
37
# Optional dependency; it is exposed through the `outlines` extra declared
# under [tool.poetry.extras].
outlines = { version = "^0.0.34", optional = true }
Nicolas Patry's avatar
Nicolas Patry committed
38
39
prometheus-client = "^0.20.0"
py-cpuinfo = "^9.0.0"
Daniël de Kok's avatar
Daniël de Kok committed
40
41
# Temporary workaround for outlines: the caret keeps numpy on the 1.x series
# (>=1.26,<2.0). Remove this pin once the workaround is no longer needed.
numpy = "^1.26"
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
42

43
44
45
46
47
48
# Optional prebuilt marlin-kernels wheels, installed through the `marlin`
# extra. There is one entry per supported CPython minor version (3.9-3.12);
# the `python` marker on each entry selects the wheel whose cpXY tag matches
# the running interpreter. Every wheel is a linux_x86_64 build tagged
# cu123 / torch2.4, so bump all four URLs together when upgrading.
# NOTE(review): these wheels are tagged cu123, while the pytorch-gpu-src
# index declared in this file points at cu121 -- confirm this is intended.
marlin-kernels = [
  { url = "https://github.com/danieldk/marlin-kernels/releases/download/v0.2.0/marlin_kernels-0.2.0+cu123torch2.4-cp39-cp39-linux_x86_64.whl", python = "~3.9", optional = true },
  { url = "https://github.com/danieldk/marlin-kernels/releases/download/v0.2.0/marlin_kernels-0.2.0+cu123torch2.4-cp310-cp310-linux_x86_64.whl", python = "~3.10", optional = true },
  { url = "https://github.com/danieldk/marlin-kernels/releases/download/v0.2.0/marlin_kernels-0.2.0+cu123torch2.4-cp311-cp311-linux_x86_64.whl", python = "~3.11", optional = true },
  { url = "https://github.com/danieldk/marlin-kernels/releases/download/v0.2.0/marlin_kernels-0.2.0+cu123torch2.4-cp312-cp312-linux_x86_64.whl", python = "~3.12", optional = true },
]
49
rich = "^13.7.1"
50
# NOTE(review): syrupy appears to be a pytest snapshot-testing plugin, yet it
# is declared here as a runtime dependency while pytest itself lives in
# [tool.poetry.group.dev.dependencies]. Confirm whether it belongs in the dev
# group instead.
syrupy = "^4.7.1"
51

52
[tool.poetry.extras]
53
torch = ["torch"]
54
accelerate = ["accelerate"]
55
bnb = ["bitsandbytes"]
56
marlin = ["marlin-kernels"]
57
peft = ["peft"]
58
quantize = ["texttable", "datasets", "accelerate"]
OlivierDehaene's avatar
OlivierDehaene committed
59
outlines = ["outlines"]
60

Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
61
[tool.poetry.group.dev.dependencies]
62
grpcio-tools = "^1.51.1"
63
pytest = "^7.3.0"
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
64

65
66
67

# Additional package index for PyTorch wheels. It is declared with
# priority = "explicit", which in Poetry means the index is consulted only
# for dependencies that opt in with `source = "pytorch-gpu-src"`.
# NOTE(review): no dependency visible in this file sets that `source` key, so
# confirm the index is actually used.
[[tool.poetry.source]]
name = "pytorch-gpu-src"
68
url = "https://download.pytorch.org/whl/cu121"
69
70
priority = "explicit"

71
72
73
[tool.pytest.ini_options]
# Custom markers are registered here, one per line, so pytest recognises them.
markers = [
    "private: marks tests as requiring an admin hf token (deselect with '-m \"not private\"')",
]

Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
74
[build-system]
75
76
77
# Packages needed to build this project; the backend comes from poetry-core.
requires = ["poetry-core>=1.0.0"]
Olivier Dehaene's avatar
Init  
Olivier Dehaene committed
78
build-backend = "poetry.core.masonry.api"