# pyproject.toml: packaging configuration for the open-dataflow distribution.
# Build backend declaration (PEP 517/518).
# The [project] table below is only understood by setuptools >= 61, and the
# `file` directive used for dynamic dependencies needs setuptools >= 62.6,
# so the floor is raised accordingly; older versions would silently ignore
# the metadata in this file.
[build-system]
requires = ["setuptools>=62.6", "wheel"]
build-backend = "setuptools.build_meta"

# Core distribution metadata (PEP 621).
[project]
name = "open-dataflow"
authors = [
    { name = "Hao Liang", email = "hao.liang@stu.pku.edu.cn" },
    { name = "Xiaochen Ma", email = "xiaochen.ma.cs@gmail.com" },
]
description = "Modern Data Centric AI system for Large Language Models"
readme = { file = "README.md", content-type = "text/markdown" }
requires-python = ">=3.7, <4"
license = { text = "Apache-2.0" }
classifiers = [
    "Development Status :: 3 - Alpha",
    "Intended Audience :: Developers",
    "Intended Audience :: Science/Research",
    "Topic :: Scientific/Engineering :: Artificial Intelligence",
    # Must agree with the `license` field above (Apache-2.0).
    "License :: OSI Approved :: Apache Software License",
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3.7",
    "Programming Language :: Python :: 3.8",
    "Programming Language :: Python :: 3.9",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3 :: Only",
]
keywords = [
    "AI",
    "artificial intelligence",
]
# These fields are filled in at build time from [tool.setuptools.dynamic].
dynamic = ["version", "dependencies"]

# Project links published with the package metadata; each key is the label
# shown next to the URL.
[project.urls]
Github = "https://github.com/Open-DataFlow/DataFlow"
Documentation = "https://open-dataflow.github.io/DataFlow-Doc/"
# Quoted because the label contains a space.
"Bug Reports" = "https://github.com/Open-DataFlow/DataFlow/issues"

# Console entry points: installs a `dataflow` command that calls the `main`
# object in the `dataflow.cli` module.
[project.scripts]
dataflow = "dataflow.cli:main"

# setuptools-specific packaging options.
# NOTE(review): an explicit `packages` list does not pull in subpackages on
# its own; confirm that any `dataflow.*` subpackages still end up in the
# built distribution, or switch to package discovery.
[tool.setuptools]
include-package-data = true
packages = ["dataflow"]  # explicitly specify the main package


# Sources for the fields listed under `dynamic` in [project]:
# the version is read from the `__version__` attribute of `dataflow.version`,
# and the runtime dependencies are read from `requirements.txt`.
[tool.setuptools.dynamic]
version = {attr = "dataflow.version.__version__"}
dependencies = {file = "requirements.txt"}


# Optional feature sets, installed with `pip install open-dataflow[<extra>]`.
[project.optional-dependencies]
# NOTE(review): this extra allows vllm 0.9.2 (`<=`), while `pdf2model` and
# `eval` below exclude it (`<`); confirm which upper bound is intended.
vllm = ["vllm>=0.7.0,<=0.9.2", "numpy<2.0.0"]
# NOTE(review): `vllm07` / `vllm08` only set an upper bound, so versions older
# than the one each name suggests also satisfy them; confirm whether a lower
# bound is wanted.
vllm07 = ["vllm<0.8", "numpy<2.0.0"]
vllm08 = ["vllm<0.9"]
kbc = ["vllm==0.6.3", "mineru[pipeline]==2.0.6"]
# numpy must be at least 1.24 and below 2.0.0.
mineru = ["mineru[all]", "numpy>=1.24,<2.0.0", "sglang[all]>=0.4.8", "pypdf", "reportlab"]
myscale = ["clickhouse-driver"]
sglang = ["sglang[all]"]
litellm = ["litellm>=1.70.0,<2.0.0"]
audio = ["librosa", "soundfile"]
vectorsql = ["sqlite-vec", "sqlite-lembed", "sentence_transformers"]
# The current pdf2model environment does not support muxi.
pdf2model = [
    "llamafactory[torch,metrics]>=0.9.0",
    "vllm>=0.7.0,<0.9.2",
    "numpy>=1.24,<2.0.0",
    "mineru[pipeline]",
    "mineru-vl-utils",
]
eval = [
    "vllm>=0.7.0,<0.9.2",
]
# `asyncio` is part of the standard library on every supported Python, so it
# is not listed here; the PyPI package of that name is an obsolete backport.
rag = ["lightrag-hku"]