Unverified commit ef0a4721, authored by dagil-nvidia, committed by GitHub
Browse files

fix: update ai-dynamo[vllm] version and pin transformers (#4592)


Signed-off-by: Dan Gil <dagil@nvidia.com>
parent 6e9782ba
......@@ -46,7 +46,8 @@ dependencies = [
"pydantic>=2",
"tabulate",
"types-tabulate",
"transformers<=4.57.1",
# Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.2.0rc2/rc3 (==4.56.0), SGLang 0.5.4.post3 (==4.57.1)
"transformers>=4.56.0,<=4.57.1",
"pytest-mypy",
]
......
......@@ -36,7 +36,12 @@ scipy<1.14.0 # Pin scipy version for pmdarima compatibility
sentencepiece
tensorboard==2.19.0
tensorboardX==2.6.2.2
transformers<=4.57.1
# Transformers version constraint for container builds
# - vLLM 0.11.0: >=4.55.2, vLLM 0.11.2: >=4.56.0,<5
# - TensorRT-LLM 1.2.0rc2/rc3: ==4.56.0
# - SGLang 0.5.4.post3: ==4.57.1
# Using >=4.56.0 to satisfy all frameworks
transformers>=4.56.0,<=4.57.1
types-aiofiles
types-PyYAML
uvicorn
......@@ -14,6 +14,7 @@ license-files = ["LICENSE"]
requires-python = ">=3.10"
dependencies = [
"ai-dynamo-runtime==0.7.0",
"transformers>=4.56.0,<=4.57.1",
"pytest>=8.3.4",
"types-psutil>=7.0.0.20250218",
"kubernetes>=32.0.1,<33.0.0",
......@@ -55,7 +56,7 @@ trtllm =[
vllm = [
"uvloop",
"nixl[cu12]<=0.7.1",
"vllm[flashinfer]==0.10.2",
"vllm[flashinfer]==0.11.0",
]
sglang = [
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment