Unverified Commit ef0a4721 authored by dagil-nvidia, committed by GitHub
Browse files

fix: update ai-dynamo[vllm] version and pin transformers (#4592)


Signed-off-by: Dan Gil <dagil@nvidia.com>
parent 6e9782ba
...@@ -46,7 +46,8 @@ dependencies = [ ...@@ -46,7 +46,8 @@ dependencies = [
"pydantic>=2", "pydantic>=2",
"tabulate", "tabulate",
"types-tabulate", "types-tabulate",
"transformers<=4.57.1", # Satisfies vLLM 0.11.0 (>=4.55.2), vLLM 0.11.2 (>=4.56.0,<5), TRT-LLM 1.2.0rc2/rc3 (==4.56.0), SGLang 0.5.4.post3 (==4.57.1)
"transformers>=4.56.0,<=4.57.1",
"pytest-mypy", "pytest-mypy",
] ]
...@@ -86,4 +87,4 @@ addopts = [ ...@@ -86,4 +87,4 @@ addopts = [
"--ignore-glob=*model.py", "--ignore-glob=*model.py",
"--ignore-glob=*_inc.py", "--ignore-glob=*_inc.py",
"--ignore-glob=deploy/cloud/api-store/*", "--ignore-glob=deploy/cloud/api-store/*",
] ]
\ No newline at end of file
...@@ -36,7 +36,12 @@ scipy<1.14.0 # Pin scipy version for pmdarima compatibility ...@@ -36,7 +36,12 @@ scipy<1.14.0 # Pin scipy version for pmdarima compatibility
sentencepiece sentencepiece
tensorboard==2.19.0 tensorboard==2.19.0
tensorboardX==2.6.2.2 tensorboardX==2.6.2.2
transformers<=4.57.1 # Transformers version constraint for container builds
# - vLLM 0.11.0: >=4.55.2, vLLM 0.11.2: >=4.56.0,<5
# - TensorRT-LLM 1.2.0rc2/rc3: ==4.56.0
# - SGLang 0.5.4.post3: ==4.57.1
# Using >=4.56.0 to satisfy all frameworks
transformers>=4.56.0,<=4.57.1
types-aiofiles types-aiofiles
types-PyYAML types-PyYAML
uvicorn uvicorn
...@@ -14,6 +14,7 @@ license-files = ["LICENSE"] ...@@ -14,6 +14,7 @@ license-files = ["LICENSE"]
requires-python = ">=3.10" requires-python = ">=3.10"
dependencies = [ dependencies = [
"ai-dynamo-runtime==0.7.0", "ai-dynamo-runtime==0.7.0",
"transformers>=4.56.0,<=4.57.1",
"pytest>=8.3.4", "pytest>=8.3.4",
"types-psutil>=7.0.0.20250218", "types-psutil>=7.0.0.20250218",
"kubernetes>=32.0.1,<33.0.0", "kubernetes>=32.0.1,<33.0.0",
...@@ -55,7 +56,7 @@ trtllm =[ ...@@ -55,7 +56,7 @@ trtllm =[
vllm = [ vllm = [
"uvloop", "uvloop",
"nixl[cu12]<=0.7.1", "nixl[cu12]<=0.7.1",
"vllm[flashinfer]==0.10.2", "vllm[flashinfer]==0.11.0",
] ]
sglang = [ sglang = [
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment