Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
text-generation-inference
Commits
e6bb3ff8
Unverified
Commit
e6bb3ff8
authored
Feb 28, 2024
by
OlivierDehaene
Committed by
GitHub
Feb 28, 2024
Browse files
v1.4.3 (#1609)
parent
26cdea5c
Changes
12
Show whitespace changes
Inline
Side-by-side
Showing
12 changed files
with
86 additions
and
88 deletions
+86
-88
Cargo.lock
Cargo.lock
+75
-75
Cargo.toml
Cargo.toml
+1
-1
docs/openapi.json
docs/openapi.json
+1
-1
docs/source/_toctree.yml
docs/source/_toctree.yml
+0
-2
docs/source/conceptual/guidance.md
docs/source/conceptual/guidance.md
+2
-2
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_no_tools.json
..._/test_tools_llama/test_flash_llama_grammar_no_tools.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools.json
...ts__/test_tools_llama/test_flash_llama_grammar_tools.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_auto.json
...test_tools_llama/test_flash_llama_grammar_tools_auto.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_choice.json
...st_tools_llama/test_flash_llama_grammar_tools_choice.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_stream.json
...st_tools_llama/test_flash_llama_grammar_tools_stream.json
+1
-1
integration-tests/pyproject.toml
integration-tests/pyproject.toml
+1
-1
server/pyproject.toml
server/pyproject.toml
+1
-1
No files found.
Cargo.lock
View file @
e6bb3ff8
...
@@ -19,9 +19,9 @@ checksum = "f26201604c87b1e01bd3d98f8d5d9a8fcbb815e8cedb41ffccbeb4bf593a35fe"
...
@@ -19,9 +19,9 @@ checksum = "f26201604c87b1e01bd3d98f8d5d9a8fcbb815e8cedb41ffccbeb4bf593a35fe"
[[package]]
[[package]]
name = "ahash"
name = "ahash"
version = "0.8.
9
"
version = "0.8.
10
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
d713b3834d76b85304d4d525563c1276e2e30dc97cc67bfb4585a4a29fc2c89f
"
checksum = "
8b79b82693f705137f8fb9b37871d99e4f9a7df12b917eed79c3d3954830a60b
"
dependencies = [
dependencies = [
"cfg-if",
"cfg-if",
"getrandom",
"getrandom",
...
@@ -42,9 +42,9 @@ dependencies = [
...
@@ -42,9 +42,9 @@ dependencies = [
[[package]]
[[package]]
name = "anstream"
name = "anstream"
version = "0.6.1
2
"
version = "0.6.1
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "96b
09b5178381e0874812a9b157f7fe84982617e48f71f4e3235482775e5b540
"
checksum = "
d
96b
d03f33fe50a863e394ee9718a706f988b9079b20c3784fb726e7678b62fb
"
dependencies = [
dependencies = [
"anstyle",
"anstyle",
"anstyle-parse",
"anstyle-parse",
...
@@ -130,7 +130,7 @@ checksum = "16e62a023e7c117e27523144c5d2459f4397fcc3cab0085af8e2224f643a0193"
...
@@ -130,7 +130,7 @@ checksum = "16e62a023e7c117e27523144c5d2459f4397fcc3cab0085af8e2224f643a0193"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -141,7 +141,7 @@ checksum = "c980ee35e870bd1a4d2c8294d4c04d0499e67bca1e4b5cefcc693c2fa00caea9"
...
@@ -141,7 +141,7 @@ checksum = "c980ee35e870bd1a4d2c8294d4c04d0499e67bca1e4b5cefcc693c2fa00caea9"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -305,9 +305,9 @@ dependencies = [
...
@@ -305,9 +305,9 @@ dependencies = [
[[package]]
[[package]]
name = "bumpalo"
name = "bumpalo"
version = "3.15.
1
"
version = "3.15.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
c764d619ca78fccbf3069b37bd7af92577f044bb15236036662d79b6559f2
5b
7
"
checksum = "
8ea184aa71bb362a1157c896979544cc23974e08fd265f29ea96b59f0b4a55
5b"
[[package]]
[[package]]
name = "bytecount"
name = "bytecount"
...
@@ -367,9 +367,9 @@ checksum = "df8670b8c7b9dae1793364eafadf7239c40d669904660c5960d74cfd80b46a53"
...
@@ -367,9 +367,9 @@ checksum = "df8670b8c7b9dae1793364eafadf7239c40d669904660c5960d74cfd80b46a53"
[[package]]
[[package]]
name = "cc"
name = "cc"
version = "1.0.8
6
"
version = "1.0.8
8
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
7f9fa1897e4325be0d68d48df6aa1a
71ac
2ed4d27723887e7754192705350730
"
checksum = "
02f341c093d19155a6e41631ce59
71a
a
c
4e9a868262212153124c15fa22d1cdc
"
[[package]]
[[package]]
name = "cfg-if"
name = "cfg-if"
...
@@ -408,7 +408,7 @@ dependencies = [
...
@@ -408,7 +408,7 @@ dependencies = [
"heck",
"heck",
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -870,7 +870,7 @@ checksum = "87750cf4b7a4c0625b1529e4c543c2182106e4dedc60a2a6455e00d212c489ac"
...
@@ -870,7 +870,7 @@ checksum = "87750cf4b7a4c0625b1529e4c543c2182106e4dedc60a2a6455e00d212c489ac"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -999,9 +999,9 @@ checksum = "95505c38b4572b2d910cecb0281560f54b440a19336cbbcb27bf6ce6adc6f5a8"
...
@@ -999,9 +999,9 @@ checksum = "95505c38b4572b2d910cecb0281560f54b440a19336cbbcb27bf6ce6adc6f5a8"
[[package]]
[[package]]
name = "hermit-abi"
name = "hermit-abi"
version = "0.3.
6
"
version = "0.3.
8
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
bd5256b483761cd2369
9d
0
da
46cc6fd2ee3be420bbe6d020ae4a091e70b7e9fd
"
checksum = "
37
9d
a
da
1584ad501b383485dd706b8afb7a70fcbc7f4da7d780638a5a6124a60
"
[[package]]
[[package]]
name = "hf-hub"
name = "hf-hub"
...
@@ -1438,7 +1438,7 @@ checksum = "38b4faf00617defe497754acde3024865bc143d44a86799b24e191ecff91354f"
...
@@ -1438,7 +1438,7 @@ checksum = "38b4faf00617defe497754acde3024865bc143d44a86799b24e191ecff91354f"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -1526,7 +1526,7 @@ checksum = "f686d68a09079e63b1d2c64aa305095887ce50565f00a922ebfaeeee0d9ba6ce"
...
@@ -1526,7 +1526,7 @@ checksum = "f686d68a09079e63b1d2c64aa305095887ce50565f00a922ebfaeeee0d9ba6ce"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -1822,7 +1822,7 @@ checksum = "a948666b637a0f465e8564c73e89d4dde00d72d4d473cc972f390fc3dcee7d9c"
...
@@ -1822,7 +1822,7 @@ checksum = "a948666b637a0f465e8564c73e89d4dde00d72d4d473cc972f390fc3dcee7d9c"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -1833,9 +1833,9 @@ checksum = "ff011a302c396a5197692431fc1948019154afc178baf7d8e37367442a4601cf"
...
@@ -1833,9 +1833,9 @@ checksum = "ff011a302c396a5197692431fc1948019154afc178baf7d8e37367442a4601cf"
[[package]]
[[package]]
name = "openssl-sys"
name = "openssl-sys"
version = "0.9.10
0
"
version = "0.9.10
1
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
ae94056a791d0e1217d18b6cbdccb02c61e3054fc69893607f4067e3bb0b1fd1
"
checksum = "
dda2b0f344e78efc2facf7d195d098df0dd72151b26ab98da807afc26c198dff
"
dependencies = [
dependencies = [
"cc",
"cc",
"libc",
"libc",
...
@@ -2038,7 +2038,7 @@ checksum = "266c042b60c9c76b8d53061e52b2e0d1116abc57cefc8c5cd671619a56ac3690"
...
@@ -2038,7 +2038,7 @@ checksum = "266c042b60c9c76b8d53061e52b2e0d1116abc57cefc8c5cd671619a56ac3690"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -2084,7 +2084,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
...
@@ -2084,7 +2084,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "a41cf62165e97c7f814d2221421dbb9afcbcdb0a88068e5ea206e19951c2cbb5"
checksum = "a41cf62165e97c7f814d2221421dbb9afcbcdb0a88068e5ea206e19951c2cbb5"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -2157,7 +2157,7 @@ dependencies = [
...
@@ -2157,7 +2157,7 @@ dependencies = [
"prost 0.12.3",
"prost 0.12.3",
"prost-types",
"prost-types",
"regex",
"regex",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
"tempfile",
"tempfile",
"which",
"which",
]
]
...
@@ -2185,7 +2185,7 @@ dependencies = [
...
@@ -2185,7 +2185,7 @@ dependencies = [
"itertools 0.11.0",
"itertools 0.11.0",
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -2280,9 +2280,9 @@ dependencies = [
...
@@ -2280,9 +2280,9 @@ dependencies = [
[[package]]
[[package]]
name = "rayon"
name = "rayon"
version = "1.
8.1
"
version = "1.
9.0
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
fa7237101a77a10773db45d62004a272517633fbcc3df19d96455ede1122e051
"
checksum = "
e4963ed1bc86e4f3ee217022bd855b297cef07fb9eac5dfa1f788b220b49b3bd
"
dependencies = [
dependencies = [
"either",
"either",
"rayon-core",
"rayon-core",
...
@@ -2470,7 +2470,7 @@ dependencies = [
...
@@ -2470,7 +2470,7 @@ dependencies = [
"quote",
"quote",
"rust-embed-utils",
"rust-embed-utils",
"shellexpand",
"shellexpand",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
"walkdir",
"walkdir",
]
]
...
@@ -2549,9 +2549,9 @@ dependencies = [
...
@@ -2549,9 +2549,9 @@ dependencies = [
[[package]]
[[package]]
name = "rustls-pki-types"
name = "rustls-pki-types"
version = "1.3.
0
"
version = "1.3.
1
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
048a63e5b3ac996d78d402940b5fa47973d2d080c6c6fffa1d0f19c4445310b7
"
checksum = "
5ede67b28608b4c60685c7d54122d4400d90f62b40caee7700e700380a390fa8
"
[[package]]
[[package]]
name = "rustls-webpki"
name = "rustls-webpki"
...
@@ -2659,7 +2659,7 @@ checksum = "7eb0b34b42edc17f6b7cac84a52a1c5f0e1bb2227e997ca9011ea3dd34e8610b"
...
@@ -2659,7 +2659,7 @@ checksum = "7eb0b34b42edc17f6b7cac84a52a1c5f0e1bb2227e997ca9011ea3dd34e8610b"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -2786,12 +2786,12 @@ checksum = "e6ecd384b10a64542d77071bd64bd7b231f4ed5940fba55e98c3de13824cf3d7"
...
@@ -2786,12 +2786,12 @@ checksum = "e6ecd384b10a64542d77071bd64bd7b231f4ed5940fba55e98c3de13824cf3d7"
[[package]]
[[package]]
name = "socket2"
name = "socket2"
version = "0.5.
5
"
version = "0.5.
6
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
7b5fac59a5cb5dd637972e5fca70daf0523c9067fcdc4842f053dae04a18f8e9
"
checksum = "
05ffd9c0a93b7543e062e759284fcf5f5e3b098501104bfbdde4d404db792871
"
dependencies = [
dependencies = [
"libc",
"libc",
"windows-sys 0.
48
.0",
"windows-sys 0.
52
.0",
]
]
[[package]]
[[package]]
...
@@ -2849,7 +2849,7 @@ dependencies = [
...
@@ -2849,7 +2849,7 @@ dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"rustversion",
"rustversion",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -2871,9 +2871,9 @@ dependencies = [
...
@@ -2871,9 +2871,9 @@ dependencies = [
[[package]]
[[package]]
name = "syn"
name = "syn"
version = "2.0.5
0
"
version = "2.0.5
1
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
74f1bdc9872430ce9b75da68329d1c1746faf50ffac5f19e02b71e37ff881ffb
"
checksum = "
6ab617d94515e94ae53b8406c628598680aa0c9587474ecbe58188f7b345d66c
"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
...
@@ -2947,9 +2947,9 @@ dependencies = [
...
@@ -2947,9 +2947,9 @@ dependencies = [
[[package]]
[[package]]
name = "tempfile"
name = "tempfile"
version = "3.10.
0
"
version = "3.10.
1
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
a365e8cd18e44762ef95d87f284f4b5cd04107fec2ff3052bd6a3e6069669e67
"
checksum = "
85b77fafb263dd9d05cbeac119526425676db3784113aa9295c88498cbf8bff1
"
dependencies = [
dependencies = [
"cfg-if",
"cfg-if",
"fastrand",
"fastrand",
...
@@ -2959,7 +2959,7 @@ dependencies = [
...
@@ -2959,7 +2959,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-benchmark"
name = "text-generation-benchmark"
version = "1.4.
2
"
version = "1.4.
3
"
dependencies = [
dependencies = [
"average",
"average",
"clap",
"clap",
...
@@ -2980,7 +2980,7 @@ dependencies = [
...
@@ -2980,7 +2980,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-client"
name = "text-generation-client"
version = "1.4.
2
"
version = "1.4.
3
"
dependencies = [
dependencies = [
"futures",
"futures",
"grpc-metadata",
"grpc-metadata",
...
@@ -2996,7 +2996,7 @@ dependencies = [
...
@@ -2996,7 +2996,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-launcher"
name = "text-generation-launcher"
version = "1.4.
2
"
version = "1.4.
3
"
dependencies = [
dependencies = [
"clap",
"clap",
"ctrlc",
"ctrlc",
...
@@ -3012,7 +3012,7 @@ dependencies = [
...
@@ -3012,7 +3012,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-router"
name = "text-generation-router"
version = "1.4.
2
"
version = "1.4.
3
"
dependencies = [
dependencies = [
"async-stream",
"async-stream",
"axum",
"axum",
...
@@ -3065,7 +3065,7 @@ checksum = "a953cb265bef375dae3de6663da4d3804eee9682ea80d8e2542529b73c531c81"
...
@@ -3065,7 +3065,7 @@ checksum = "a953cb265bef375dae3de6663da4d3804eee9682ea80d8e2542529b73c531c81"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -3231,7 +3231,7 @@ checksum = "5b8a1e28f2deaa14e508979454cb3a223b10b938b45af148bc0986de36f1923b"
...
@@ -3231,7 +3231,7 @@ checksum = "5b8a1e28f2deaa14e508979454cb3a223b10b938b45af148bc0986de36f1923b"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -3346,7 +3346,7 @@ dependencies = [
...
@@ -3346,7 +3346,7 @@ dependencies = [
"proc-macro2",
"proc-macro2",
"prost-build",
"prost-build",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -3419,7 +3419,7 @@ checksum = "34704c8d6ebcbc939824180af020566b01a7c01f80641264eba0999f6c2b6be7"
...
@@ -3419,7 +3419,7 @@ checksum = "34704c8d6ebcbc939824180af020566b01a7c01f80641264eba0999f6c2b6be7"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -3660,7 +3660,7 @@ dependencies = [
...
@@ -3660,7 +3660,7 @@ dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"regex",
"regex",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
@@ -3765,7 +3765,7 @@ dependencies = [
...
@@ -3765,7 +3765,7 @@ dependencies = [
"once_cell",
"once_cell",
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
"wasm-bindgen-shared",
"wasm-bindgen-shared",
]
]
...
@@ -3799,7 +3799,7 @@ checksum = "642f325be6301eb8107a83d12a8ac6c1e1c54345a7ef1a9261962dfefda09e66"
...
@@ -3799,7 +3799,7 @@ checksum = "642f325be6301eb8107a83d12a8ac6c1e1c54345a7ef1a9261962dfefda09e66"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
"wasm-bindgen-backend",
"wasm-bindgen-backend",
"wasm-bindgen-shared",
"wasm-bindgen-shared",
]
]
...
@@ -3889,7 +3889,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
...
@@ -3889,7 +3889,7 @@ source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "e48a53791691ab099e5e2ad123536d0fff50652600abaf43bbf952894110d0be"
checksum = "e48a53791691ab099e5e2ad123536d0fff50652600abaf43bbf952894110d0be"
dependencies = [
dependencies = [
"windows-core",
"windows-core",
"windows-targets 0.52.
0
",
"windows-targets 0.52.
3
",
]
]
[[package]]
[[package]]
...
@@ -3898,7 +3898,7 @@ version = "0.52.0"
...
@@ -3898,7 +3898,7 @@ version = "0.52.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "33ab640c8d7e35bf8ba19b884ba838ceb4fba93a4e8c65a9059d08afcfc683d9"
checksum = "33ab640c8d7e35bf8ba19b884ba838ceb4fba93a4e8c65a9059d08afcfc683d9"
dependencies = [
dependencies = [
"windows-targets 0.52.
0
",
"windows-targets 0.52.
3
",
]
]
[[package]]
[[package]]
...
@@ -3925,7 +3925,7 @@ version = "0.52.0"
...
@@ -3925,7 +3925,7 @@ version = "0.52.0"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d"
dependencies = [
dependencies = [
"windows-targets 0.52.
0
",
"windows-targets 0.52.
3
",
]
]
[[package]]
[[package]]
...
@@ -3960,17 +3960,17 @@ dependencies = [
...
@@ -3960,17 +3960,17 @@ dependencies = [
[[package]]
[[package]]
name = "windows-targets"
name = "windows-targets"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
8a18201040b24831fbb9e4eb208f8892e1f50a37feb53cc7ff887feb8f50e7cd
"
checksum = "
d380ba1dc7187569a8a9e91ed34b8ccfc33123bbacb8c0aed2d1ad7f3ef2dc5f
"
dependencies = [
dependencies = [
"windows_aarch64_gnullvm 0.52.
0
",
"windows_aarch64_gnullvm 0.52.
3
",
"windows_aarch64_msvc 0.52.
0
",
"windows_aarch64_msvc 0.52.
3
",
"windows_i686_gnu 0.52.
0
",
"windows_i686_gnu 0.52.
3
",
"windows_i686_msvc 0.52.
0
",
"windows_i686_msvc 0.52.
3
",
"windows_x86_64_gnu 0.52.
0
",
"windows_x86_64_gnu 0.52.
3
",
"windows_x86_64_gnullvm 0.52.
0
",
"windows_x86_64_gnullvm 0.52.
3
",
"windows_x86_64_msvc 0.52.
0
",
"windows_x86_64_msvc 0.52.
3
",
]
]
[[package]]
[[package]]
...
@@ -3987,9 +3987,9 @@ checksum = "2b38e32f0abccf9987a4e3079dfb67dcd799fb61361e53e2882c3cbaf0d905d8"
...
@@ -3987,9 +3987,9 @@ checksum = "2b38e32f0abccf9987a4e3079dfb67dcd799fb61361e53e2882c3cbaf0d905d8"
[[package]]
[[package]]
name = "windows_aarch64_gnullvm"
name = "windows_aarch64_gnullvm"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
cb7764e35d4db8a7921e09562a0304bf2f93e0a51bfccee0bd0bb0b666b015ea
"
checksum = "
68e5dcfb9413f53afd9c8f86e56a7b4d86d9a2fa26090ea2dc9e40fba56c6ec6
"
[[package]]
[[package]]
name = "windows_aarch64_msvc"
name = "windows_aarch64_msvc"
...
@@ -4005,9 +4005,9 @@ checksum = "dc35310971f3b2dbbf3f0690a219f40e2d9afcf64f9ab7cc1be722937c26b4bc"
...
@@ -4005,9 +4005,9 @@ checksum = "dc35310971f3b2dbbf3f0690a219f40e2d9afcf64f9ab7cc1be722937c26b4bc"
[[package]]
[[package]]
name = "windows_aarch64_msvc"
name = "windows_aarch64_msvc"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
bbaa0368d4f1d2aaefc55b6fcfee13f41544ddf36801e793edbbfd7d7df075e
f"
checksum = "
8dab469ebbc45798319e69eebf92308e541ce46760b49b18c6b3fe5e8965b30
f"
[[package]]
[[package]]
name = "windows_i686_gnu"
name = "windows_i686_gnu"
...
@@ -4023,9 +4023,9 @@ checksum = "a75915e7def60c94dcef72200b9a8e58e5091744960da64ec734a6c6e9b3743e"
...
@@ -4023,9 +4023,9 @@ checksum = "a75915e7def60c94dcef72200b9a8e58e5091744960da64ec734a6c6e9b3743e"
[[package]]
[[package]]
name = "windows_i686_gnu"
name = "windows_i686_gnu"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
a28637cb1fa3560a16915793afb20081aba2c92ee8af57b4d5f28e4b3e7df313
"
checksum = "
2a4e9b6a7cac734a8b4138a4e1044eac3404d8326b6c0f939276560687a033fb
"
[[package]]
[[package]]
name = "windows_i686_msvc"
name = "windows_i686_msvc"
...
@@ -4041,9 +4041,9 @@ checksum = "8f55c233f70c4b27f66c523580f78f1004e8b5a8b659e05a4eb49d4166cca406"
...
@@ -4041,9 +4041,9 @@ checksum = "8f55c233f70c4b27f66c523580f78f1004e8b5a8b659e05a4eb49d4166cca406"
[[package]]
[[package]]
name = "windows_i686_msvc"
name = "windows_i686_msvc"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
ffe5e8e31046ce6230cc7215707b816e339ff4d4d67c65dffa206fd0f7aa7b9a
"
checksum = "
28b0ec9c422ca95ff34a78755cfa6ad4a51371da2a5ace67500cf7ca5f232c58
"
[[package]]
[[package]]
name = "windows_x86_64_gnu"
name = "windows_x86_64_gnu"
...
@@ -4059,9 +4059,9 @@ checksum = "53d40abd2583d23e4718fddf1ebec84dbff8381c07cae67ff7768bbf19c6718e"
...
@@ -4059,9 +4059,9 @@ checksum = "53d40abd2583d23e4718fddf1ebec84dbff8381c07cae67ff7768bbf19c6718e"
[[package]]
[[package]]
name = "windows_x86_64_gnu"
name = "windows_x86_64_gnu"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
3d6fa32db2bc4a2f5abeacf2b69f7992cd09dca97498da74a151a3132c26befd
"
checksum = "
704131571ba93e89d7cd43482277d6632589b18ecf4468f591fbae0a8b101614
"
[[package]]
[[package]]
name = "windows_x86_64_gnullvm"
name = "windows_x86_64_gnullvm"
...
@@ -4077,9 +4077,9 @@ checksum = "0b7b52767868a23d5bab768e390dc5f5c55825b6d30b86c844ff2dc7414044cc"
...
@@ -4077,9 +4077,9 @@ checksum = "0b7b52767868a23d5bab768e390dc5f5c55825b6d30b86c844ff2dc7414044cc"
[[package]]
[[package]]
name = "windows_x86_64_gnullvm"
name = "windows_x86_64_gnullvm"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
1a657e1e9d3f514745a572a6846d3c7aa7dbe1658c056ed9c3344c4109a6949e
"
checksum = "
42079295511643151e98d61c38c0acc444e52dd42ab456f7ccfd5152e8ecf21c
"
[[package]]
[[package]]
name = "windows_x86_64_msvc"
name = "windows_x86_64_msvc"
...
@@ -4095,9 +4095,9 @@ checksum = "ed94fce61571a4006852b7389a063ab983c02eb1bb37b47f8272ce92d06d9538"
...
@@ -4095,9 +4095,9 @@ checksum = "ed94fce61571a4006852b7389a063ab983c02eb1bb37b47f8272ce92d06d9538"
[[package]]
[[package]]
name = "windows_x86_64_msvc"
name = "windows_x86_64_msvc"
version = "0.52.
0
"
version = "0.52.
3
"
source = "registry+https://github.com/rust-lang/crates.io-index"
source = "registry+https://github.com/rust-lang/crates.io-index"
checksum = "
dff9641d1cd4be8d1a070daf9e3773c5f67e78b4d9d42263020c057706765c04
"
checksum = "
0770833d60a970638e989b3fa9fd2bb1aaadcf88963d1659fd7d9990196ed2d6
"
[[package]]
[[package]]
name = "winreg"
name = "winreg"
...
@@ -4126,7 +4126,7 @@ checksum = "9ce1b18ccd8e73a9321186f97e46f9f04b778851177567b1975109d26a08d2a6"
...
@@ -4126,7 +4126,7 @@ checksum = "9ce1b18ccd8e73a9321186f97e46f9f04b778851177567b1975109d26a08d2a6"
dependencies = [
dependencies = [
"proc-macro2",
"proc-macro2",
"quote",
"quote",
"syn 2.0.5
0
",
"syn 2.0.5
1
",
]
]
[[package]]
[[package]]
...
...
Cargo.toml
View file @
e6bb3ff8
...
@@ -9,7 +9,7 @@ members = [
...
@@ -9,7 +9,7 @@ members = [
resolver
=
"2"
resolver
=
"2"
[workspace.package]
[workspace.package]
version
=
"1.4.
2
"
version
=
"1.4.
3
"
edition
=
"2021"
edition
=
"2021"
authors
=
[
"Olivier Dehaene"
]
authors
=
[
"Olivier Dehaene"
]
homepage
=
"https://github.com/huggingface/text-generation-inference"
homepage
=
"https://github.com/huggingface/text-generation-inference"
...
...
docs/openapi.json
View file @
e6bb3ff8
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
"name"
:
"Apache 2.0"
,
"name"
:
"Apache 2.0"
,
"url"
:
"https://www.apache.org/licenses/LICENSE-2.0"
"url"
:
"https://www.apache.org/licenses/LICENSE-2.0"
},
},
"version"
:
"1.4.
2
"
"version"
:
"1.4.
3
"
},
},
"paths"
:
{
"paths"
:
{
"/"
:
{
"/"
:
{
...
...
docs/source/_toctree.yml
View file @
e6bb3ff8
...
@@ -9,8 +9,6 @@
...
@@ -9,8 +9,6 @@
title
:
Supported Models and Hardware
title
:
Supported Models and Hardware
-
local
:
messages_api
-
local
:
messages_api
title
:
Messages API
title
:
Messages API
-
local
:
guidance
title
:
Guidance
title
:
Getting started
title
:
Getting started
-
sections
:
-
sections
:
-
local
:
basic_tutorials/consuming_tgi
-
local
:
basic_tutorials/consuming_tgi
...
...
docs/source/conceptual/guidance.md
View file @
e6bb3ff8
...
@@ -262,7 +262,7 @@ curl localhost:3000/v1/chat/completions \
...
@@ -262,7 +262,7 @@ curl localhost:3000/v1/chat/completions \
],
],
"tool_choice"
:
"get_current_weather"
"tool_choice"
:
"get_current_weather"
}
'
}
'
//
{
"id"
:
""
,
"object"
:
"text_completion"
,
"created"
:
1709051640
,
"model"
:
"HuggingFaceH4/zephyr-7b-beta"
,
"system_fingerprint"
:
"1.4.
2
-native"
,
"choices"
:[{
"index"
:
0
,
"message"
:{
"role"
:
"assistant"
,
"tool_calls"
:{
"id"
:
0
,
"type"
:
"function"
,
"function"
:{
"description"
:
null
,
"name"
:
"tools"
,
"parameters"
:{
"format"
:
"celsius"
,
"location"
:
"New York"
}}}},
"logprobs"
:
null
,
"finish_reason"
:
"eos_token"
}],
"usage"
:{
"prompt_tokens"
:
157
,
"completion_tokens"
:
19
,
"total_tokens"
:
176
}}
//
{
"id"
:
""
,
"object"
:
"text_completion"
,
"created"
:
1709051640
,
"model"
:
"HuggingFaceH4/zephyr-7b-beta"
,
"system_fingerprint"
:
"1.4.
3
-native"
,
"choices"
:[{
"index"
:
0
,
"message"
:{
"role"
:
"assistant"
,
"tool_calls"
:{
"id"
:
0
,
"type"
:
"function"
,
"function"
:{
"description"
:
null
,
"name"
:
"tools"
,
"parameters"
:{
"format"
:
"celsius"
,
"location"
:
"New York"
}}}},
"logprobs"
:
null
,
"finish_reason"
:
"eos_token"
}],
"usage"
:{
"prompt_tokens"
:
157
,
"completion_tokens"
:
19
,
"total_tokens"
:
176
}}
```
```
<details>
<details>
...
@@ -362,7 +362,7 @@ if __name__ == "__main__":
...
@@ -362,7 +362,7 @@ if __name__ == "__main__":
import
asyncio
import
asyncio
asyncio
.
run
(
main
())
asyncio
.
run
(
main
())
# {"id":"","object":"text_completion","created":1709051942,"model":"HuggingFaceH4/zephyr-7b-beta","system_fingerprint":"1.4.
2
-native","choices":[{"index":0,"message":{"role":"assistant","tool_calls":{"id":0,"type":"function","function":{"description":null,"name":"tools","parameters":{"format":"celsius","location":"New York"}}}},"logprobs":null,"finish_reason":"eos_token"}],"usage":{"prompt_tokens":157,"completion_tokens":20,"total_tokens":177}}
# {"id":"","object":"text_completion","created":1709051942,"model":"HuggingFaceH4/zephyr-7b-beta","system_fingerprint":"1.4.
3
-native","choices":[{"index":0,"message":{"role":"assistant","tool_calls":{"id":0,"type":"function","function":{"description":null,"name":"tools","parameters":{"format":"celsius","location":"New York"}}}},"logprobs":null,"finish_reason":"eos_token"}],"usage":{"prompt_tokens":157,"completion_tokens":20,"total_tokens":177}}
```
```
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_no_tools.json
View file @
e6bb3ff8
...
@@ -17,7 +17,7 @@
...
@@ -17,7 +17,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"1.4.
2
-native"
,
"system_fingerprint"
:
"1.4.
3
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
100
,
"completion_tokens"
:
100
,
"prompt_tokens"
:
60
,
"prompt_tokens"
:
60
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools.json
View file @
e6bb3ff8
...
@@ -29,7 +29,7 @@
...
@@ -29,7 +29,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"1.4.
2
-native"
,
"system_fingerprint"
:
"1.4.
3
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
29
,
"completion_tokens"
:
29
,
"prompt_tokens"
:
316
,
"prompt_tokens"
:
316
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_auto.json
View file @
e6bb3ff8
...
@@ -29,7 +29,7 @@
...
@@ -29,7 +29,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"1.4.
2
-native"
,
"system_fingerprint"
:
"1.4.
3
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
29
,
"completion_tokens"
:
29
,
"prompt_tokens"
:
316
,
"prompt_tokens"
:
316
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_choice.json
View file @
e6bb3ff8
...
@@ -28,7 +28,7 @@
...
@@ -28,7 +28,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"1.4.
2
-native"
,
"system_fingerprint"
:
"1.4.
3
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
21
,
"completion_tokens"
:
21
,
"prompt_tokens"
:
187
,
"prompt_tokens"
:
187
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_stream.json
View file @
e6bb3ff8
...
@@ -23,5 +23,5 @@
...
@@ -23,5 +23,5 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"1.4.
2
-native"
"system_fingerprint"
:
"1.4.
3
-native"
}
}
integration-tests/pyproject.toml
View file @
e6bb3ff8
[tool.poetry]
[tool.poetry]
name
=
"text-generation-integration-tests"
name
=
"text-generation-integration-tests"
version
=
"1.4.
2
"
version
=
"1.4.
3
"
description
=
"Text Generation Inference integration tests"
description
=
"Text Generation Inference integration tests"
authors
=
[
"Nicolas Patry <nicolas@huggingface.co>"
]
authors
=
[
"Nicolas Patry <nicolas@huggingface.co>"
]
...
...
server/pyproject.toml
View file @
e6bb3ff8
[tool.poetry]
[tool.poetry]
name
=
"text-generation-server"
name
=
"text-generation-server"
version
=
"1.4.
2
"
version
=
"1.4.
3
"
description
=
"Text Generation Inference Python gRPC Server"
description
=
"Text Generation Inference Python gRPC Server"
authors
=
[
"Olivier Dehaene <olivier@huggingface.co>"
]
authors
=
[
"Olivier Dehaene <olivier@huggingface.co>"
]
...
...
huangwb
@huangwb
mentioned in commit
23fba672
·
May 30, 2024
mentioned in commit
23fba672
mentioned in commit 23fba672e8156ce19cc518470a5452a9543c56b9
Toggle commit list
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment