Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
OpenDAS
text-generation-inference
Commits
2d0a7173
Commit
2d0a7173
authored
Apr 18, 2024
by
OlivierDehaene
Browse files
v2.0.1
parent
f9ee2c41
Changes
13
Show whitespace changes
Inline
Side-by-side
Showing
13 changed files
with
55 additions
and
55 deletions
+55
-55
Cargo.lock
Cargo.lock
+4
-4
Cargo.toml
Cargo.toml
+1
-1
docs/openapi.json
docs/openapi.json
+1
-1
integration-tests/models/__snapshots__/test_chat_llama/test_flash_llama_simple.json
..._snapshots__/test_chat_llama/test_flash_llama_simple.json
+1
-1
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_many_prompts.json
...ion_prompts/test_flash_llama_completion_many_prompts.json
+1
-1
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_many_prompts_stream.json
...mpts/test_flash_llama_completion_many_prompts_stream.json
+40
-40
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_single_prompt.json
...on_prompts/test_flash_llama_completion_single_prompt.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools.json
...ts__/test_tools_llama/test_flash_llama_grammar_tools.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_auto.json
...test_tools_llama/test_flash_llama_grammar_tools_auto.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_choice.json
...st_tools_llama/test_flash_llama_grammar_tools_choice.json
+1
-1
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_stream.json
...st_tools_llama/test_flash_llama_grammar_tools_stream.json
+1
-1
integration-tests/pyproject.toml
integration-tests/pyproject.toml
+1
-1
server/pyproject.toml
server/pyproject.toml
+1
-1
No files found.
Cargo.lock
View file @
2d0a7173
...
@@ -3393,7 +3393,7 @@ dependencies = [
...
@@ -3393,7 +3393,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-benchmark"
name = "text-generation-benchmark"
version = "2.0.
0
"
version = "2.0.
1
"
dependencies = [
dependencies = [
"average",
"average",
"clap",
"clap",
...
@@ -3414,7 +3414,7 @@ dependencies = [
...
@@ -3414,7 +3414,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-client"
name = "text-generation-client"
version = "2.0.
0
"
version = "2.0.
1
"
dependencies = [
dependencies = [
"futures",
"futures",
"grpc-metadata",
"grpc-metadata",
...
@@ -3430,7 +3430,7 @@ dependencies = [
...
@@ -3430,7 +3430,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-launcher"
name = "text-generation-launcher"
version = "2.0.
0
"
version = "2.0.
1
"
dependencies = [
dependencies = [
"clap",
"clap",
"ctrlc",
"ctrlc",
...
@@ -3448,7 +3448,7 @@ dependencies = [
...
@@ -3448,7 +3448,7 @@ dependencies = [
[[package]]
[[package]]
name = "text-generation-router"
name = "text-generation-router"
version = "2.0.
0
"
version = "2.0.
1
"
dependencies = [
dependencies = [
"async-stream",
"async-stream",
"axum",
"axum",
...
...
Cargo.toml
View file @
2d0a7173
...
@@ -9,7 +9,7 @@ members = [
...
@@ -9,7 +9,7 @@ members = [
resolver
=
"2"
resolver
=
"2"
[workspace.package]
[workspace.package]
version
=
"2.0.
0
"
version
=
"2.0.
1
"
edition
=
"2021"
edition
=
"2021"
authors
=
[
"Olivier Dehaene"
]
authors
=
[
"Olivier Dehaene"
]
homepage
=
"https://github.com/huggingface/text-generation-inference"
homepage
=
"https://github.com/huggingface/text-generation-inference"
...
...
docs/openapi.json
View file @
2d0a7173
...
@@ -10,7 +10,7 @@
...
@@ -10,7 +10,7 @@
"name"
:
"Apache 2.0"
,
"name"
:
"Apache 2.0"
,
"url"
:
"https://www.apache.org/licenses/LICENSE-2.0"
"url"
:
"https://www.apache.org/licenses/LICENSE-2.0"
},
},
"version"
:
"2.0.
0
"
"version"
:
"2.0.
1
"
},
},
"paths"
:
{
"paths"
:
{
"/"
:
{
"/"
:
{
...
...
integration-tests/models/__snapshots__/test_chat_llama/test_flash_llama_simple.json
View file @
2d0a7173
...
@@ -17,7 +17,7 @@
...
@@ -17,7 +17,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
100
,
"completion_tokens"
:
100
,
"prompt_tokens"
:
60
,
"prompt_tokens"
:
60
,
...
...
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_many_prompts.json
View file @
2d0a7173
...
@@ -29,7 +29,7 @@
...
@@ -29,7 +29,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
36
,
"completion_tokens"
:
36
,
"prompt_tokens"
:
8
,
"prompt_tokens"
:
8
,
...
...
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_many_prompts_stream.json
View file @
2d0a7173
...
@@ -12,7 +12,7 @@
...
@@ -12,7 +12,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -27,7 +27,7 @@
...
@@ -27,7 +27,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -42,7 +42,7 @@
...
@@ -42,7 +42,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -57,7 +57,7 @@
...
@@ -57,7 +57,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -72,7 +72,7 @@
...
@@ -72,7 +72,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -87,7 +87,7 @@
...
@@ -87,7 +87,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -102,7 +102,7 @@
...
@@ -102,7 +102,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -117,7 +117,7 @@
...
@@ -117,7 +117,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -132,7 +132,7 @@
...
@@ -132,7 +132,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -147,7 +147,7 @@
...
@@ -147,7 +147,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -162,7 +162,7 @@
...
@@ -162,7 +162,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -177,7 +177,7 @@
...
@@ -177,7 +177,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -192,7 +192,7 @@
...
@@ -192,7 +192,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -207,7 +207,7 @@
...
@@ -207,7 +207,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -222,7 +222,7 @@
...
@@ -222,7 +222,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -237,7 +237,7 @@
...
@@ -237,7 +237,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -252,7 +252,7 @@
...
@@ -252,7 +252,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -267,7 +267,7 @@
...
@@ -267,7 +267,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -282,7 +282,7 @@
...
@@ -282,7 +282,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -297,7 +297,7 @@
...
@@ -297,7 +297,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -312,7 +312,7 @@
...
@@ -312,7 +312,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -327,7 +327,7 @@
...
@@ -327,7 +327,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -342,7 +342,7 @@
...
@@ -342,7 +342,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -357,7 +357,7 @@
...
@@ -357,7 +357,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -372,7 +372,7 @@
...
@@ -372,7 +372,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -387,7 +387,7 @@
...
@@ -387,7 +387,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -402,7 +402,7 @@
...
@@ -402,7 +402,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -417,7 +417,7 @@
...
@@ -417,7 +417,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -432,7 +432,7 @@
...
@@ -432,7 +432,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -447,7 +447,7 @@
...
@@ -447,7 +447,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -462,7 +462,7 @@
...
@@ -462,7 +462,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -477,7 +477,7 @@
...
@@ -477,7 +477,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -492,7 +492,7 @@
...
@@ -492,7 +492,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -507,7 +507,7 @@
...
@@ -507,7 +507,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -522,7 +522,7 @@
...
@@ -522,7 +522,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -537,7 +537,7 @@
...
@@ -537,7 +537,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -552,7 +552,7 @@
...
@@ -552,7 +552,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -567,7 +567,7 @@
...
@@ -567,7 +567,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -582,7 +582,7 @@
...
@@ -582,7 +582,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
},
},
{
{
"choices"
:
[
"choices"
:
[
...
@@ -597,6 +597,6 @@
...
@@ -597,6 +597,6 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
}
}
]
]
integration-tests/models/__snapshots__/test_completion_prompts/test_flash_llama_completion_single_prompt.json
View file @
2d0a7173
...
@@ -11,7 +11,7 @@
...
@@ -11,7 +11,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
5
,
"completion_tokens"
:
5
,
"prompt_tokens"
:
6
,
"prompt_tokens"
:
6
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools.json
View file @
2d0a7173
...
@@ -30,7 +30,7 @@
...
@@ -30,7 +30,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
37
,
"completion_tokens"
:
37
,
"prompt_tokens"
:
524
,
"prompt_tokens"
:
524
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_auto.json
View file @
2d0a7173
...
@@ -30,7 +30,7 @@
...
@@ -30,7 +30,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
37
,
"completion_tokens"
:
37
,
"prompt_tokens"
:
524
,
"prompt_tokens"
:
524
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_choice.json
View file @
2d0a7173
...
@@ -30,7 +30,7 @@
...
@@ -30,7 +30,7 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
,
"system_fingerprint"
:
"2.0.
1
-native"
,
"usage"
:
{
"usage"
:
{
"completion_tokens"
:
48
,
"completion_tokens"
:
48
,
"prompt_tokens"
:
320
,
"prompt_tokens"
:
320
,
...
...
integration-tests/models/__snapshots__/test_tools_llama/test_flash_llama_grammar_tools_stream.json
View file @
2d0a7173
...
@@ -23,5 +23,5 @@
...
@@ -23,5 +23,5 @@
"id"
:
""
,
"id"
:
""
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"model"
:
"TinyLlama/TinyLlama-1.1B-Chat-v1.0"
,
"object"
:
"text_completion"
,
"object"
:
"text_completion"
,
"system_fingerprint"
:
"2.0.
0
-native"
"system_fingerprint"
:
"2.0.
1
-native"
}
}
integration-tests/pyproject.toml
View file @
2d0a7173
[tool.poetry]
[tool.poetry]
name
=
"text-generation-integration-tests"
name
=
"text-generation-integration-tests"
version
=
"2.0.
0
"
version
=
"2.0.
1
"
description
=
"Text Generation Inference integration tests"
description
=
"Text Generation Inference integration tests"
authors
=
[
"Nicolas Patry <nicolas@huggingface.co>"
]
authors
=
[
"Nicolas Patry <nicolas@huggingface.co>"
]
...
...
server/pyproject.toml
View file @
2d0a7173
[tool.poetry]
[tool.poetry]
name
=
"text-generation-server"
name
=
"text-generation-server"
version
=
"2.0.
0
"
version
=
"2.0.
1
"
description
=
"Text Generation Inference Python gRPC Server"
description
=
"Text Generation Inference Python gRPC Server"
authors
=
[
"Olivier Dehaene <olivier@huggingface.co>"
]
authors
=
[
"Olivier Dehaene <olivier@huggingface.co>"
]
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment