Commit efa647b7 (unverified), authored by Graham King, committed by GitHub
Browse files

fix(dynamo-run): Fix naming the model in single-process mode (#3955)


Signed-off-by: Graham King <grahamk@nvidia.com>
parent a430bbb6
...@@ -174,8 +174,8 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul ...@@ -174,8 +174,8 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul
let engine = Arc::new(StreamingEngineAdapter::new(engine)); let engine = Arc::new(StreamingEngineAdapter::new(engine));
let manager = http_service.model_manager(); let manager = http_service.model_manager();
let checksum = model.card().mdcsum(); let checksum = model.card().mdcsum();
manager.add_completions_model(model.service_name(), checksum, engine.clone())?; manager.add_completions_model(model.display_name(), checksum, engine.clone())?;
manager.add_chat_completions_model(model.service_name(), checksum, engine)?; manager.add_chat_completions_model(model.display_name(), checksum, engine)?;
// Enable all endpoints // Enable all endpoints
for endpoint_type in EndpointType::all() { for endpoint_type in EndpointType::all() {
...@@ -199,14 +199,14 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul ...@@ -199,14 +199,14 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul
NvCreateChatCompletionStreamResponse, NvCreateChatCompletionStreamResponse,
>(model.card(), inner_engine.clone(), tokenizer_hf.clone()) >(model.card(), inner_engine.clone(), tokenizer_hf.clone())
.await?; .await?;
manager.add_chat_completions_model(model.service_name(), checksum, chat_pipeline)?; manager.add_chat_completions_model(model.display_name(), checksum, chat_pipeline)?;
let cmpl_pipeline = common::build_pipeline::< let cmpl_pipeline = common::build_pipeline::<
NvCreateCompletionRequest, NvCreateCompletionRequest,
NvCreateCompletionResponse, NvCreateCompletionResponse,
>(model.card(), inner_engine, tokenizer_hf) >(model.card(), inner_engine, tokenizer_hf)
.await?; .await?;
manager.add_completions_model(model.service_name(), checksum, cmpl_pipeline)?; manager.add_completions_model(model.display_name(), checksum, cmpl_pipeline)?;
// Enable all endpoints // Enable all endpoints
for endpoint_type in EndpointType::all() { for endpoint_type in EndpointType::all() {
http_service.enable_model_endpoint(endpoint_type, true); http_service.enable_model_endpoint(endpoint_type, true);
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment