"vscode:/vscode.git/clone" did not exist on "7eef9ac3328f674baf9c42ac857c7571ab04986f"
Unverified commit efa647b7, authored by Graham King, committed by GitHub
Browse files

fix(dynamo-run): Fix naming the model in single-process mode (#3955)


Signed-off-by: Graham King <grahamk@nvidia.com>
parent a430bbb6
......@@ -174,8 +174,8 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul
let engine = Arc::new(StreamingEngineAdapter::new(engine));
let manager = http_service.model_manager();
let checksum = model.card().mdcsum();
manager.add_completions_model(model.service_name(), checksum, engine.clone())?;
manager.add_chat_completions_model(model.service_name(), checksum, engine)?;
manager.add_completions_model(model.display_name(), checksum, engine.clone())?;
manager.add_chat_completions_model(model.display_name(), checksum, engine)?;
// Enable all endpoints
for endpoint_type in EndpointType::all() {
......@@ -199,14 +199,14 @@ pub async fn run(runtime: Runtime, engine_config: EngineConfig) -> anyhow::Resul
NvCreateChatCompletionStreamResponse,
>(model.card(), inner_engine.clone(), tokenizer_hf.clone())
.await?;
manager.add_chat_completions_model(model.service_name(), checksum, chat_pipeline)?;
manager.add_chat_completions_model(model.display_name(), checksum, chat_pipeline)?;
let cmpl_pipeline = common::build_pipeline::<
NvCreateCompletionRequest,
NvCreateCompletionResponse,
>(model.card(), inner_engine, tokenizer_hf)
.await?;
manager.add_completions_model(model.service_name(), checksum, cmpl_pipeline)?;
manager.add_completions_model(model.display_name(), checksum, cmpl_pipeline)?;
// Enable all endpoints
for endpoint_type in EndpointType::all() {
http_service.enable_model_endpoint(endpoint_type, true);
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment