triton_echo_client.py 1.83 KB
Newer Older
1
2
3
4
5
6
7
# SPDX-FileCopyrightText: Copyright (c) 2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0


import numpy as np
import tritonclient.grpc as grpcclient

8
9
10
11
12
13
14
15
16
SERVER_URL = "localhost:8000"


def check_health():
    triton_client = grpcclient.InferenceServerClient(url=SERVER_URL)
    assert triton_client.is_server_live()
    assert triton_client.is_server_ready()
    assert triton_client.is_model_ready("echo")

17
18

def run_infer():
19
    triton_client = grpcclient.InferenceServerClient(url=SERVER_URL)
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48

    model_name = "echo"

    # Infer
    inputs = []
    inputs.append(grpcclient.InferInput("INPUT0", [16], "INT32"))
    inputs.append(grpcclient.InferInput("INPUT1", [16], "BYTES"))

    # Create the data for the two input tensors. Initialize the first
    # to unique integers and the second to all ones.
    input0_data = np.arange(start=0, stop=16, dtype=np.int32).reshape([16])
    input1_data = np.array(
        [str(x).encode("utf-8") for x in input0_data.reshape(input0_data.size)],
        dtype=np.object_,
    ).reshape([16])

    # Initialize the data
    inputs[0].set_data_from_numpy(input0_data)
    inputs[1].set_data_from_numpy(input1_data)

    # Test with outputs
    results = triton_client.infer(model_name=model_name, inputs=inputs)

    # Get the output arrays from the results
    output0_data = results.as_numpy("INPUT0")
    output1_data = results.as_numpy("INPUT1")

    assert np.array_equal(input0_data, output0_data)
    assert np.array_equal(input1_data, output1_data)
49
50
51


def get_config():
52
    triton_client = grpcclient.InferenceServerClient(url=SERVER_URL)
53
54
55
56
57

    model_name = "echo"
    response = triton_client.get_model_config(model_name=model_name)
    # Check one of the field that can only be set by providing Triton model config
    assert response.config.model_transaction_policy.decoupled