identity.sh 4.11 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
#!/bin/bash
# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0

# Launch script for Triton Server backend with Dynamo
# This runs the frontend and triton worker on the same node

set -e

# Setup cleanup trap
cleanup() {
    echo "Cleaning up background processes..."
    kill $FRONTEND_PID 2>/dev/null || true
    wait $FRONTEND_PID 2>/dev/null || true
    echo "Cleanup complete."
}
trap cleanup EXIT INT TERM

# Get the directory where this script is located
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
TRITON_DIR="$(dirname "$SCRIPT_DIR")"

# Default values
MODEL_NAME="identity"
MODEL_REPO="${TRITON_DIR}/model_repo"
BACKEND_DIR="${TRITON_DIR}/backends"
LOG_VERBOSE=1
28
DISCOVERY_BACKEND="${DYN_DISCOVERY_BACKEND:-file}"  # Default to file-based discovery (no etcd required)
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49

# Parse command line arguments
EXTRA_ARGS=()
while [[ $# -gt 0 ]]; do
    case $1 in
        --model-name)
            MODEL_NAME="$2"
            shift 2
            ;;
        --model-repository)
            MODEL_REPO="$2"
            shift 2
            ;;
        --backend-directory)
            BACKEND_DIR="$2"
            shift 2
            ;;
        --log-verbose)
            LOG_VERBOSE="$2"
            shift 2
            ;;
50
51
        --discovery-backend)
            DISCOVERY_BACKEND="$2"
52
53
54
55
56
57
58
59
60
61
62
63
            shift 2
            ;;
        -h|--help)
            echo "Usage: $0 [OPTIONS]"
            echo ""
            echo "Launch Triton Server backend with Dynamo frontend"
            echo ""
            echo "Options:"
            echo "  --model-name <name>         Model name to load (default: $MODEL_NAME)"
            echo "  --model-repository <path>   Path to model repository (default: $MODEL_REPO)"
            echo "  --backend-directory <path>  Path to Triton backends (default: $BACKEND_DIR)"
            echo "  --log-verbose <level>       Triton log verbosity 0-6 (default: $LOG_VERBOSE)"
64
            echo "  --discovery-backend <backend> Discovery backend: kubernetes, etcd, file, mem (default: $DISCOVERY_BACKEND)"
65
66
67
            echo "  -h, --help                  Show this help message"
            echo ""
            echo "Environment variables:"
68
            echo "  DYN_DISCOVERY_BACKEND  Discovery backend (default: file)"
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
            echo "  DYN_HTTP_PORT    Frontend HTTP port (default: 8000)"
            echo "  DYN_SYSTEM_PORT  Worker metrics port (default: 8081)"
            echo ""
            echo "Ports:"
            echo "  HTTP:  8000 (configurable via DYN_HTTP_PORT)"
            echo "  gRPC:  8787 (KServe gRPC for tensor models)"
            echo ""
            echo "Additional arguments will be passed to tritonworker.py"
            exit 0
            ;;
        *)
            EXTRA_ARGS+=("$1")
            shift
            ;;
    esac
done

# Validate paths
if [[ ! -d "$MODEL_REPO" ]]; then
    echo "Error: Model repository not found: $MODEL_REPO"
    exit 1
fi

if [[ ! -d "$BACKEND_DIR" ]]; then
    echo "Error: Backend directory not found: $BACKEND_DIR"
    exit 1
fi

echo "=== Triton Server with Dynamo ==="
echo "Model name:       $MODEL_NAME"
echo "Model repository: $MODEL_REPO"
echo "Backend directory: $BACKEND_DIR"
echo "Log verbose:      $LOG_VERBOSE"
102
echo "Discovery:        $DISCOVERY_BACKEND"
103
104
105
106
107
echo ""

# Set library path for Triton
export LD_LIBRARY_PATH="${TRITON_DIR}/lib:${BACKEND_DIR}:${LD_LIBRARY_PATH:-}"

108
109
# Export discovery backend setting for worker (read by @dynamo_worker decorator)
export DYN_DISCOVERY_BACKEND="$DISCOVERY_BACKEND"
110
111
112
113

# Run frontend in background
# --kserve-grpc-server enables the KServe gRPC endpoint for tensor models
echo "Starting Dynamo frontend..."
114
python3 -m dynamo.frontend --kserve-grpc-server --discovery-backend "$DISCOVERY_BACKEND" &
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
FRONTEND_PID=$!

# Give frontend time to start
sleep 2

# Run triton worker in foreground
echo "Starting Triton worker..."
DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT:-8081} \
python3 "${TRITON_DIR}/src/tritonworker.py" \
    --model-name "$MODEL_NAME" \
    --model-repository "$MODEL_REPO" \
    --backend-directory "$BACKEND_DIR" \
    --log-verbose "$LOG_VERBOSE" \
    "${EXTRA_ARGS[@]}"