identity.sh 3.99 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
#!/bin/bash
# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
# SPDX-License-Identifier: Apache-2.0

# Launch script for Triton Server backend with Dynamo
# This runs the frontend and triton worker on the same node

set -e

# Setup cleanup trap
cleanup() {
    echo "Cleaning up background processes..."
    kill $FRONTEND_PID 2>/dev/null || true
    wait $FRONTEND_PID 2>/dev/null || true
    echo "Cleanup complete."
}
trap cleanup EXIT INT TERM

# Get the directory where this script is located
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
TRITON_DIR="$(dirname "$SCRIPT_DIR")"

# Default values
MODEL_NAME="identity"
MODEL_REPO="${TRITON_DIR}/model_repo"
BACKEND_DIR="${TRITON_DIR}/backends"
LOG_VERBOSE=1
STORE_KV="${DYN_STORE_KV:-file}"  # Default to file-based KV (no etcd required)

# Parse command line arguments
EXTRA_ARGS=()
while [[ $# -gt 0 ]]; do
    case $1 in
        --model-name)
            MODEL_NAME="$2"
            shift 2
            ;;
        --model-repository)
            MODEL_REPO="$2"
            shift 2
            ;;
        --backend-directory)
            BACKEND_DIR="$2"
            shift 2
            ;;
        --log-verbose)
            LOG_VERBOSE="$2"
            shift 2
            ;;
        --store-kv)
            STORE_KV="$2"
            shift 2
            ;;
        -h|--help)
            echo "Usage: $0 [OPTIONS]"
            echo ""
            echo "Launch Triton Server backend with Dynamo frontend"
            echo ""
            echo "Options:"
            echo "  --model-name <name>         Model name to load (default: $MODEL_NAME)"
            echo "  --model-repository <path>   Path to model repository (default: $MODEL_REPO)"
            echo "  --backend-directory <path>  Path to Triton backends (default: $BACKEND_DIR)"
            echo "  --log-verbose <level>       Triton log verbosity 0-6 (default: $LOG_VERBOSE)"
            echo "  --store-kv <backend>        KV store backend: file, etcd, mem (default: $STORE_KV)"
            echo "  -h, --help                  Show this help message"
            echo ""
            echo "Environment variables:"
            echo "  DYN_STORE_KV     KV store backend (default: file)"
            echo "  DYN_HTTP_PORT    Frontend HTTP port (default: 8000)"
            echo "  DYN_SYSTEM_PORT  Worker metrics port (default: 8081)"
            echo ""
            echo "Ports:"
            echo "  HTTP:  8000 (configurable via DYN_HTTP_PORT)"
            echo "  gRPC:  8787 (KServe gRPC for tensor models)"
            echo ""
            echo "Additional arguments will be passed to tritonworker.py"
            exit 0
            ;;
        *)
            EXTRA_ARGS+=("$1")
            shift
            ;;
    esac
done

# Validate paths
if [[ ! -d "$MODEL_REPO" ]]; then
    echo "Error: Model repository not found: $MODEL_REPO"
    exit 1
fi

if [[ ! -d "$BACKEND_DIR" ]]; then
    echo "Error: Backend directory not found: $BACKEND_DIR"
    exit 1
fi

echo "=== Triton Server with Dynamo ==="
echo "Model name:       $MODEL_NAME"
echo "Model repository: $MODEL_REPO"
echo "Backend directory: $BACKEND_DIR"
echo "Log verbose:      $LOG_VERBOSE"
echo "KV store:         $STORE_KV"
echo ""

# Set library path for Triton
export LD_LIBRARY_PATH="${TRITON_DIR}/lib:${BACKEND_DIR}:${LD_LIBRARY_PATH:-}"

# Export KV store setting for worker (read by @dynamo_worker decorator)
export DYN_STORE_KV="$STORE_KV"

# Run frontend in background
# --kserve-grpc-server enables the KServe gRPC endpoint for tensor models
echo "Starting Dynamo frontend..."
python3 -m dynamo.frontend --kserve-grpc-server --store-kv "$STORE_KV" &
FRONTEND_PID=$!

# Give frontend time to start
sleep 2

# Run triton worker in foreground
echo "Starting Triton worker..."
DYN_SYSTEM_PORT=${DYN_SYSTEM_PORT:-8081} \
python3 "${TRITON_DIR}/src/tritonworker.py" \
    --model-name "$MODEL_NAME" \
    --model-repository "$MODEL_REPO" \
    --backend-directory "$BACKEND_DIR" \
    --log-verbose "$LOG_VERBOSE" \
    "${EXTRA_ARGS[@]}"