middle_server.py 2.22 KB
Newer Older
1
# SPDX-FileCopyrightText: Copyright (c) 2025-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
# SPDX-License-Identifier: Apache-2.0

"""
Middle server demonstration that proxies requests to backend servers
using round_robin() and passes context for cancellation support
"""

import asyncio

from dynamo._core import DistributedRuntime


class MiddleServer:
    """Middle server that forwards requests to backend servers"""

    def __init__(self, runtime):
        self.runtime = runtime
        self.backend_client = None

    async def initialize(self):
        """Initialize connection to backend servers"""
        # Connect to backend servers
24
        endpoint = self.runtime.endpoint("demo.server.generate")
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
        self.backend_client = await endpoint.client()
        await self.backend_client.wait_for_instances()
        print("Middle server: Connected to backend servers")

    async def generate(self, request, context):
        """Forward request to backend using round_robin and pass context"""
        print("Middle server: Received request, forwarding to backend")

        assert self.backend_client is not None, "Did you call initialize()?"

        # Forward request to backend using round_robin with the same context
        # This passes the cancellation context through to the backend
        stream = await self.backend_client.generate(request, context=context)

        # Stream responses back to client
40
41
42
43
44
45
        async for response in stream:
            data = response.data()
            print(f"Middle server: Forwarding response {data}")
            yield data

        print("Middle server: Backend stream ended")
46
47
48
49
50


async def main():
    """Start the middle server"""
    loop = asyncio.get_running_loop()
51
    runtime = DistributedRuntime(loop, "file", "nats")
52
53
54
55
56

    # Create middle server handler
    handler = MiddleServer(runtime)
    await handler.initialize()

57
58
    # Create middle server endpoint
    endpoint = runtime.endpoint("demo.middle.generate")
59
60
61
62
63
64
65
66
67
68
69
70

    print("Middle server started")
    print("Forwarding requests to backend servers...")

    # Serve the endpoint - this blocks until shutdown
    await endpoint.serve_endpoint(handler.generate)

    runtime.shutdown()


if __name__ == "__main__":
    asyncio.run(main())