push.rs 6.62 KB
Newer Older
1
2
3
4
5
6
7
8
9
10
11
12
13
14
// SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
// SPDX-License-Identifier: Apache-2.0
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
Ryan Olson's avatar
Ryan Olson committed
15
16
17

use anyhow::Result;
use async_nats::client::Client;
18
use tracing as log;
Ryan Olson's avatar
Ryan Olson committed
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88

use super::*;

/// Describes the request side of an exchange in a [`RequestControlMessage`].
///
/// Variants are serialized with snake_case names (`single_in`, `many_in`) because of the
/// `rename_all` attribute on this enum.
///
/// NOTE(review): presumably `SingleIn` means one request message and `ManyIn` a stream of
/// request messages -- confirm against the receiving side.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
enum RequestType {
    SingleIn,
    ManyIn,
}

/// Describes the response side of an exchange in a [`RequestControlMessage`].
///
/// Variants are serialized with snake_case names (`single_out`, `many_out`) because of the
/// `rename_all` attribute on this enum.
///
/// NOTE(review): presumably `SingleOut` means one response message and `ManyOut` a stream of
/// response messages -- confirm against the receiving side.
#[derive(Debug, Clone, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
enum ResponseType {
    SingleOut,
    ManyOut,
}

/// Control ("header") part of the two-part message sent for each request.
///
/// In this file it is serialized to JSON and paired with the JSON-serialized request payload
/// before being sent over the request transport.
#[derive(Debug, Clone, Serialize, Deserialize)]
struct RequestControlMessage {
    // Request identifier; `generate` fills this from the engine context id.
    id: String,
    // Request-side shape of the exchange.
    request_type: RequestType,
    // Response-side shape of the exchange.
    response_type: ResponseType,
    // Connection details produced when the response stream is registered with the
    // response transport.
    connection_info: ConnectionInfo,
}

/// Shared, type-erased engine that takes a single [`AddressedRequest`] carrying an `In`
/// payload and produces a `ManyOut<Out>` response.
pub type PushRouter<In, Out> =
    Arc<dyn AsyncEngine<SingleIn<AddressedRequest<In>>, ManyOut<Out>, Error>>;

/// A request payload paired with the address it should be sent to.
///
/// `Debug` and `Clone` are derived so the value can be logged and duplicated whenever the
/// payload type `T` supports it; the derives place no bound on `T` for the type itself.
#[derive(Debug, Clone)]
pub struct AddressedRequest<T> {
    /// The payload to deliver.
    request: T,
    /// Destination of the payload; the push router passes this string to the request
    /// transport as the target of the request.
    address: String,
}

impl<T> AddressedRequest<T> {
    /// Pairs `request` with the destination `address`.
    pub fn new(request: T, address: String) -> Self {
        Self { request, address }
    }

    /// Consumes the value and returns `(request, address)`.
    fn into_parts(self) -> (T, String) {
        (self.request, self.address)
    }
}

/// Router that sends each request to an explicit address over the request transport and
/// receives the responses over a separately registered response stream.
pub struct AddressedPushRouter {
    // Client used to issue the encoded request to the target address.
    // todo: generalize with a generic
    req_transport: Client,

    // TCP stream server with which the response stream for each request is registered.
    // todo: generalize with a generic
    resp_transport: Arc<tcp::server::TcpStreamServer>,
}

impl AddressedPushRouter {
    /// Builds a router from its two transports and hands it back behind an [`Arc`].
    ///
    /// `req_transport` is the client used to send requests; `resp_transport` is the TCP
    /// stream server used to receive responses. The current implementation always
    /// returns `Ok`.
    pub fn new(
        req_transport: Client,
        resp_transport: Arc<tcp::server::TcpStreamServer>,
    ) -> Result<Arc<Self>> {
        let router = Self {
            req_transport,
            resp_transport,
        };

        Ok(Arc::new(router))
    }
}

#[async_trait]
impl<T, U> AsyncEngine<SingleIn<AddressedRequest<T>>, ManyOut<U>, Error> for AddressedPushRouter
where
    T: Data + Serialize,
    U: Data + for<'de> Deserialize<'de>,
{
    async fn generate(&self, request: SingleIn<AddressedRequest<T>>) -> Result<ManyOut<U>, Error> {
89
        let request_id = request.context().id().to_string();
Ryan Olson's avatar
Ryan Olson committed
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
        let (addressed_request, context) = request.transfer(());
        let (request, address) = addressed_request.into_parts();
        let engine_ctx = context.context();

        // registration options for the data plane in a singe in / many out configuration
        let options = StreamOptions::builder()
            .context(engine_ctx.clone())
            .enable_request_stream(false)
            .enable_response_stream(true)
            .build()
            .unwrap();

        // register our needs with the data plane
        // todo - generalize this with a generic data plane object which hides the specific transports
        let pending_connections: PendingConnections = self.resp_transport.register(options).await;

        // validate and unwrap the RegisteredStream object
        let pending_response_stream = match pending_connections.into_parts() {
            (None, Some(recv_stream)) => recv_stream,
            _ => {
                panic!("Invalid data plane registration for a SingleIn/ManyOut transport");
            }
        };

        // separate out the the connection info and the stream provider from the registered stream
        let (connection_info, response_stream_provider) = pending_response_stream.into_parts();

        // package up the connection info as part of the "header" component of the two part message
        // used to issue the request on the
        // todo -- this object should be automatically created by the register call, and achieved by to the two into_parts()
        // calls. all the information here is provided by the [`StreamOptions`] object and/or the dataplane object
        let control_message = RequestControlMessage {
            id: engine_ctx.id().to_string(),
            request_type: RequestType::SingleIn,
            response_type: ResponseType::ManyOut,
            connection_info,
        };

        // next build the two part message where we package the connection info and the request into
        // a single Vec<u8> that can be sent over the wire.
        // --- package this up in the WorkQueuePublisher ---
131
132
133
134
135
136
137
138
139
140
141
142
        let ctrl = match serde_json::to_vec(&control_message) {
            Ok(ctrl) => ctrl,
            Err(err) => {
                anyhow::bail!("Failed serializing RequestControlMessage to JSON array: {err}");
            }
        };
        let data = match serde_json::to_vec(&request) {
            Ok(data) => data,
            Err(err) => {
                anyhow::bail!("Failed serializing request to JSON array: {err}");
            }
        };
Ryan Olson's avatar
Ryan Olson committed
143

144
145
146
        log::trace!(
            request_id,
            "packaging two-part message; ctrl: {} bytes, data: {} bytes",
Ryan Olson's avatar
Ryan Olson committed
147
148
149
150
151
152
153
154
155
156
            ctrl.len(),
            data.len()
        );

        let msg = TwoPartMessage::from_parts(ctrl.into(), data.into());

        // the request plane / work queue should provide a two part message codec that can be used
        // or it should take a two part message directly
        // todo - update this
        let codec = TwoPartCodec::default();
157
        let buffer = codec.encode_message(msg)?;
Ryan Olson's avatar
Ryan Olson committed
158
159
160

        // TRANSPORT ABSTRACT REQUIRED - END HERE

161
        log::trace!(request_id, "enqueueing two-part message to nats");
Ryan Olson's avatar
Ryan Olson committed
162
163
164
165
166
167
168
169

        // we might need to add a timeout on this if there is no subscriber to the subject; however, I think nats
        // will handle this for us
        let _response = self
            .req_transport
            .request(address.to_string(), buffer)
            .await?;

170
        log::trace!(request_id, "awaiting transport handshake");
Ryan Olson's avatar
Ryan Olson committed
171
172
173
174
175
176
177
        let response_stream = response_stream_provider
            .await
            .map_err(|_| PipelineError::DetatchedStreamReceiver)?
            .map_err(PipelineError::ConnectionFailed)?;

        let stream = tokio_stream::wrappers::ReceiverStream::new(response_stream.rx);

178
179
180
181
182
        let stream = stream.filter_map(|msg| async move {
            match serde_json::from_slice::<U>(&msg) {
                Ok(r) => Some(r),
                Err(err) => {
                    let json_str = String::from_utf8_lossy(&msg);
183
                    log::warn!(%err, %json_str, "Failed deserializing JSON to response");
184
185
186
                    None
                }
            }
Ryan Olson's avatar
Ryan Olson committed
187
188
189
190
191
        });

        Ok(ResponseStream::new(Box::pin(stream), engine_ctx))
    }
}