component.rs 18.5 KB
Newer Older
1
2
// SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
// SPDX-License-Identifier: Apache-2.0
Ryan Olson's avatar
Ryan Olson committed
3
4
5

//! The [Component] module defines the top-level API for building distributed applications.
//!
Graham King's avatar
Graham King committed
6
7
8
//! A distributed application consists of a set of [Component] that can host one
//! or more [Endpoint]. Each [Endpoint] is a network-accessible service
//! that can be accessed by other [Component] in the distributed application.
Ryan Olson's avatar
Ryan Olson committed
9
10
11
12
//!
//! A [Component] is made discoverable by registering it with the distributed runtime under
//! a [`Namespace`].
//!
Graham King's avatar
Graham King committed
13
//! A [`Namespace`] is a logical grouping of related [Component].
Ryan Olson's avatar
Ryan Olson committed
14
15
16
17
18
19
20
21
22
23
24
25
//!
//! We might extend namespace to include grouping behavior, which would define groups of
//! components that are tightly coupled.
//!
//! A [Component] is the core building block of a distributed application. It is a logical
//! unit of work such as a `Preprocessor` or `SmartRouter` that has a well-defined role in the
//! distributed application.
//!
//! A [Component] can present to the distributed application one or more configuration files
//! which define how that component was constructed/configured and what capabilities it can
//! provide.
//!
Graham King's avatar
Graham King committed
26
//! Other [Component] can write to watched locations within a [Component]'s etcd
Ryan Olson's avatar
Ryan Olson committed
27
28
29
30
31
//! path. This allows the [Component] to take dynamic actions depending on the watch
//! triggers.
//!
//! TODO: Top-level Overview of Endpoints/Functions

32
33
use std::fmt;

34
use crate::{
35
36
    config::HealthStatus,
    distributed::RequestPlaneMode,
37
    metrics::{MetricsHierarchy, MetricsRegistry, prometheus_names},
38
    service::ServiceClient,
39
    service::ServiceSet,
40
};
Ryan Olson's avatar
Ryan Olson committed
41

42
use super::{DistributedRuntime, Runtime, traits::*, transports::nats::Slug, utils::Duration};
Ryan Olson's avatar
Ryan Olson committed
43

44
use crate::pipeline::network::{PushWorkHandler, ingress::push_endpoint::PushEndpoint};
45
use crate::protocols::EndpointId;
46
use crate::service::ComponentNatsServerPrometheusMetrics;
Ryan Olson's avatar
Ryan Olson committed
47
48
49
50
51
52
53
54
use async_nats::{
    rustls::quic,
    service::{Service, ServiceExt},
};
use derive_builder::Builder;
use derive_getters::Getters;
use educe::Educe;
use serde::{Deserialize, Serialize};
55
use service::EndpointStatsHandler;
56
use std::{collections::HashMap, hash::Hash, sync::Arc};
Ryan Olson's avatar
Ryan Olson committed
57
58
59
use validator::{Validate, ValidationError};

mod client;
60
61
#[allow(clippy::module_inception)]
mod component;
Ryan Olson's avatar
Ryan Olson committed
62
mod endpoint;
Ryan Olson's avatar
Ryan Olson committed
63
mod namespace;
Ryan Olson's avatar
Ryan Olson committed
64
mod registry;
65
pub mod service;
Ryan Olson's avatar
Ryan Olson committed
66

67
pub use client::Client;
68

69
#[derive(Debug, Clone, Serialize, Deserialize, Eq, PartialEq, Hash)]
Ryan Olson's avatar
Ryan Olson committed
70
71
#[serde(rename_all = "snake_case")]
pub enum TransportType {
72
73
74
75
    #[serde(rename = "nats_tcp")]
    Nats(String),
    Http(String),
    Tcp(String),
Ryan Olson's avatar
Ryan Olson committed
76
77
}

78
79
#[derive(Default)]
pub struct RegistryInner {
80
81
82
    pub(crate) services: HashMap<String, Service>,
    pub(crate) stats_handlers:
        HashMap<String, Arc<parking_lot::Mutex<HashMap<String, EndpointStatsHandler>>>>,
83
84
}

Ryan Olson's avatar
Ryan Olson committed
85
86
#[derive(Clone)]
pub struct Registry {
87
    pub(crate) inner: Arc<tokio::sync::Mutex<RegistryInner>>,
Ryan Olson's avatar
Ryan Olson committed
88
89
}

90
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
91
pub struct Instance {
Ryan Olson's avatar
Ryan Olson committed
92
93
94
    pub component: String,
    pub endpoint: String,
    pub namespace: String,
95
    pub instance_id: u64,
Ryan Olson's avatar
Ryan Olson committed
96
97
98
    pub transport: TransportType,
}

99
impl Instance {
100
    pub fn id(&self) -> u64 {
101
        self.instance_id
102
    }
103
104
105
106
107
108
109
    pub fn endpoint_id(&self) -> EndpointId {
        EndpointId {
            namespace: self.namespace.clone(),
            component: self.component.clone(),
            name: self.endpoint.clone(),
        }
    }
110
111
}

112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
/// Formats as `namespace/component/endpoint/instance_id`.
/// The transport is not part of the rendered string.
impl fmt::Display for Instance {
    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
        let Self {
            namespace,
            component,
            endpoint,
            instance_id,
            ..
        } = self;
        write!(
            f,
            "{}/{}/{}/{}",
            namespace, component, endpoint, instance_id
        )
    }
}

/// Sort by string name.
///
/// Instances are ordered by comparing their `Display` renderings
/// lexicographically; each comparison renders both sides to a `String`.
///
/// NOTE(review): the rendering does not include `transport`, whereas the
/// derived `PartialEq`/`Eq` does, so two instances can compare `Equal` here
/// while being unequal under `==`.
impl std::cmp::Ord for Instance {
    fn cmp(&self, other: &Self) -> std::cmp::Ordering {
        let lhs = self.to_string();
        let rhs = other.to_string();
        lhs.cmp(&rhs)
    }
}

/// Partial ordering that always agrees with the total order from `Ord`.
impl PartialOrd for Instance {
    fn partial_cmp(&self, other: &Self) -> Option<std::cmp::Ordering> {
        // Delegate to `Ord`, so the result is never `None`.
        Some(Ord::cmp(self, other))
    }
}

Ryan Olson's avatar
Ryan Olson committed
136
/// A [Component] a discoverable entity in the distributed runtime.
Graham King's avatar
Graham King committed
137
138
/// You can host [Endpoint] on a [Component] by first creating
/// a [Service] then adding one or more [Endpoint] to the [Service].
Ryan Olson's avatar
Ryan Olson committed
139
140
///
/// You can also issue a request to a [Component]'s [Endpoint] by creating a [Client].
141
#[derive(Educe, Builder, Clone, Validate)]
Ryan Olson's avatar
Ryan Olson committed
142
#[educe(Debug)]
143
#[builder(pattern = "owned", build_fn(private, name = "build_internal"))]
Ryan Olson's avatar
Ryan Olson committed
144
145
146
pub struct Component {
    #[builder(private)]
    #[educe(Debug(ignore))]
147
    drt: Arc<DistributedRuntime>,
Ryan Olson's avatar
Ryan Olson committed
148
149
150

    /// Name of the component
    #[builder(setter(into))]
151
    #[validate(custom(function = "validate_allowed_chars"))]
Ryan Olson's avatar
Ryan Olson committed
152
153
    name: String,

154
155
156
157
    /// Additional labels for metrics
    #[builder(default = "Vec::new()")]
    labels: Vec<(String, String)>,

Ryan Olson's avatar
Ryan Olson committed
158
159
160
    // todo - restrict the namespace to a-z0-9-_A-Z
    /// Namespace
    #[builder(setter(into))]
161
    namespace: Namespace,
162

163
164
165
    /// This hierarchy's own metrics registry
    #[builder(default = "crate::MetricsRegistry::new()")]
    metrics_registry: crate::MetricsRegistry,
Ryan Olson's avatar
Ryan Olson committed
166
167
}

168
169
170
171
172
173
174
175
176
/// Hashes the fully-qualified namespace name followed by the component name,
/// the same two values compared by `PartialEq`.
impl Hash for Component {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        let namespace_name = self.namespace.name();
        Hash::hash(&namespace_name, state);
        Hash::hash(&self.name, state);
    }
}

impl PartialEq for Component {
    fn eq(&self, other: &Self) -> bool {
177
        self.namespace.name() == other.namespace.name() && self.name == other.name
178
179
180
181
182
    }
}

impl Eq for Component {}

183
184
impl std::fmt::Display for Component {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
185
        write!(f, "{}.{}", self.namespace.name(), self.name)
186
187
188
    }
}

189
190
191
192
193
194
195
196
197
198
199
200
/// Gives access to the distributed runtime this component was built with.
impl DistributedRuntimeProvider for Component {
    fn drt(&self) -> &DistributedRuntime {
        self.drt.as_ref()
    }
}

/// Exposes the [`Runtime`] by delegating to the component's distributed runtime.
impl RuntimeProvider for Component {
    fn rt(&self) -> &Runtime {
        self.drt.rt()
    }
}

201
impl MetricsHierarchy for Component {
202
203
204
205
    fn basename(&self) -> String {
        self.name.clone()
    }

206
207
208
209
210
211
212
213
214
215
216
217
218
219
    fn parent_hierarchies(&self) -> Vec<&dyn MetricsHierarchy> {
        let mut parents = vec![];

        // Get all ancestors of namespace (DRT, parent namespaces, etc.)
        parents.extend(self.namespace.parent_hierarchies());

        // Add namespace itself
        parents.push(&self.namespace as &dyn MetricsHierarchy);

        parents
    }

    fn get_metrics_registry(&self) -> &MetricsRegistry {
        &self.metrics_registry
220
221
222
    }
}

Ryan Olson's avatar
Ryan Olson committed
223
impl Component {
224
    pub fn service_name(&self) -> String {
225
        let service_name = format!("{}_{}", self.namespace.name(), self.name);
226
        Slug::slugify(&service_name).to_string()
Ryan Olson's avatar
Ryan Olson committed
227
228
    }

229
    /// The [`Namespace`] this component belongs to.
    pub fn namespace(&self) -> &Namespace {
        &self.namespace
    }

233
234
    pub fn name(&self) -> &str {
        &self.name
235
236
    }

237
238
239
240
    /// Additional metric labels attached to this component, as `(String, String)` pairs.
    pub fn labels(&self) -> &[(String, String)] {
        self.labels.as_slice()
    }

Ryan Olson's avatar
Ryan Olson committed
241
242
243
244
    pub fn endpoint(&self, endpoint: impl Into<String>) -> Endpoint {
        Endpoint {
            component: self.clone(),
            name: endpoint.into(),
245
            labels: Vec::new(),
246
            metrics_registry: crate::MetricsRegistry::new(),
Ryan Olson's avatar
Ryan Olson committed
247
248
249
        }
    }

250
    /// Lists the endpoint instances registered for this component.
    ///
    /// Queries discovery for all endpoints of this namespace/component, keeps
    /// only the `Endpoint` results, and returns them sorted by [`Instance`]'s
    /// ordering.
    ///
    /// # Errors
    /// Propagates any error returned by the discovery `list` call.
    pub async fn list_instances(&self) -> anyhow::Result<Vec<Instance>> {
        let discovery = self.drt.discovery();

        let query = crate::discovery::DiscoveryQuery::ComponentEndpoints {
            namespace: self.namespace.name(),
            component: self.name.clone(),
        };
        let discovered = discovery.list(query).await?;

        // Unwrap the `Endpoint` variant; every other variant (ModelCard, etc.) is ignored.
        let mut instances: Vec<Instance> = Vec::new();
        for entry in discovered {
            if let crate::discovery::DiscoveryInstance::Endpoint(instance) = entry {
                instances.push(instance);
            }
        }

        instances.sort();
        Ok(instances)
    }

273
274
    /// Scrape ServiceSet, which contains NATS stats as well as user defined stats
    /// embedded in data field of ServiceInfo.
275
    async fn scrape_stats(&self, timeout: Duration) -> anyhow::Result<ServiceSet> {
276
        // Debug: scraping stats for component
Ryan Olson's avatar
Ryan Olson committed
277
        let service_name = self.service_name();
278
279
280
281
282
        let Some(service_client) = self
            .drt()
            .nats_client()
            .map(|nc| ServiceClient::new(nc.clone()))
        else {
283
284
            anyhow::bail!("ServiceSet is gathered via NATS, do not call this in non-NATS setups.");
        };
Ryan Olson's avatar
Ryan Olson committed
285
        service_client
286
            .collect_services(&service_name, timeout)
Ryan Olson's avatar
Ryan Olson committed
287
288
289
            .await
    }

290
    /// Add Prometheus metrics for this component's NATS service stats.
291
    ///
292
    /// Starts a background task that periodically requests service statistics from NATS
293
294
295
296
    /// and updates the corresponding Prometheus metrics. The first scrape happens immediately,
    /// then subsequent scrapes occur at a fixed interval of 9.8 seconds (MAX_WAIT_MS),
    /// which should be near or smaller than typical Prometheus scraping intervals to ensure
    /// metrics are fresh when Prometheus collects them.
297
    fn start_scraping_nats_service_component_metrics(&self) -> anyhow::Result<()> {
298
        const MAX_WAIT_MS: std::time::Duration = std::time::Duration::from_millis(9800); // Should be <= Prometheus scrape interval
299

300
301
        // If there is another component with the same service name, this will fail.
        let component_metrics = ComponentNatsServerPrometheusMetrics::new(self)?;
302
303
304

        let component_clone = self.clone();

305
306
307
308
        // Start a background task that scrapes stats every 5 seconds
        let m = component_metrics.clone();
        let c = component_clone.clone();

309
310
311
312
313
314
315
316
317
        // Use the DRT's runtime handle to spawn the background task.
        // We cannot use regular `tokio::spawn` here because:
        // 1. This method may be called from contexts without an active Tokio runtime
        //    (e.g., tests that create a DRT in a blocking context)
        // 2. Tests often create a temporary runtime just to build the DRT, then drop it
        // 3. `tokio::spawn` requires being called from within a runtime context
        // By using the DRT's own runtime handle, we ensure the task runs in the
        // correct runtime that will persist for the lifetime of the component.
        c.drt().runtime().secondary().spawn(async move {
318
319
            let timeout = std::time::Duration::from_millis(500);
            let mut interval = tokio::time::interval(MAX_WAIT_MS);
320
321
322
323
324
325
326
327
328
329
330
331
332
333
            interval.set_missed_tick_behavior(tokio::time::MissedTickBehavior::Skip);

            loop {
                match c.scrape_stats(timeout).await {
                    Ok(service_set) => {
                        m.update_from_service_set(&service_set);
                    }
                    Err(err) => {
                        tracing::error!(
                            "Background scrape failed for {}: {}",
                            c.service_name(),
                            err
                        );
                        m.reset_to_zeros();
334
335
                    }
                }
336

337
338
                interval.tick().await;
            }
339
340
341
342
343
        });

        Ok(())
    }

344
    // Gather NATS metrics
345
    async fn add_stats_service(&mut self) -> anyhow::Result<()> {
346
347
348
349
350
        let service_name = self.service_name();

        // Pre-check to save cost of creating the service, but don't hold the lock
        if self
            .drt
351
            .component_registry()
352
353
354
355
356
357
            .inner
            .lock()
            .await
            .services
            .contains_key(&service_name)
        {
358
359
360
361
            // The NATS service is per component, but it is called from `serve_endpoint`, and there
            // are often multiple endpoints for a component (e.g. `clear_kv_blocks` and `generate`).
            tracing::trace!("Service {service_name} already exists");
            return Ok(());
362
363
364
365
366
367
368
369
370
        }

        let Some(nats_client) = self.drt.nats_client() else {
            anyhow::bail!("Cannot create NATS service without NATS.");
        };
        let description = None;
        let (nats_service, stats_reg) =
            service::build_nats_service(nats_client, self, description).await?;

371
        let mut guard = self.drt.component_registry().inner.lock().await;
372
373
374
375
        if !guard.services.contains_key(&service_name) {
            // Normal case
            guard.services.insert(service_name.clone(), nats_service);
            guard.stats_handlers.insert(service_name.clone(), stats_reg);
376
377
378

            tracing::info!("Added NATS / stats service {service_name}");

379
380
381
382
            drop(guard);
        } else {
            drop(guard);
            let _ = nats_service.stop().await;
383
384
385
            // The NATS service is per component, but it is called from `serve_endpoint`, and there
            // are often multiple endpoints for a component (e.g. `clear_kv_blocks` and `generate`).
            return Ok(());
386
387
        }

388
389
390
391
392
393
        if let Err(err) = self.start_scraping_nats_service_component_metrics() {
            tracing::debug!(
                "Metrics registration failed for '{}': {}",
                self.service_name(),
                err
            );
394
395
        }
        Ok(())
Ryan Olson's avatar
Ryan Olson committed
396
397
398
399
    }
}

impl ComponentBuilder {
400
    pub fn from_runtime(drt: Arc<DistributedRuntime>) -> Self {
Ryan Olson's avatar
Ryan Olson committed
401
402
        Self::default().drt(drt)
    }
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417

    pub fn build(self) -> Result<Component, anyhow::Error> {
        let component = self.build_internal()?;
        // If this component is using NATS, gather it's metrics
        if component.drt().request_plane().is_nats() {
            let mut c = component.clone();
            // Start in the background to isolate the async, and because we don't need it yet
            component.drt().runtime().secondary().spawn(async move {
                if let Err(err) = c.add_stats_service().await {
                    tracing::error!(error = %err, component = c.service_name(), "Failed starting stats service");
                }
            });
        }
        Ok(component)
    }
Ryan Olson's avatar
Ryan Olson committed
418
419
420
421
422
423
424
425
426
}

#[derive(Debug, Clone)]
pub struct Endpoint {
    component: Component,

    // todo - restrict alphabet
    /// Endpoint name
    name: String,
427

428
429
    /// Additional labels for metrics
    labels: Vec<(String, String)>,
430
431
432

    /// This hierarchy's own metrics registry
    metrics_registry: crate::MetricsRegistry,
Ryan Olson's avatar
Ryan Olson committed
433
434
}

435
436
437
438
439
440
441
442
443
/// Hashes the owning component followed by the endpoint name, the same two
/// values compared by `PartialEq`.
impl Hash for Endpoint {
    fn hash<H: std::hash::Hasher>(&self, state: &mut H) {
        Hash::hash(&self.component, state);
        Hash::hash(&self.name, state);
    }
}

impl PartialEq for Endpoint {
    fn eq(&self, other: &Self) -> bool {
444
        self.component == other.component && self.name == other.name
445
446
447
448
449
    }
}

impl Eq for Endpoint {}

450
451
452
453
454
455
456
457
458
459
460
461
/// Exposes the distributed runtime by delegating to the owning component.
impl DistributedRuntimeProvider for Endpoint {
    fn drt(&self) -> &DistributedRuntime {
        self.component.drt()
    }
}

/// Exposes the [`Runtime`] by delegating to the owning component.
impl RuntimeProvider for Endpoint {
    fn rt(&self) -> &Runtime {
        self.component.rt()
    }
}

462
impl MetricsHierarchy for Endpoint {
463
464
465
466
    fn basename(&self) -> String {
        self.name.clone()
    }

467
468
469
470
471
472
473
474
475
476
477
478
479
480
    fn parent_hierarchies(&self) -> Vec<&dyn MetricsHierarchy> {
        let mut parents = vec![];

        // Get all ancestors of component (DRT, Namespace, etc.)
        parents.extend(self.component.parent_hierarchies());

        // Add component itself
        parents.push(&self.component as &dyn MetricsHierarchy);

        parents
    }

    fn get_metrics_registry(&self) -> &MetricsRegistry {
        &self.metrics_registry
481
482
483
    }
}

Ryan Olson's avatar
Ryan Olson committed
484
impl Endpoint {
485
486
487
488
489
490
491
492
    /// Builds the [`EndpointId`] for this endpoint from the fully-qualified
    /// namespace name, the component name and the endpoint name.
    pub fn id(&self) -> EndpointId {
        let component = self.component();
        EndpointId {
            // `Namespace::name` already returns an owned `String`.
            namespace: component.namespace().name(),
            component: component.name().to_owned(),
            name: self.name().to_owned(),
        }
    }

Ryan Olson's avatar
Ryan Olson committed
493
494
495
496
    /// The endpoint's name, without component or namespace prefix.
    pub fn name(&self) -> &str {
        self.name.as_str()
    }

497
498
499
500
    /// The [`Component`] that hosts this endpoint.
    pub fn component(&self) -> &Component {
        &self.component
    }

501
    /// Creates a [`client::Client`] for this endpoint; the client receives a
    /// clone of the endpoint.
    ///
    /// # Errors
    /// Propagates any error from `client::Client::new`.
    pub async fn client(&self) -> anyhow::Result<client::Client> {
        let endpoint = self.clone();
        client::Client::new(endpoint).await
    }

    /// Returns an endpoint config builder seeded with a clone of this endpoint.
    pub fn endpoint_builder(&self) -> endpoint::EndpointConfigBuilder {
        let endpoint = self.clone();
        endpoint::EndpointConfigBuilder::from_endpoint(endpoint)
    }
}

510
#[derive(Builder, Clone, Validate)]
Ryan Olson's avatar
Ryan Olson committed
511
512
513
#[builder(pattern = "owned")]
pub struct Namespace {
    #[builder(private)]
514
    runtime: Arc<DistributedRuntime>,
Ryan Olson's avatar
Ryan Olson committed
515

516
    #[validate(custom(function = "validate_allowed_chars"))]
Ryan Olson's avatar
Ryan Olson committed
517
    name: String,
518

519
520
    #[builder(default = "None")]
    parent: Option<Arc<Namespace>>,
521
522
523
524

    /// Additional labels for metrics
    #[builder(default = "Vec::new()")]
    labels: Vec<(String, String)>,
525
526
527
528

    /// This hierarchy's own metrics registry
    #[builder(default = "crate::MetricsRegistry::new()")]
    metrics_registry: crate::MetricsRegistry,
Ryan Olson's avatar
Ryan Olson committed
529
530
}

531
532
533
534
535
536
/// Gives access to the distributed runtime this namespace was built with.
impl DistributedRuntimeProvider for Namespace {
    fn drt(&self) -> &DistributedRuntime {
        self.runtime.as_ref()
    }
}

537
538
539
540
impl std::fmt::Debug for Namespace {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(
            f,
541
542
            "Namespace {{ name: {}; parent: {:?} }}",
            self.name, self.parent
543
544
545
546
        )
    }
}

547
548
549
550
551
552
/// Exposes the [`Runtime`] by delegating to the namespace's distributed runtime.
impl RuntimeProvider for Namespace {
    fn rt(&self) -> &Runtime {
        self.runtime.rt()
    }
}

553
554
555
556
557
558
/// Displays only this namespace's own name segment; the parent chain is not included.
impl std::fmt::Display for Namespace {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.write_str(&self.name)
    }
}

Ryan Olson's avatar
Ryan Olson committed
559
impl Namespace {
560
    pub(crate) fn new(runtime: DistributedRuntime, name: String) -> anyhow::Result<Self> {
Ryan Olson's avatar
Ryan Olson committed
561
        Ok(NamespaceBuilder::default()
562
            .runtime(Arc::new(runtime))
Ryan Olson's avatar
Ryan Olson committed
563
564
565
566
            .name(name)
            .build()?)
    }

567
    /// Create a [`Component`] in the namespace who's endpoints can be discovered with etcd
568
    pub fn component(&self, name: impl Into<String>) -> anyhow::Result<Component> {
569
        ComponentBuilder::from_runtime(self.runtime.clone())
Ryan Olson's avatar
Ryan Olson committed
570
            .name(name)
571
            .namespace(self.clone())
572
            .build()
Ryan Olson's avatar
Ryan Olson committed
573
    }
Ryan Olson's avatar
Ryan Olson committed
574

575
    /// Create a [`Namespace`] in the parent namespace
576
    pub fn namespace(&self, name: impl Into<String>) -> anyhow::Result<Namespace> {
577
578
579
580
581
582
583
584
585
586
587
588
        Ok(NamespaceBuilder::default()
            .runtime(self.runtime.clone())
            .name(name.into())
            .parent(Some(Arc::new(self.clone())))
            .build()?)
    }

    pub fn name(&self) -> String {
        match &self.parent {
            Some(parent) => format!("{}.{}", parent.name(), self.name),
            None => self.name.clone(),
        }
Ryan Olson's avatar
Ryan Olson committed
589
    }
Ryan Olson's avatar
Ryan Olson committed
590
591
592
593
594
595
596
597
598
599
600
601
602
}

// Custom validator function
/// Checks that `input` is non-empty and consists solely of lowercase ASCII
/// letters (`a-z`), ASCII digits (`0-9`), `-` and `_`.
///
/// This accepts exactly the strings matched by the pattern `^[a-z0-9-_]+$`,
/// but checks the bytes directly instead of compiling a regex on every call.
///
/// # Errors
/// Returns a `ValidationError` with code `invalid_characters` when `input` is
/// empty or contains any other character.
fn validate_allowed_chars(input: &str) -> Result<(), ValidationError> {
    // Every allowed character is single-byte ASCII; any byte of a multi-byte
    // UTF-8 sequence is >= 0x80 and therefore rejected.
    let is_allowed = |byte: u8| matches!(byte, b'a'..=b'z' | b'0'..=b'9' | b'-' | b'_');

    if !input.is_empty() && input.bytes().all(is_allowed) {
        Ok(())
    } else {
        Err(ValidationError::new("invalid_characters"))
    }
}