factory.rs 6.6 KB
Newer Older
1
2
//! Factory for creating router instances

3
use super::{
4
    http::{openai_router::OpenAIRouter, pd_router::PDRouter, router::Router},
5
6
    RouterTrait,
};
7
use crate::config::{ConnectionMode, PolicyConfig, RoutingMode};
8
use crate::policies::PolicyFactory;
9
10
use crate::server::AppContext;
use std::sync::Arc;
11
12
13
14
15

/// Factory for creating router instances based on configuration.
///
/// This is a field-less unit type: it holds no state and acts purely as a
/// namespace for the associated (non-`self`) constructor functions defined in
/// its `impl` block.
pub struct RouterFactory;

impl RouterFactory {
16
    /// Create a router instance from application context
17
    pub async fn create_router(ctx: &Arc<AppContext>) -> Result<Box<dyn RouterTrait>, String> {
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
        // Check connection mode and route to appropriate implementation
        match ctx.router_config.connection_mode {
            ConnectionMode::Grpc => {
                // Route to gRPC implementation based on routing mode
                match &ctx.router_config.mode {
                    RoutingMode::Regular { worker_urls } => {
                        Self::create_grpc_router(worker_urls, &ctx.router_config.policy, ctx).await
                    }
                    RoutingMode::PrefillDecode {
                        prefill_urls,
                        decode_urls,
                        prefill_policy,
                        decode_policy,
                    } => {
                        Self::create_grpc_pd_router(
                            prefill_urls,
                            decode_urls,
                            prefill_policy.as_ref(),
                            decode_policy.as_ref(),
                            &ctx.router_config.policy,
                            ctx,
                        )
                        .await
                    }
42
43
44
                    RoutingMode::OpenAI { .. } => {
                        Err("OpenAI mode requires HTTP connection_mode".to_string())
                    }
45
                }
46
            }
47
48
49
50
            ConnectionMode::Http => {
                // Route to HTTP implementation based on routing mode
                match &ctx.router_config.mode {
                    RoutingMode::Regular { worker_urls } => {
51
                        Self::create_regular_router(worker_urls, ctx).await
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
                    }
                    RoutingMode::PrefillDecode {
                        prefill_urls,
                        decode_urls,
                        prefill_policy,
                        decode_policy,
                    } => {
                        Self::create_pd_router(
                            prefill_urls,
                            decode_urls,
                            prefill_policy.as_ref(),
                            decode_policy.as_ref(),
                            &ctx.router_config.policy,
                            ctx,
                        )
                        .await
                    }
69
70
71
                    RoutingMode::OpenAI { worker_urls, .. } => {
                        Self::create_openai_router(worker_urls.clone(), ctx).await
                    }
72
                }
73
            }
74
75
76
        }
    }

77
78
    /// Create a regular router
    pub async fn create_regular_router(
79
        worker_urls: &[String],
80
        ctx: &Arc<AppContext>,
81
    ) -> Result<Box<dyn RouterTrait>, String> {
82
83
        // Create regular router with context
        let router = Router::new(worker_urls.to_vec(), ctx).await?;
84
85
86
87
88

        Ok(Box::new(router))
    }

    /// Create a PD router with injected policy
89
    pub async fn create_pd_router(
90
91
        prefill_urls: &[(String, Option<u16>)],
        decode_urls: &[String],
92
93
94
        prefill_policy_config: Option<&PolicyConfig>,
        decode_policy_config: Option<&PolicyConfig>,
        main_policy_config: &PolicyConfig,
95
        ctx: &Arc<AppContext>,
96
    ) -> Result<Box<dyn RouterTrait>, String> {
97
        // Initialize policies in PolicyRegistry - use specific policies if provided, otherwise fall back to main policy
98
99
100
101
        let prefill_policy =
            PolicyFactory::create_from_config(prefill_policy_config.unwrap_or(main_policy_config));
        let decode_policy =
            PolicyFactory::create_from_config(decode_policy_config.unwrap_or(main_policy_config));
102

103
104
105
106
107
108
        // Set the prefill and decode policies in the registry
        ctx.policy_registry.set_prefill_policy(prefill_policy);
        ctx.policy_registry.set_decode_policy(decode_policy);

        // Create PD router with context (policies are in PolicyRegistry)
        let router = PDRouter::new(prefill_urls.to_vec(), decode_urls.to_vec(), ctx).await?;
109
110
111

        Ok(Box::new(router))
    }
112

113
114
    /// Create a gRPC router with injected policy
    pub async fn create_grpc_router(
115
116
117
        worker_urls: &[String],
        policy_config: &PolicyConfig,
        ctx: &Arc<AppContext>,
118
    ) -> Result<Box<dyn RouterTrait>, String> {
119
120
121
122
123
        use super::grpc::router::GrpcRouter;

        // Create policy
        let policy = PolicyFactory::create_from_config(policy_config);

124
125
        // Create gRPC router with context
        let router = GrpcRouter::new(worker_urls.to_vec(), policy, ctx).await?;
126
127

        Ok(Box::new(router))
128
129
    }

130
    /// Create a gRPC PD router with tokenizer and worker configuration
131
    pub async fn create_grpc_pd_router(
132
133
134
135
136
137
        prefill_urls: &[(String, Option<u16>)],
        decode_urls: &[String],
        prefill_policy_config: Option<&PolicyConfig>,
        decode_policy_config: Option<&PolicyConfig>,
        main_policy_config: &PolicyConfig,
        ctx: &Arc<AppContext>,
138
    ) -> Result<Box<dyn RouterTrait>, String> {
139
140
141
142
143
144
145
146
        use super::grpc::pd_router::GrpcPDRouter;

        // Create policies - use specific policies if provided, otherwise fall back to main policy
        let prefill_policy =
            PolicyFactory::create_from_config(prefill_policy_config.unwrap_or(main_policy_config));
        let decode_policy =
            PolicyFactory::create_from_config(decode_policy_config.unwrap_or(main_policy_config));

147
        // Create gRPC PD router with context
148
149
150
151
152
        let router = GrpcPDRouter::new(
            prefill_urls.to_vec(),
            decode_urls.to_vec(),
            prefill_policy,
            decode_policy,
153
            ctx,
154
155
156
157
        )
        .await?;

        Ok(Box::new(router))
158
159
    }

160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
    /// Create an OpenAI router
    async fn create_openai_router(
        worker_urls: Vec<String>,
        ctx: &Arc<AppContext>,
    ) -> Result<Box<dyn RouterTrait>, String> {
        // Use the first worker URL as the OpenAI-compatible base
        let base_url = worker_urls
            .first()
            .cloned()
            .ok_or_else(|| "OpenAI mode requires at least one worker URL".to_string())?;

        let router =
            OpenAIRouter::new(base_url, Some(ctx.router_config.circuit_breaker.clone())).await?;

        Ok(Box::new(router))
    }
176
}