|
35 | 35 | class OpenAIDisaggServer: |
36 | 36 |
|
37 | 37 | def __init__(self, |
38 | | - ctx_servers: List[str] = None, |
39 | | - gen_servers: List[str] = None, |
| 38 | + ctx_servers: List[str], |
| 39 | + gen_servers: List[str], |
40 | 40 | req_timeout_secs: int = 180, |
41 | 41 | server_start_timeout_secs: int = 180, |
42 | 42 | ctx_router_config: Optional[RouterConfig] = None, |
43 | 43 | gen_router_config: Optional[RouterConfig] = None, |
44 | 44 | conditional_disagg_config: Optional[ConditionalDisaggConfig] = None, |
45 | | - metadata_server_cfg: MetadataServerConfig = None): |
| 45 | + metadata_server_cfg: Optional[MetadataServerConfig] = None): |
46 | 46 |
|
47 | 47 | self.ctx_servers = ctx_servers |
48 | 48 | self.gen_servers = gen_servers |
49 | 49 | self.metadata_server = create_metadata_server(metadata_server_cfg) |
50 | | - self.ctx_router = create_router(ctx_router_config, ctx_servers, self.metadata_server) |
51 | | - self.gen_router = create_router(gen_router_config, gen_servers, self.metadata_server) |
| 50 | + self.ctx_router = create_router(ctx_router_config, ctx_servers, metadata_server_cfg, self.metadata_server) |
| 51 | + self.gen_router = create_router(gen_router_config, gen_servers, metadata_server_cfg, self.metadata_server) |
52 | 52 | self.conditional_disagg_config = conditional_disagg_config |
53 | 53 |
|
54 | 54 |
|
@@ -76,8 +76,8 @@ async def lifespan(app: FastAPI): |
76 | 76 |
|
77 | 77 | if self.metadata_server: |
78 | 78 | logger.info("Starting server monitoring via metadata service") |
79 | | - await self.ctx_router.start_server_monitoring() |
80 | | - await self.gen_router.start_server_monitoring() |
| 79 | + await self.ctx_router.start_server_monitoring(metadata_server_cfg.refresh_interval) |
| 80 | + await self.gen_router.start_server_monitoring(metadata_server_cfg.refresh_interval) |
81 | 81 |
|
82 | 82 | yield |
83 | 83 |
|
|
0 commit comments