Skip to content

Commit dadf0e2

Browse files
authored
chore: Remove old DisaggregatedRouter, making etcd presence optional (#4011)
Signed-off-by: Graham King <[email protected]>
1 parent 30d8588 commit dadf0e2

File tree

10 files changed

+16
-376
lines changed

10 files changed

+16
-376
lines changed

lib/bindings/python/rust/lib.rs

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -150,7 +150,6 @@ fn _core(m: &Bound<'_, PyModule>) -> PyResult<()> {
150150
m.add_class::<Endpoint>()?;
151151
m.add_class::<Client>()?;
152152
m.add_class::<AsyncResponseStream>()?;
153-
m.add_class::<llm::disagg_router::DisaggregatedRouter>()?;
154153
m.add_class::<llm::entrypoint::EntrypointArgs>()?;
155154
m.add_class::<llm::entrypoint::EngineConfig>()?;
156155
m.add_class::<llm::entrypoint::EngineType>()?;

lib/bindings/python/rust/llm.rs

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -27,7 +27,6 @@
2727
use super::*;
2828

2929
pub mod backend;
30-
pub mod disagg_router;
3130
pub mod entrypoint;
3231
pub mod kv;
3332
pub mod local_model;

lib/bindings/python/rust/llm/disagg_router.rs

Lines changed: 0 additions & 58 deletions
This file was deleted.

lib/bindings/python/src/dynamo/_core.pyi

Lines changed: 0 additions & 52 deletions
Original file line numberDiff line numberDiff line change
@@ -217,58 +217,6 @@ class Client:
217217
"""
218218
...
219219

220-
class DisaggregatedRouter:
221-
"""
222-
A router that determines whether to perform prefill locally or remotely based on
223-
sequence length thresholds.
224-
"""
225-
226-
def __init__(
227-
self,
228-
drt: DistributedRuntime,
229-
model_name: str,
230-
default_max_local_prefill_length: int,
231-
) -> None:
232-
"""
233-
Create a `DisaggregatedRouter` object.
234-
235-
Args:
236-
drt: The distributed runtime instance
237-
model_name: Name of the model
238-
default_max_local_prefill_length: Default maximum sequence length that can be processed locally
239-
"""
240-
...
241-
242-
def prefill_remote(self, prefill_length: int, prefix_hit_length: int) -> bool:
243-
"""
244-
Determine if prefill should be performed remotely based on sequence lengths.
245-
246-
Args:
247-
prefill_length: Total length of the sequence to prefill
248-
prefix_hit_length: Length of the prefix that was already processed
249-
250-
Returns:
251-
True if prefill should be performed remotely, False otherwise
252-
"""
253-
...
254-
255-
def update_value(self, max_local_prefill_length: int) -> None:
256-
"""
257-
Update the maximum local prefill length threshold.
258-
259-
Args:
260-
max_local_prefill_length: New maximum sequence length that can be processed locally
261-
"""
262-
...
263-
264-
def get_model_name(self) -> str:
265-
"""
266-
Get the name of the model associated with this router.
267-
268-
Returns:
269-
The model name as a string
270-
"""
271-
...
272220

273221
def compute_block_hash_for_seq_py(tokens: List[int], kv_block_size: int) -> List[int]:
274222
"""

lib/bindings/python/src/dynamo/llm/__init__.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -6,7 +6,6 @@
66
import logging
77

88
from dynamo._core import ApproxKvIndexer as ApproxKvIndexer
9-
from dynamo._core import DisaggregatedRouter as DisaggregatedRouter
109
from dynamo._core import EngineType
1110
from dynamo._core import EntrypointArgs as EntrypointArgs
1211
from dynamo._core import ForwardPassMetrics as ForwardPassMetrics

lib/llm/src/disagg_router.rs

Lines changed: 0 additions & 250 deletions
This file was deleted.

0 commit comments

Comments
 (0)