Skip to content

Commit 53e28ab

Browse files
chore: stragglers rename (ai-dynamo#69)
Co-authored-by: Harrison King Saturley-Hall <[email protected]>
1 parent 4e8b97c commit 53e28ab

File tree

7 files changed

+9
-10
lines changed

7 files changed

+9
-10
lines changed

examples/python_rs/llm/vllm/scripts/disaggregated.sh

+2-2
Original file line numberDiff line numberDiff line change
@@ -99,7 +99,7 @@ PREFILL_CMD="VLLM_WORKER_MULTIPROC_METHOD=spawn CUDA_VISIBLE_DEVICES=0 \
9999
--max-model-len 1000 \
100100
--tensor-parallel-size 1 \
101101
--kv-transfer-config \
102-
'{\"kv_connector\":\"TritonNcclConnector\",\"kv_role\":\"kv_producer\",\"kv_rank\":0,\"kv_parallel_size\":2}'"
102+
'{\"kv_connector\":\"DynamoNcclConnector\",\"kv_role\":\"kv_producer\",\"kv_rank\":0,\"kv_parallel_size\":2}'"
103103

104104
tmux select-pane -t 2
105105
tmux send-keys "$INIT_CMD && $PREFILL_CMD" C-m
@@ -115,7 +115,7 @@ DECODE_CMD="VLLM_WORKER_MULTIPROC_METHOD=spawn CUDA_VISIBLE_DEVICES=1 \
115115
--max-model-len 1000 \
116116
--tensor-parallel-size 1 \
117117
--kv-transfer-config \
118-
'{\"kv_connector\":\"TritonNcclConnector\",\"kv_role\":\"kv_consumer\",\"kv_rank\":1,\"kv_parallel_size\":2}'"
118+
'{\"kv_connector\":\"DynamoNcclConnector\",\"kv_role\":\"kv_consumer\",\"kv_rank\":1,\"kv_parallel_size\":2}'"
119119

120120
tmux select-pane -t 3
121121
tmux send-keys "$INIT_CMD && $DECODE_CMD" C-m

examples/python_rs/llm/vllm_nixl/router/prefill_worker.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -94,7 +94,7 @@ async def worker(runtime: DistributedRuntime, engine_args: AsyncEngineArgs):
9494

9595
request_handler = RequestHandler(engine_client, metadata_store)
9696

97-
# TODO: integrate prefill_queue to an triton_distributed endpoint
97+
# TODO: integrate prefill_queue to a dynamo endpoint
9898
async with PrefillQueue.get_instance(
9999
nats_server=prefill_queue_nats_server,
100100
stream_name=prefill_queue_stream_name,

examples/python_rs/llm/vllm_nixl/router/worker.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -70,7 +70,7 @@ def __init__(
7070
print("RequestHandler initialized")
7171

7272
def get_remote_prefill_request_callback(self):
73-
# TODO: integrate prefill_queue to an triton_distributed endpoint
73+
# TODO: integrate prefill_queue to a dynamo endpoint
7474
async def callback(request: RemotePrefillRequest):
7575
async with PrefillQueue.get_instance(
7676
nats_server=self._prefill_queue_nats_server,

lib/bindings/cpp/nvllm-trt/include/nvidia/nvllm/nvllm_trt.h

+1-1
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@ nvllm_trt_engine_t nvllm_trt_engine_create(const char* config_proto);
3333
// Create a nvLLM TRT Engine from an instance of the engine
3434
// This requires the raw engine pointer to be an instantiated object at the exact same
3535
// commit version as the version of TRTLLM used to build the nvLLM C API.
36-
// This is a workaround to enable the Triton TensorRT LLM backend to use nvLLM.
36+
// This is a workaround to enable the Dynamo TensorRT LLM backend to use nvLLM.
3737
nvllm_trt_engine_t nvllm_trt_engine_unsafe_create_from_executor(void* engine);
3838

3939
// Source: Enqueue a streaming request via a json message to the request queue

lib/bindings/python/uv.lock

+1-1
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

lib/runtime/src/component/service.rs

+1-2
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,7 @@ pub type StatsHandler =
2727
pub type EndpointStatsHandler =
2828
Box<dyn FnMut(endpoint::Stats) -> serde_json::Value + Send + Sync + 'static>;
2929

30-
// TODO(rename) - pending rename of project
31-
pub const PROJECT_NAME: &str = "Triton";
30+
pub const PROJECT_NAME: &str = "Dynamo";
3231

3332
#[derive(Educe, Builder, Dissolve)]
3433
#[educe(Debug)]

lib/runtime/src/lib.rs

+2-2
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
// See the License for the specific language governing permissions and
1414
// limitations under the License.
1515

16-
//! Triton
16+
//! Dynamo
1717
1818
#![allow(dead_code)]
1919
#![allow(unused_imports)]
@@ -49,7 +49,7 @@ pub use futures::stream;
4949
pub use tokio_util::sync::CancellationToken;
5050
pub use worker::Worker;
5151

52-
/// Types of Tokio runtimes that can be used to construct a Triton [Runtime].
52+
/// Types of Tokio runtimes that can be used to construct a Dynamo [Runtime].
5353
#[derive(Clone)]
5454
enum RuntimeType {
5555
Shared(Arc<tokio::runtime::Runtime>),

0 commit comments

Comments
 (0)