Skip to content

Commit ced1a73

Browse files
authored
Merge branch 'main' into rmccormick/cp_anish_docs_to_main
2 parents fc63b57 + fb10ffb commit ced1a73

File tree

4 files changed

+2
-6
lines changed

4 files changed

+2
-6
lines changed

.github/workflows/trigger_ci.yml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -52,7 +52,7 @@ jobs:
5252
- 'components/backends/vllm/**'
5353
- 'tests/serve/test_vllm.py'
5454
trtllm:
55-
- 'container/Dockerfile.tensorrt_llm'
55+
- 'container/Dockerfile.trtllm'
5656
- 'components/backends/trtllm/**'
5757
- 'container/build.sh'
5858
- 'container/build_trtllm_wheel.sh'

components/backends/trtllm/src/dynamo/trtllm/main.py

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -229,9 +229,6 @@ async def init(runtime: DistributedRuntime, config: Config):
229229
endpoint = component.endpoint(config.endpoint)
230230

231231
if is_first_worker(config):
232-
# Get runtime configuration from the engine
233-
runtime_config = await get_engine_runtime_config(engine, config)
234-
235232
# Register the model with runtime config
236233
await register_llm(
237234
modelType,
@@ -240,7 +237,6 @@ async def init(runtime: DistributedRuntime, config: Config):
240237
config.served_model_name,
241238
kv_cache_block_size=config.kv_block_size,
242239
migration_limit=config.migration_limit,
243-
runtime_config=runtime_config, # Add runtime config here
244240
)
245241
# publisher will be set later if publishing is enabled.
246242
handler_config = RequestHandlerConfig(

components/backends/vllm/README.md

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -41,6 +41,7 @@ git checkout $(git describe --tags $(git rev-list --tags --max-count=1))
4141
| [**SLA-Based Planner**](../../../docs/architecture/sla_planner.md) | ✅ | |
4242
| [**Load Based Planner**](../../../docs/architecture/load_planner.md) | 🚧 | WIP |
4343
| [**KVBM**](../../../docs/architecture/kvbm_architecture.md) | 🚧 | WIP |
44+
| [**LMCache**](./LMCache_Integration.md) | ✅ | |
4445

4546
### Large Scale P/D and WideEP Features
4647

components/backends/vllm/src/dynamo/vllm/main.py

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -132,7 +132,6 @@ async def init_prefill(runtime: DistributedRuntime, config: Config):
132132
"""
133133
Instantiate and serve
134134
"""
135-
136135
component = runtime.namespace(config.namespace).component(config.component)
137136
await component.create_service()
138137

0 commit comments

Comments
 (0)