Undo extra changes

ai-dynamo · tanmayv25 · Jul 31, 2025 · Jul 23, 2025 · Jul 28, 2025 · Jul 28, 2025
commit 004a801c6c55f79280e9b6740bc5143d5cf94373
diff --git a/components/backends/trtllm/engine_configs/agg.yaml b/components/backends/trtllm/engine_configs/agg.yaml
@@ -16,6 +16,7 @@ tensor_parallel_size: 1
 moe_expert_parallel_size: 1
 enable_attention_dp: false
 max_num_tokens: 8192
+max_batch_size: 16
 trust_remote_code: true
 backend: pytorch
 enable_chunked_prefill: true

@@ -94,6 +94,8 @@ TRTLLM_USE_NIXL_KVCACHE_EXPERIMENTAL="0"
 
 # TensorRT-LLM PyPI index URL
 TENSORRTLLM_INDEX_URL="https://pypi.python.org/simple"
+# TODO: Remove the version specification below and use the ai-dynamo[trtllm] package instead.
+# Doing so requires updating Dockerfile.tensorrt_llm to use the ai-dynamo[trtllm] package.
 DEFAULT_TENSORRTLLM_PIP_WHEEL="tensorrt-llm==1.0.0rc4"
 TENSORRTLLM_PIP_WHEEL=""