fix: Update TRT-LLM Wide-EP Disagg GB200 Recipe to be compatible with TRT-LLM Version (#5383)

a98406d4 · Rohan Varma · GitHub · 9ca2923d · a98406d4
Unverified commit a98406d4, authored Jan 13, 2026 by Rohan Varma; committed by GitHub on Jan 13, 2026.
Hide whitespace changes
Inline Side-by-side

Showing 1 changed file with 6 additions and 8 deletions

recipes/deepseek-r1/trtllm/disagg/wide_ep/gb200/deploy.yaml +6 -8

No files found.
--- a/recipes/deepseek-r1/trtllm/disagg/wide_ep/gb200/deploy.yaml
+++ b/recipes/deepseek-r1/trtllm/disagg/wide_ep/gb200/deploy.yaml
@@ -20,10 +20,9 @@ metadata:
  name: prefill-config
 data:
  prefill_config.yaml: |
-    build_config:
+    max_batch_size: 4
-        max_batch_size: 4
+    max_num_tokens: 4608
-        max_num_tokens: 4608
+    max_seq_len: 1227
-        max_seq_len: 1227
    tensor_parallel_size: 4
    moe_expert_parallel_size: 4
    enable_attention_dp: true
@@ -52,10 +51,9 @@ data:
    moe_expert_parallel_size: 32
    enable_attention_dp: true
    pipeline_parallel_size: 1
-    build_config:
+    max_batch_size: 32
-        max_batch_size: 32
+    max_num_tokens: 32
-        max_num_tokens: 32
+    max_seq_len: 2251
-        max_seq_len: 2251
    cuda_graph_config:
      enable_padding: true
      batch_sizes: