[https://nvbugs/5451426][fix] Avoid torch compile on full eagle3 worker (#7245)

liji-nv · web-flow · commit 877e1f44d3b4 · 2025-08-27T09:59:06.000+08:00
Signed-off-by: Jin Li <59594262+liji-nv@users.noreply.github.com>
diff --git a/tensorrt_llm/_torch/speculative/eagle3.py b/tensorrt_llm/_torch/speculative/eagle3.py
@@ -266,7 +266,6 @@ def __init__(self, spec_config: "EagleDecodingConfig", mapping: Mapping):
         self.max_draft_len = self.spec_config.max_draft_len
         self.mapping = mapping
 
-    @torch.compile(options={"max-autotune": True})
     def forward(self, input_ids, position_ids, hidden_states, logits,
                 attn_metadata, spec_metadata, draft_model):
         batch_size = attn_metadata.num_seqs