2 files changed, +10 -1 lines changed
lines changed Original file line number Diff line number Diff line change @@ -540,7 +540,7 @@ def fp8_block_scale_moe_runner(
540
540
541
541
@fp8_block_scale_moe_runner .register_fake
542
542
def _ (
543
- rrouting_logits : torch .Tensor ,
543
+ routing_logits : torch .Tensor ,
544
544
routing_bias : torch .Tensor ,
545
545
hidden_states : torch .Tensor ,
546
546
hidden_states_scale : torch .Tensor ,
Original file line number Diff line number Diff line change @@ -1797,6 +1797,15 @@ class TorchCompileConfig(BaseModel):
1797
1797
description =
1798
1798
"The maximum number of CUDA streams to use for torch.compile." )
1799
1799
1800
+ @field_validator ('max_num_streams' )
1801
+ @classmethod
1802
+ def validate_torch_compile_max_num_streams (cls , v ):
1803
+ """Validate torch_compile_config.max_num_streams >= 1."""
1804
+ if v < 1 :
1805
+ raise ValueError (
1806
+ "torch_compile_config.max_num_streams must be >= 1" )
1807
+ return v
1808
+
1800
1809
1801
1810
class TorchLlmArgs (BaseLlmArgs ):
1802
1811
# Just a dummy BuildConfig to allow code reuse with the TrtLlmArgs
You can’t perform that action at this time.
0 commit comments