diff --git a/vllm/model_executor/models/nemotron_nas.py b/vllm/model_executor/models/nemotron_nas.py index 19a942a5277cc..83ef5e7e1282d 100644 --- a/vllm/model_executor/models/nemotron_nas.py +++ b/vllm/model_executor/models/nemotron_nas.py @@ -169,10 +169,13 @@ class DeciLMDecoderLayer(nn.Module): self.input_layernorm = RMSNorm(config.hidden_size, eps=config.rms_norm_eps) if not self._is_no_op_ffn: - ffn_mult = block_config.ffn.ffn_mult - intermediate_size = _ffn_mult_to_intermediate_size( - ffn_mult, config.hidden_size - ) + if hasattr(block_config.ffn, "ffn_mult"): + ffn_mult = block_config.ffn.ffn_mult + intermediate_size = _ffn_mult_to_intermediate_size( + ffn_mult, config.hidden_size + ) + else: + intermediate_size = block_config.ffn.intermediate_size self.mlp = LlamaMLP( hidden_size=self.hidden_size,