ModernBertEmbeddings: resolve the LayerNorm epsilon defensively.

Read the epsilon from `config.norm_eps`, fall back to `config.layer_norm_eps`,
and finally to 1e-5 when neither attribute is set (or is falsy), instead of
unconditionally reading `config.layer_norm_eps`.

diff --git a/vllm/model_executor/models/modernbert.py b/vllm/model_executor/models/modernbert.py
index 5dbf38c690..5a0769f3bd 100644
--- a/vllm/model_executor/models/modernbert.py
+++ b/vllm/model_executor/models/modernbert.py
@@ -39,9 +39,12 @@ class ModernBertEmbeddings(nn.Module):
         self.tok_embeddings = VocabParallelEmbedding(
             config.vocab_size, config.hidden_size
         )
-        self.norm = nn.LayerNorm(
-            config.hidden_size, eps=config.layer_norm_eps, bias=config.norm_bias
+        eps = (
+            getattr(config, "norm_eps", None)
+            or getattr(config, "layer_norm_eps", None)
+            or 1e-5
         )
+        self.norm = nn.LayerNorm(config.hidden_size, eps=eps, bias=config.norm_bias)
 
     def get_input_embeddings(self, input_ids: torch.Tensor) -> torch.Tensor:
         return self.tok_embeddings(input_ids)