diff --git a/vllm/model_executor/models/aria.py b/vllm/model_executor/models/aria.py index d5179df3de1fc..8c6873de13627 100644 --- a/vllm/model_executor/models/aria.py +++ b/vllm/model_executor/models/aria.py @@ -60,6 +60,9 @@ def __init__( prefix: str = "", ) -> None: super().__init__(config, quant_config, prefix) + # Unlike Idefics3VisionTransformer, which uses LayerNorm after the + # final layer, Aria omits this normalization, so we replace it with an + # Identity layer. self.post_layernorm = nn.Identity() def load_weights(self, weights: Iterable[Tuple[str,