
Commit 41617a7

Updates Gemma3n MLP layer
Updates the Gemma3n MLP layer to use the intermediate size specified for each layer, fixing an issue where the whole per-layer intermediate_size sequence, rather than the value for the given layer, was passed to every layer's MLP. Also renames Gemma3nMLP to Gemma3nTextMLP.

Signed-off-by: Xinyuan Tong <[email protected]>
1 parent 69183f8 commit 41617a7

File tree

1 file changed (+4, -3 lines)


python/sglang/srt/models/gemma3n_causal.py

Lines changed: 4 additions & 3 deletions
@@ -62,7 +62,7 @@ class Gemma3nTextScaledWordEmbedding(Gemma3TextScaledWordEmbedding):
     pass
 
 
-class Gemma3nMLP(nn.Module):
+class Gemma3nTextMLP(nn.Module):
     def __init__(
         self,
         hidden_size: int,
@@ -514,10 +514,11 @@ def __init__(
             prefix=add_prefix("self_attn", prefix),
         )
 
+        intermediate_size = config.intermediate_size[layer_id]
         activation_sparsity = config.activation_sparsity_pattern[layer_id]
-        self.mlp = Gemma3nMLP(
+        self.mlp = Gemma3nTextMLP(
             hidden_size=self.hidden_size,
-            intermediate_size=config.intermediate_size,
+            intermediate_size=intermediate_size,
             hidden_activation=config.hidden_activation,
             activation_sparsity=activation_sparsity,
             quant_config=quant_config,
