We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent f0ecff7, commit 0d1b1fa (Copy full SHA for 0d1b1fa)
python/sglang/srt/models/deepseek_v2.py
@@ -252,8 +252,7 @@ def forward(self, hidden_states):
252
# NOTE: For some unknown reason, router_gemm seems to degrade accept length.
253
if (
254
_is_cuda
255
- and not self.is_nextn
256
- and hidden_states.shape[0] < 4
+ and hidden_states.shape[0] <= 16
257
and hidden_states.shape[1] == 7168
258
and self.weight.shape[0] == 256
259
and _device_sm >= 90
0 commit comments