We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c1927e1 · commit 1519acf · Copy full SHA for 1519acf
1 file changed
python/sglang/srt/models/deepseek_v2.py
@@ -326,7 +326,7 @@ def forward(
326
and (self.weight.shape[0] == 256 or self.weight.shape[0] == 384)
327
and _device_sm >= 90
328
):
329
- if _device_sm >= 100 and self.weight.shape[0] == 256:
+ if _device_sm == 100 and self.weight.shape[0] == 256:
330
# router gemm output float32
331
logits = torch.empty(
332
hidden_states.shape[0],
0 commit comments