Skip to content

Commit

Permalink
Add flashinfer mla backend for deepseek v3
Browse files Browse the repository at this point in the history
  • Loading branch information
Fridge003 committed Feb 22, 2025
1 parent 9087694 commit d9913bb
Show file tree
Hide file tree
Showing 4 changed files with 561 additions and 19 deletions.
1 change: 1 addition & 0 deletions python/sglang/srt/configs/model_config.py
Original file line number Diff line number Diff line change
Expand Up @@ -103,6 +103,7 @@ def __init__(
self.head_dim = 256
self.attention_arch = AttentionArch.MLA
self.kv_lora_rank = self.hf_config.kv_lora_rank
self.qk_nope_head_dim = self.hf_config.qk_nope_head_dim
self.qk_rope_head_dim = self.hf_config.qk_rope_head_dim
elif "MiniCPM3ForCausalLM" in self.hf_config.architectures:
self.head_dim = 128
Expand Down
Loading

0 comments on commit d9913bb

Please sign in to comment.