From 4a6e7d0b7b67776c20d6b802d9bf7f2b7007579e Mon Sep 17 00:00:00 2001 From: alcanderian Date: Sat, 7 Jun 2025 06:14:51 +0000 Subject: [PATCH 1/2] [sgl-kernel] update deepgemm --- sgl-kernel/CMakeLists.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/sgl-kernel/CMakeLists.txt b/sgl-kernel/CMakeLists.txt index ab11ded67ed4..e80d4aa52960 100644 --- a/sgl-kernel/CMakeLists.txt +++ b/sgl-kernel/CMakeLists.txt @@ -53,7 +53,7 @@ FetchContent_Populate(repo-cutlass) FetchContent_Declare( repo-deepgemm GIT_REPOSITORY https://github.com/deepseek-ai/DeepGEMM - GIT_TAG d75b218b7b8f4a5dd5406ac87905039ead3ae42f + GIT_TAG 8dfa3298274bfe6b242f6f8a3e6f3eff2707dd9f GIT_SHALLOW OFF ) FetchContent_Populate(repo-deepgemm) From cf38ce5eb4f729845c7a5f92cbf5d22f312493a4 Mon Sep 17 00:00:00 2001 From: zhyncs Date: Sat, 7 Jun 2025 06:23:59 +0000 Subject: [PATCH 2/2] upd --- python/sglang/srt/models/deepseek_v2.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index d62478e0f746..895ef648b5be 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -1719,7 +1719,10 @@ def determine_num_fused_shared_experts( logger, "Only Deepseek V3/R1 on NV-platform can use shared experts fusion optimization. Shared experts fusion optimization is disabled.", ) - elif (global_server_args_dict["enable_deepep_moe"] or global_server_args_dict["enable_ep_moe"]): + elif ( + global_server_args_dict["enable_deepep_moe"] + or global_server_args_dict["enable_ep_moe"] + ): self.num_fused_shared_experts = 0 global_server_args_dict["disable_shared_experts_fusion"] = True log_info_on_rank0(