We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7943e43, commit be09580 (Copy full SHA for be09580)
python/sglang/srt/server_args.py
@@ -323,6 +323,9 @@ def __post_init__(self):
323
assert (
324
not self.enable_dp_attention
325
), "DeepEP MoE `auto` mode is not supported with DP Attention."
326
+ if self.deepep_mode == "normal":
327
+ logger.warning("Cuda graph is disabled because deepep_mode=`normal`")
328
+ self.disable_cuda_graph = True
329
self.ep_size = self.tp_size
330
self.enable_sp_layernorm = (
331
self.dp_size < self.tp_size if self.enable_dp_attention else True
0 commit comments