@@ -23,7 +23,8 @@ extern aclnnStatus aclnnInnerMoeDistributeCombineV2GetWorkspaceSize(
2323 int64_t epRankId, int64_t moeExpertNum, char *groupTp, int64_t tpWorldSize, int64_t tpRankId,
2424 int64_t expertShardType, int64_t sharedExpertNum, int64_t sharedExpertRankNum, int64_t globalBs, int64_t outDtype,
2525 int64_t commQuantMode, int64_t groupListType, char *commAlg, int64_t zeroExpertNum, int64_t copyExpertNum,
26- int64_t constExpertNum, const aclTensor *x, uint64_t *workspaceSize, aclOpExecutor **executor);
26+ int64_t constExpertNum, const aclTensor *x, const aclTensor *sendCostStats, uint64_t *workspaceSize,
27+ aclOpExecutor **executor);
2728
2829extern aclnnStatus aclnnInnerMoeDistributeCombineV2 (void *workspace, uint64_t workspaceSize, aclOpExecutor *executor,
2930 aclrtStream stream);
@@ -38,14 +39,15 @@ aclnnStatus aclnnMoeDistributeCombineV2GetWorkspaceSize(
3839 const aclTensor *sharedExpertXOptional, char *groupEp, int64_t epWorldSize, int64_t epRankId, int64_t moeExpertNum,
3940 char *groupTp, int64_t tpWorldSize, int64_t tpRankId, int64_t expertShardType, int64_t sharedExpertNum,
4041 int64_t sharedExpertRankNum, int64_t globalBs, int64_t outDtype, int64_t commQuantMode, int64_t groupListType,
41- char *commAlg, const aclTensor *xOut, uint64_t *workspaceSize, aclOpExecutor **executor)
42+ char *commAlg, const aclTensor *xOut, const aclTensor *sendCostStats, uint64_t *workspaceSize,
43+ aclOpExecutor **executor)
4244{
4345 return aclnnInnerMoeDistributeCombineV2GetWorkspaceSize (
4446 expandX, expertIds, assistInfoForCombine, epSendCounts, expertScales, tpSendCountsOptional, xActiveMaskOptional,
4547 activationScaleOptional, weightScaleOptional, groupListOptional, expandScalesOptional, sharedExpertXOptional,
4648 nullptr , nullptr , nullptr , nullptr , nullptr , groupEp, epWorldSize, epRankId, moeExpertNum, groupTp, tpWorldSize,
4749 tpRankId, expertShardType, sharedExpertNum, sharedExpertRankNum, globalBs, outDtype, commQuantMode,
48- groupListType, commAlg, 0 , 0 , 0 , xOut, workspaceSize, executor);
50+ groupListType, commAlg, 0 , 0 , 0 , xOut, sendCostStats, workspaceSize, executor);
4951}
5052
5153aclnnStatus aclnnMoeDistributeCombineV2 (void *workspace, uint64_t workspaceSize, aclOpExecutor *executor,
0 commit comments