We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 7cae5c4, commit 6cf59fa (Copy full SHA for 6cf59fa)
nemo/collections/nlp/models/language_modeling/megatron_gpt_model.py
@@ -545,6 +545,7 @@ def setup_mcore_distributed_parallel(self):
545
# mcore bucket_size is based on num of parameters, therefore not
546
# using bucket_cap_mb to configure bucket_size here
547
bucket_size=self.cfg.optim.get('ddp_bucket_size', None),
548
+ average_in_collective=self.cfg.optim.get('average_in_collective', True),
549
)
550
self.model = [
551
McoreDDP(
0 commit comments