Skip to content

Commit ad2aeb3

Browse files
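fix: check gradient accumulation with (_step_id + 1) % acc_freq; remove commented-out paddle checks from tests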
1 parent 62dc7d5 commit ad2aeb3

2 files changed

Lines changed: 1 addition & 5 deletions

File tree

deepmd/pd/train/training.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -783,7 +783,7 @@ def step(_step_id, task_key="Default") -> None:
783 | 783 |   loss.backward()
784 | 784 |
785 | 785 |   # gradient accumulation
786 |     | - if _step_id % self.acc_freq == 0:
    | 786 | + if (_step_id + 1) % self.acc_freq == 0:
787 | 787 |   # fuse + allreduce manually before optimization if use DDP + no_sync
788 | 788 |   # details in https://github.com/PaddlePaddle/Paddle/issues/48898#issuecomment-1343838622
789 | 789 |   if self.world_size > 1:

source/tests/pd/test_training.py

Lines changed: 0 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -150,9 +150,7 @@ def setUp(self) -> None:
150 | 150 |   self.config["model"] = deepcopy(model_se_e2_a)
151 | 151 |   self.config["training"]["numb_steps"] = 1
152 | 152 |   self.config["training"]["save_freq"] = 1
153 |     | - # import paddle
154 | 153 |   enable_prim(True)
155 |     | - # assert paddle.framework.core._is_eager_prim_enabled()
156 | 154 |
157 | 155 |   def tearDown(self) -> None:
158 | 156 |   DPTrainTest.tearDown(self)
@@ -170,9 +168,7 @@ def setUp(self) -> None:
170 | 168 |   self.config["training"]["numb_steps"] = 1
171 | 169 |   self.config["training"]["save_freq"] = 1
172 | 170 |   self.config["training"]["acc_freq"] = 4
173 |     | - # import paddle
174 | 171 |   enable_prim(True)
175 |     | - # assert paddle.framework.core._is_eager_prim_enabled()
176 | 172 |
177 | 173 |   def tearDown(self) -> None:
178 | 174 |   DPTrainTest.tearDown(self)

0 commit comments

Comments (0)