We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent ac935c7 · commit 91a9986 · Copy full SHA for 91a9986
deepspeed/runtime/pipe/engine.py
@@ -852,7 +852,8 @@ def _exec_backward_pass(self, buffer_id):
 
         if self.using_bf16_optimizer and not self.is_last_stage():
             # manually call because we don't call optimizer.backward()
-            self.optimizer.update_hp_grads(clear_lp_grads=False)
+            if not self._config.bfloat16_immediate_grad_update:
+                self.optimizer.update_hp_grads(clear_lp_grads=False)
 
         # Free up the memory from the output of forward()
         self.pipe_buffers['output_tensors'][buffer_id] = None
0 commit comments