Commit 4fd6432d authored by Lawrence McAfee's avatar Lawrence McAfee
Browse files

fixed zero_grad for fp32_from_float16_groups

parent 90e0a0dd
Loading
Loading
Loading
Loading
+2 −0
Original line number Diff line number Diff line
@@ -285,6 +285,8 @@ class Float16OptimizerWithFloat16Params(MegatronOptimizer):
                float16_groups & fp32_from_fp32_groups."""
        for group in self.float16_groups:
            _zero_grad_group_helper(group, set_to_none)
        for group in self.fp32_from_float16_groups:
            _zero_grad_group_helper(group, set_to_none)
        for group in self.fp32_from_fp32_groups:
            _zero_grad_group_helper(group, set_to_none)