|
|
|
@ -215,7 +215,7 @@ def set_gradient_clip(clip, param_list=None, program=None):
|
|
|
|
|
def append_gradient_clip_ops(param_grad):
|
|
|
|
|
context = dict()
|
|
|
|
|
for p, g in param_grad:
|
|
|
|
|
with p.block.program.optimization_guard(p):
|
|
|
|
|
with p.block.program.optimized_guard(p):
|
|
|
|
|
clip_attr = getattr(p, 'gradient_clip_attr', NullGradientClipAttr())
|
|
|
|
|
if clip_attr is None:
|
|
|
|
|
clip_attr = NullGradientClipAttr()
|
|
|
|
@ -228,7 +228,7 @@ def append_gradient_clip_ops(param_grad):
|
|
|
|
|
|
|
|
|
|
res = []
|
|
|
|
|
for p, g in param_grad:
|
|
|
|
|
with p.block.program.optimization_guard(p):
|
|
|
|
|
with p.block.program.optimized_guard(p):
|
|
|
|
|
res.append(clip_attr.create_operators(param=p, grad=g))
|
|
|
|
|
|
|
|
|
|
return res
|
|
|
|
|