GitOrigin-RevId: d677d1ca6b
release-1.4
@@ -84,7 +84,7 @@ class Adadelta(Optimizer):
 step += c1
 grad = param.grad
 if weight_decay != 0.0:
-    grad += param * _weight_decay
+    grad = grad + param * _weight_decay
 square_avg = states["square_avg"]
 acc_delta = states["acc_delta"]
@@ -82,7 +82,7 @@ class Adagrad(Optimizer):
 step += c1
 grad = param.grad
 if weight_decay != 0.0:
-    grad += param * _weight_decay
+    grad = grad + param * _weight_decay
 square_avg = states["square_avg"]
 square_avg += grad ** c2
@@ -85,7 +85,7 @@ class Adam(Optimizer):
 grad = param.grad
 if weight_decay != 0.0:
-    grad += param * _weight_decay
+    grad = grad + param * _weight_decay
 states = self._state[param]
@@ -72,7 +72,7 @@ class SGD(Optimizer):
 grad = param.grad
 if weight_decay != 0.0:
-    grad += param * _weight_decay
+    grad = grad + param * _weight_decay
 if inplace_mode:
     if momentum: