lib/torch/optim/adadelta.rb in torch-rb-0.3.7 vs lib/torch/optim/adadelta.rb in torch-rb-0.4.0

- old
+ new

@@ -43,10 +43,10 @@
     end
     square_avg.mul!(rho).addcmul!(1 - rho, grad, grad)
     std = square_avg.add(eps).sqrt!
     delta = acc_delta.add(eps).sqrt!.div!(std).mul!(grad)
-    p.data.add!(-group[:lr], delta)
+    p.data.add!(delta, alpha: -group[:lr])
     acc_delta.mul!(rho).addcmul!(1 - rho, delta, delta)
   end
 end
 loss