lib/torch/optim/adadelta.rb in torch-rb-0.3.7 vs lib/torch/optim/adadelta.rb in torch-rb-0.4.0
- old
+ new
@@ -43,10 +43,10 @@
end
square_avg.mul!(rho).addcmul!(1 - rho, grad, grad)
std = square_avg.add(eps).sqrt!
delta = acc_delta.add(eps).sqrt!.div!(std).mul!(grad)
- p.data.add!(-group[:lr], delta)
+ p.data.add!(delta, alpha: -group[:lr])
acc_delta.mul!(rho).addcmul!(1 - rho, delta, delta)
end
end
loss