module DNN
  module Regularizers

    class Regularizer
      attr_accessor :param

      def self.from_hash(hash)
        return nil unless hash
        regularizer_class = DNN.const_get(hash[:class])
        regularizer = regularizer_class.allocate
        raise DNN_Error, "#{regularizer.class} is not an instance of #{self} class." unless regularizer.is_a?(self)
        regularizer.load_hash(hash)
        regularizer
      end

      def forward(x)
        raise NotImplementedError, "Class '#{self.class.name}' has to implement method 'forward'"
      end

      def backward
        raise NotImplementedError, "Class '#{self.class.name}' has to implement method 'backward'"
      end

      def to_hash(merge_hash)
        hash = { class: self.class.name }
        hash.merge!(merge_hash)
        hash
      end

      def load_hash(hash)
        raise NotImplementedError, "Class '#{self.class.name}' has to implement method 'load_hash'"
      end
    end

    class L1 < Regularizer
      attr_accessor :l1_lambda

      # @param [Float] l1_lambda L1 regularizer coefficient.
      def initialize(l1_lambda = 0.01)
        @l1_lambda = l1_lambda
      end

      # Add the L1 penalty (lambda * sum of absolute weights) to the loss value.
      def forward(x)
        x + @l1_lambda * @param.data.abs.sum
      end

      # Accumulate the gradient of the L1 penalty (lambda * sign of the weights)
      # into the parameter gradient.
      def backward
        dparam = Xumo::SFloat.ones(*@param.data.shape)
        dparam[@param.data < 0] = -1
        @param.grad += @l1_lambda * dparam
      end

      def to_hash
        super(l1_lambda: @l1_lambda)
      end

      def load_hash(hash)
        initialize(hash[:l1_lambda])
      end
    end

    class L2 < Regularizer
      attr_accessor :l2_lambda

      # @param [Float] l2_lambda L2 regularizer coefficient.
      def initialize(l2_lambda = 0.01)
        @l2_lambda = l2_lambda
      end

      # Add the L2 penalty (0.5 * lambda * sum of squared weights) to the loss value.
      def forward(x)
        x + 0.5 * @l2_lambda * (@param.data**2).sum
      end

      # Accumulate the gradient of the L2 penalty (lambda * weights) into the
      # parameter gradient.
      def backward
        @param.grad += @l2_lambda * @param.data
      end

      def to_hash
        super(l2_lambda: @l2_lambda)
      end

      def load_hash(hash)
        initialize(hash[:l2_lambda])
      end
    end

    class L1L2 < Regularizer
      attr_accessor :l1_lambda
      attr_accessor :l2_lambda

      # @param [Float] l1_lambda L1 regularizer coefficient.
      # @param [Float] l2_lambda L2 regularizer coefficient.
      def initialize(l1_lambda = 0.01, l2_lambda = 0.01)
        @l1_lambda = l1_lambda
        @l2_lambda = l2_lambda
      end

      # Add both the L1 and L2 penalties to the loss value.
      def forward(x)
        l1 = @l1_lambda * @param.data.abs.sum
        l2 = 0.5 * @l2_lambda * (@param.data**2).sum
        x + l1 + l2
      end

      # Accumulate the gradients of both penalties into the parameter gradient.
      def backward
        dparam = Xumo::SFloat.ones(*@param.data.shape)
        dparam[@param.data < 0] = -1
        @param.grad += @l1_lambda * dparam
        @param.grad += @l2_lambda * @param.data
      end

      def to_hash
        super(l1_lambda: @l1_lambda, l2_lambda: @l2_lambda)
      end

      def load_hash(hash)
        initialize(hash[:l1_lambda], hash[:l2_lambda])
      end
    end

  end
end
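
# Usage sketch (illustrative only, not part of this file): how the surrounding
# framework is expected to drive a regularizer. The `DNN::Layers::Dense`
# constructor and its `weight_regularizer:` keyword shown below are assumptions
# about the rest of the library, not definitions made here.
#
#   dense = DNN::Layers::Dense.new(
#     64, weight_regularizer: DNN::Regularizers::L2.new(0.01)
#   )
#
#   # During training, the framework binds each regularizer to a parameter
#   # (regularizer.param = weight) and then, per step:
#   #   loss = regularizer.forward(loss)  # add the penalty term to the loss
#   #   regularizer.backward              # accumulate the penalty gradient into param.grad
#
#   # For serialization, `to_hash` captures the coefficients and
#   # `Regularizer.from_hash` rebuilds the instance from that hash.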