require "json"
require "base64"

module DNN

  # This class deals with the model of the network.
  class Model
    attr_accessor :layers    # All layers possessed by the model
    attr_accessor :trainable # Setting false prevents learning of parameters.

    def self.load(file_name)
      Marshal.load(File.binread(file_name))
    end

    def self.load_json(json_str)
      hash = JSON.parse(json_str, symbolize_names: true)
      model = self.new
      model.layers = hash[:layers].map { |hash_layer| Util.load_hash(hash_layer) }
      model.compile(Util.load_hash(hash[:optimizer]))
      model
    end
  
    def initialize
      @layers = []
      @trainable = true
      @optimizer = nil
      @training = false
      @compiled = false
    end

    def load_json_params(json_str)
      has_param_layers_params = JSON.parse(json_str, symbolize_names: true)
      has_param_layers_index = 0
      @layers.each do |layer|
        next unless layer.is_a?(HasParamLayer)
        hash_params = has_param_layers_params[has_param_layers_index]
        hash_params.each do |key, (shape, base64_param)|
          bin = Base64.decode64(base64_param)
          data = Xumo::SFloat.from_binary(bin).reshape(*shape)
          if layer.params[key].is_a?(LearningParam)
            layer.params[key].data = data
          else
            layer.params[key] = data
          end
        end
        has_param_layers_index += 1
      end
    end
  
    def save(file_name)
      marshal = Marshal.dump(self)
      begin
        File.binwrite(file_name, marshal)
      rescue Errno::ENOENT => ex
        dir_name = file_name.match(%r`(.*)/.+$`)[1]
        Dir.mkdir(dir_name)
        File.binwrite(file_name, marshal)
      end
    end

    def to_json
      hash_layers = @layers.map { |layer| layer.to_hash }
      hash = {version: VERSION, layers: hash_layers, optimizer: @optimizer.to_hash}
      JSON.pretty_generate(hash)
    end
    
    def params_to_json
      has_param_layers = @layers.select { |layer| layer.is_a?(Layers::HasParamLayer) }
      has_param_layers_params = has_param_layers.map do |layer|
        layer.params.map { |key, param|
          param = param.data if param.is_a?(LearningParam)
          base64_param = Base64.encode64(param.to_binary)
          [key, [param.shape, base64_param]]
        }.to_h
      end
      JSON.dump(has_param_layers_params)
    end
  
    def <<(layer)
      if !layer.is_a?(Layers::Layer) && !layer.is_a?(Model)
        raise TypeError.new("layer is not an instance of the DNN::Layers::Layer class or DNN::Model class.")
      end
      @layers << layer
      self
    end
  
    def compile(optimizer)
      unless optimizer.is_a?(Optimizers::Optimizer)
        raise TypeError.new("optimizer is not an instance of the DNN::Optimizers::Optimizer class.")
      end
      @compiled = true
      layers_check
      @optimizer = optimizer
      build
      layers_shape_check
    end

    def build(super_model = nil)
      @super_model = super_model
      @layers.each do |layer|
        layer.build(self)
      end
    end

    def optimizer
      @optimizer ? @optimizer : @super_model.optimizer
    end

    def compiled?
      @compiled
    end

    def training?
      @training
    end

    def train(x, y, epochs,
              batch_size: 1,
              test: nil,
              verbose: true,
              batch_proc: nil,
              &epoch_proc)
      unless compiled?
        raise DNN_Error.new("The model is not compiled.")
      end
      num_train_data = x.shape[0]
      (1..epochs).each do |epoch|
        puts "【 epoch #{epoch}/#{epochs} 】" if verbose
        (num_train_data.to_f / batch_size).ceil.times do |index|
          x_batch, y_batch = Util.get_minibatch(x, y, batch_size)
          loss = train_on_batch(x_batch, y_batch, &batch_proc)
          if loss.nan?
            puts "\nloss is nan" if verbose
            return
          end
          num_trained_data = (index + 1) * batch_size
          num_trained_data = num_trained_data > num_train_data ? num_train_data : num_trained_data
          log = "\r"
          40.times do |i|
            if i < num_trained_data * 40 / num_train_data
              log << "="
            elsif i == num_trained_data * 40 / num_train_data
              log << ">"
            else
              log << "_"
            end
          end
          log << "  #{num_trained_data}/#{num_train_data} loss: #{sprintf('%.8f', loss)}"
          print log if verbose
        end
        if verbose && test
          acc = accurate(test[0], test[1], batch_size, &batch_proc)
          print "  accurate: #{acc}"
        end
        puts "" if verbose
        epoch_proc.call(epoch) if epoch_proc
      end
    end
  
    def train_on_batch(x, y, &batch_proc)
      input_data_shape_check(x, y)
      x, y = batch_proc.call(x, y) if batch_proc
      forward(x, true)
      loss_value = loss(y)
      backward(y)
      dloss
      update
      loss_value
    end
  
    def accurate(x, y, batch_size = 100, &batch_proc)
      input_data_shape_check(x, y)
      batch_size = batch_size >= x.shape[0] ? x.shape[0] : batch_size
      correct = 0
      (x.shape[0].to_f / batch_size).ceil.times do |i|
        x_batch = Xumo::SFloat.zeros(batch_size, *x.shape[1..-1])
        y_batch = Xumo::SFloat.zeros(batch_size, *y.shape[1..-1])
        batch_size.times do |j|
          k = i * batch_size + j
          break if k >= x.shape[0]
          x_batch[j, false] = x[k, false]
          y_batch[j, false] = y[k, false]
        end
        x_batch, y_batch = batch_proc.call(x_batch, y_batch) if batch_proc
        out = forward(x_batch, false)
        batch_size.times do |j|
          if @layers[-1].shape == [1]
            correct += 1 if out[j, 0].round == y_batch[j, 0].round
          else
            correct += 1 if out[j, true].max_index == y_batch[j, true].max_index
          end
        end
      end
      correct.to_f / x.shape[0]
    end
  
    def predict(x)
      input_data_shape_check(x)
      forward(x, false)
    end

    def predict1(x)
      predict(Xumo::SFloat.cast([x]))[0, false]
    end

    def copy
      Marshal.load(Marshal.dump(self))
    end

    def get_layer(*args)
      if args.length == 1
        index = args[0]
        @layers[index]
      else
        layer_class, index = args
        @layers.select { |layer| layer.is_a?(layer_class) }[index]
      end
    end

    def get_all_layers
      @layers.map { |layer|
        layer.is_a?(Model) ? layer.get_all_layers : layer
      }.flatten
    end
  
    def forward(x, training)
      @training = training
      @layers.each do |layer|
        x = if layer.is_a?(Layers::Layer)
          layer.forward(x)
        elsif layer.is_a?(Model)
          layer.forward(x, training)
        end
      end
      x
    end

    def loss(y)
      @layers[-1].loss(y)
    end

    def dloss
      @layers[-1].dloss
    end
  
    def backward(y)
      dout = y
      @layers.reverse.each do |layer|
        dout = layer.backward(dout)
      end
      dout
    end

    def update
      @layers.each do |layer|
        layer.update if @trainable && (layer.is_a?(Layers::HasParamLayer) || layer.is_a?(Model))
      end
    end

    def get_prev_layer(layer)
      layer_index = @layers.index(layer)
      prev_layer = if layer_index == 0
        if @super_model
          @super_model.layers[@super_model.layers.index(self) - 1]
        else
          self
        end
      else
        @layers[layer_index - 1]
      end
      if prev_layer.is_a?(Layers::Layer)
        prev_layer
      elsif prev_layer.is_a?(Model)
        prev_layer.layers[-1]
      end
    end

    private

    def layers_check
      unless @layers.first.is_a?(Layers::InputLayer)
        raise TypeError.new("The first layer is not an InputLayer.")
      end
      unless @layers.last.is_a?(Layers::OutputLayer)
        raise TypeError.new("The last layer is not an OutputLayer.")
      end
    end

    def input_data_shape_check(x, y = nil)
      unless @layers.first.shape == x.shape[1..-1]
        raise DNN_ShapeError.new("The shape of x does not match the input shape. x shape is #{x.shape[1..-1]}, but input shape is #{@layers.first.shape}.")
      end
      if y && @layers.last.shape != y.shape[1..-1]
        raise DNN_ShapeError.new("The shape of y does not match the input shape. y shape is #{y.shape[1..-1]}, but output shape is #{@layers.last.shape}.")
      end
    end

    def layers_shape_check
      @layers.each.with_index do |layer, i|
        prev_shape = layer.is_a?(Layers::Layer) ? layer.prev_layer.shape : layer.layers[-1]
        if layer.is_a?(Layers::Dense)
          if prev_shape.length != 1
            raise DNN_ShapeError.new("layer index(#{i}) Dense:  The shape of the previous layer is #{prev_shape}. The shape of the previous layer must be 1 dimensional.")
          end
        elsif layer.is_a?(Layers::Conv2D) || layer.is_a?(Layers::MaxPool2D)
          if prev_shape.length != 3
            raise DNN_ShapeError.new("layer index(#{i}) Conv2D:  The shape of the previous layer is #{prev_shape}. The shape of the previous layer must be 3 dimensional.")
          end
        elsif layer.is_a?(Layers::RNN)
          if prev_shape.length != 2
            layer_name = layer.class.name.match("\:\:(.+)$")[1]
            raise DNN_ShapeError.new("layer index(#{i}) #{layer_name}:  The shape of the previous layer is #{prev_shape}. The shape of the previous layer must be 3 dimensional.")
          end
        end
      end
    end
  end

end