# -*- encoding: utf-8 -*-
# frozen_string_literal: true
require 'rdf/nquads'

module JSON::LD
  module FromRDF
    include Utils

    ##
    # Generate a JSON-LD array representation from an array of `RDF::Statement`.
    # Representation is in expanded form
    #
    # @param [Array<RDF::Statement>, RDF::Enumerable] dataset
    # @param [Boolean] useRdfType (false)
    #   If set to `true`, the JSON-LD processor will treat `rdf:type` like a normal property instead of using `@type`.
    # @param [Boolean] useNativeTypes (false) use native representations
    # @param extendedRepresentation (false)
    #   Use the extended internal representation for native types.
    #
    # @return [Array<Hash>] the JSON-LD document in normalized form
    def from_statements(dataset, useRdfType: false, useNativeTypes: false, extendedRepresentation: false)
      default_graph = {}
      graph_map = {'@default' => default_graph}
      referenced_once = {}

      value = nil

      # Create an entry for compound-literal node detection
      compound_literal_subjects = {}

      # Create a map for node to object representation

      # For each statement in dataset
      dataset.each do |statement|
        # log_debug("statement") { statement.to_nquads.chomp}

        name = statement.graph_name ? @context.expand_iri(statement.graph_name, base: @options[:base]).to_s : '@default'

        # Create a graph entry as needed
        node_map = graph_map[name] ||= {}
        compound_literal_subjects[name] ||= {}

        default_graph[name] ||= {'@id' => name} unless name == '@default'

        subject = statement.subject.statement? ?
          resource_representation(statement.subject, useNativeTypes, extendedRepresentation)['@id'].to_json_c14n :
          statement.subject.to_s
        node = node_map[subject] ||= resource_representation(statement.subject, useNativeTypes, extendedRepresentation)

        # If predicate is rdf:datatype, note subject in compound literal subjects map
        if @options[:rdfDirection] == 'compound-literal' && statement.predicate == RDF.to_uri + 'direction'
          compound_literal_subjects[name][subject] ||= true
        end

        # If object is an IRI, blank node identifier, or statement, and node map does not have an object member, create one and initialize its value to a new JSON object consisting of a single member @id whose value is set to object.
        unless statement.object.literal?
          object = statement.object.statement? ?
            resource_representation(statement.object, useNativeTypes, extendedRepresentation)['@id'].to_json_c14n :
            statement.object.to_s
          node_map[object] ||=
            resource_representation(statement.object, useNativeTypes, extendedRepresentation)
        end

        # If predicate equals rdf:type, and object is an IRI or blank node identifier, append object to the value of the @type member of node. If no such member exists, create one and initialize it to an array whose only item is object. Finally, continue to the next RDF triple.
        if statement.predicate == RDF.type && statement.object.resource? && !useRdfType
          merge_value(node, '@type', statement.object.to_s)
          next
        end

        # Set value to the result of using the RDF to Object Conversion algorithm, passing object, rdfDirection, and use native types.
        value = resource_representation(statement.object, useNativeTypes, extendedRepresentation)

        merge_value(node, statement.predicate.to_s, value)

        # If object is a blank node identifier or rdf:nil, it might represent the a list node:
        if statement.object == RDF.nil
          # Append a new JSON object consisting of three members, node, property, and value to the usages array. The node member is set to a reference to node, property to predicate, and value to a reference to value.
          object = node_map[statement.object.to_s]
          merge_value(object, :usages, {
            node:     node,
            property: statement.predicate.to_s,
            value:    value
          })
        elsif referenced_once.key?(statement.object.to_s)
          referenced_once[statement.object.to_s] = false
        elsif statement.object.node?
          referenced_once[statement.object.to_s] = {
            node:     node,
            property: statement.predicate.to_s,
            value:    value
          }
        end
      end

      # For each name and graph object in graph map:
      graph_map.each do |name, graph_object|

        # If rdfDirection is compound-literal, check referenced_once for entries from compound_literal_subjects
        compound_literal_subjects.fetch(name, {}).keys.each do |cl|
          node = referenced_once[cl][:node]
          next unless node.is_a?(Hash)
          property = referenced_once[cl][:property]
          value = referenced_once[cl][:value]
          cl_node = graph_map[name].delete(cl)
          next unless cl_node.is_a?(Hash)
          node[property].select do |v|
            next unless v['@id'] == cl
            v.delete('@id')
            v['@value'] = cl_node[RDF.value.to_s].first['@value']
            if cl_node[RDF.to_uri.to_s + 'language']
              lang = cl_node[RDF.to_uri.to_s + 'language'].first['@value']
              if lang !~ /^[a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*$/
                warn "i18n datatype language must be valid BCP47: #{lang.inspect}"
              end
              v['@language'] = lang
            end
            v['@direction'] = cl_node[RDF.to_uri.to_s + 'direction'].first['@value']
          end
        end

        nil_var = graph_object.fetch(RDF.nil.to_s, {})

        # For each item usage in the usages member of nil, perform the following steps:
        nil_var.fetch(:usages, []).each do |usage|
          node, property, head = usage[:node], usage[:property], usage[:value]
          list, list_nodes = [], []

          # If property equals rdf:rest, the value associated to the usages member of node has exactly 1 entry, node has a rdf:first and rdf:rest property, both of which have as value an array consisting of a single element, and node has no other members apart from an optional @type member whose value is an array with a single item equal to rdf:List, node represents a well-formed list node. Continue with the following steps:
          # log_debug("list element?") {node.to_json(JSON_STATE) rescue 'malformed json'}
          while property == RDF.rest.to_s &&
              blank_node?(node) &&
              referenced_once[node['@id']] &&
              node.keys.none? {|k| !["@id", '@type', :usages, RDF.first.to_s, RDF.rest.to_s].include?(k)} &&
              (f = node[RDF.first.to_s]).is_a?(Array) && f.length == 1 &&
              (r = node[RDF.rest.to_s]).is_a?(Array) && r.length == 1 &&
              ((t = node['@type']).nil? || t == [RDF.List.to_s])
            list << Array(node[RDF.first.to_s]).first
            list_nodes << node['@id']

            # get next node, moving backwards through list
            node_usage = referenced_once[node['@id']]
            node, property, head = node_usage[:node], node_usage[:property], node_usage[:value]
          end

          head.delete('@id')
          head['@list'] = list.reverse
          list_nodes.each {|node_id| graph_object.delete(node_id)}
        end

        # Create annotations on graph object
        create_annotations(graph_object)
      end

      result = []
      default_graph.keys.opt_sort(ordered: @options[:ordered]).each do |subject|
        node = default_graph[subject]
        if graph_map.key?(subject)
          node['@graph'] = []
          graph_map[subject].keys.opt_sort(ordered: @options[:ordered]).each do |s|
            n = graph_map[subject][s]
            n.delete(:usages)
            node['@graph'] << n unless node_reference?(n)
          end
        end
        node.delete(:usages)
        result << node unless node_reference?(node)
      end
      # log_debug("fromRdf") {result.to_json(JSON_STATE) rescue 'malformed json'}
      result
    end

    private

    RDF_LITERAL_NATIVE_TYPES = Set.new([RDF::XSD.boolean, RDF::XSD.integer, RDF::XSD.double]).freeze

    def resource_representation(resource, useNativeTypes, extendedRepresentation)
      case resource
      when RDF::Statement
        # Note, if either subject or object are a BNode which is used elsewhere,
        # this might not work will with the BNode accounting from above.
        rep = {'@id' => resource_representation(resource.subject, false, extendedRepresentation)}
        if resource.predicate == RDF.type
          rep['@id'].merge!('@type' => resource.object.to_s)
        else
          rep['@id'].merge!(
            resource.predicate.to_s =>
            as_array(resource_representation(resource.object, useNativeTypes, extendedRepresentation)))
        end
        rep
      when RDF::Literal
        base = @options[:base]
        rdfDirection = @options[:rdfDirection]
        res = {}

        if resource.datatype == RDF::URI(RDF.to_uri + "JSON") && @context.processingMode('json-ld-1.1')
          res['@type'] = '@json'
          res['@value'] = begin
            ::JSON.parse(resource.object)
          rescue ::JSON::ParserError => e
            raise JSON::LD::JsonLdError::InvalidJsonLiteral, e.message
          end
        elsif useNativeTypes && extendedRepresentation
          res['@value'] = resource  # Raw literal
        elsif resource.datatype.start_with?("https://www.w3.org/ns/i18n#") && rdfDirection == 'i18n-datatype' && @context.processingMode('json-ld-1.1')
          lang, dir = resource.datatype.fragment.split('_')
          res['@value'] = resource.to_s
          unless lang.empty?
            if lang !~ /^[a-zA-Z]{1,8}(-[a-zA-Z0-9]{1,8})*$/
              if options[:validate]
                raise JsonLdError::InvalidLanguageMapping, "rdf:language must be valid BCP47: #{lang.inspect}"
              else
                warn "rdf:language must be valid BCP47: #{lang.inspect}"
              end
            end
            res['@language'] = lang
          end
          res['@direction'] = dir
        elsif useNativeTypes && RDF_LITERAL_NATIVE_TYPES.include?(resource.datatype) && resource.valid?
          res['@value'] = resource.object
        else
          resource.canonicalize! if resource.valid? && resource.datatype == RDF::XSD.double
          if resource.datatype?
            res['@type'] = resource.datatype.to_s
          elsif resource.language?
            res['@language'] = resource.language.to_s
          end
          res['@value'] = resource.to_s
        end
        res
      else
        {'@id' => resource.to_s}
      end
    end
  end
end