module Bolognese module Utils def find_from_format(id: nil, string: nil, ext: nil) if id.present? find_from_format_by_id(id) elsif string.present? find_from_format_by_string(string, ext: ext) end end def find_from_format_by_id(id) id = normalize_id(id) if /\A(?:(http|https):\/\/(dx\.)?doi.org\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(id) get_doi_ra(id).fetch("id", nil) elsif /\A(?:(http|https):\/\/orcid\.org\/)?(\d{4}-\d{4}-\d{4}-\d{3}[0-9X]+)\z/.match(id) "orcid" else "schema_org" end end def find_from_format_by_string(string, options={}) if options[:ext] == ".bib" "bibtex" elsif Maremma.from_xml(string).dig("doi_records", "doi_record", "crossref") "crossref" elsif Maremma.from_xml(string).dig("resource", "xmlns") == "http://datacite.org/schema/kernel-4" "datacite" end end def write(id: nil, string: nil, from: nil, to: nil, **options) if from.present? p = case from when "crossref" then Crossref.new(id: id, string: string) when "datacite" then Datacite.new(id: id, string: string, schema_version: options[:schema_version]) when "bibtex" then Bibtex.new(string: string) else SchemaOrg.new(id: id) end puts p.send(to) else puts "not implemented" end end def orcid_from_url(url) Array(/\Ahttp:\/\/orcid\.org\/(.+)/.match(url)).last end def orcid_as_url(orcid) "http://orcid.org/#{orcid}" if orcid.present? end def validate_orcid(orcid) Array(/\A(?:http:\/\/orcid\.org\/)?(\d{4}-\d{4}-\d{4}-\d{3}[0-9X]+)\z/.match(orcid)).last end def validate_url(str) if /\A(?:(http|https):\/\/(dx\.)?doi.org\/)?(doi:)?(10\.\d{4,5}\/.+)\z/.match(str) "DOI" elsif /\A(http|https):\/\//.match(str) "URL" end end def parse_attributes(element) if element.is_a?(String) element elsif element.is_a?(Hash) element.fetch("__content__", nil) elsif element.is_a?(Array) element.map { |e| e.fetch("__content__", nil) } else nil end end def parse_attribute(element) if element.is_a?(String) element elsif element.is_a?(Hash) element.fetch("__content__", nil) elsif element.is_a?(Array) element.first.fetch("__content__", nil) else nil end end def normalize_id(id) return nil unless id.present? normalize_doi(id) || Addressable::URI.parse(id).host && PostRank::URI.clean(id) end def normalize_orcid(orcid) orcid = validate_orcid(orcid) return nil unless orcid.present? # turn ORCID ID into URL "http://orcid.org/" + Addressable::URI.encode(orcid) end def normalize_ids(list) Array.wrap(list).map { |url| url.merge("@id" => normalize_id(url["@id"])) } end end end