# encoding: UTF-8 recent_ruby = RUBY_VERSION >= '1.9.1' raise "IMPORTANT: dwc-archive gem requires ruby >= 1.9.1" unless recent_ruby require 'fileutils' require 'ostruct' require 'digest' require 'csv' require 'logger' require 'nokogiri' require_relative 'dwc-archive/xml_reader' require_relative 'dwc-archive/ingester' require_relative 'dwc-archive/errors' require_relative 'dwc-archive/expander' require_relative 'dwc-archive/archive' require_relative 'dwc-archive/core' require_relative 'dwc-archive/extension' require_relative 'dwc-archive/metadata' require_relative 'dwc-archive/generator' require_relative 'dwc-archive/generator_meta_xml' require_relative 'dwc-archive/generator_eml_xml' require_relative 'dwc-archive/classification_normalizer' require_relative 'dwc-archive/version' class DarwinCore DEFAULT_TMP_DIR = "/tmp" attr_reader :archive, :core, :metadata, :extensions, :classification_normalizer alias :eml :metadata def self.nil_field?(field) return true if [nil, '', '/N'].include?(field) false end def self.clean_all(tmp_dir = DEFAULT_TMP_DIR) Dir.entries(tmp_dir).each do |entry| path = File.join(tmp_dir, entry) if FileTest.directory?(path) && entry.match(/^dwc_[\d]+$/) FileUtils.rm_rf(path) end end end def self.logger @@logger ||= Logger.new(nil) end def self.logger=(logger) @@logger = logger end def self.logger_reset self.logger = Logger.new(nil) end def self.logger_write(obj_id, message, method = :info) self.logger.send(method, "|%s|%s|" % [obj_id, message]) end def initialize(dwc_path, tmp_dir = DEFAULT_TMP_DIR) @dwc_path = dwc_path @archive = DarwinCore::Archive.new(@dwc_path, tmp_dir) @core = DarwinCore::Core.new(self) @metadata = DarwinCore::Metadata.new(@archive) @extensions = get_extensions end def file_name File.split(@dwc_path).last end def path File.expand_path(@dwc_path) end # generates a hash from a classification data with path to each node, # list of synonyms and vernacular names. def normalize_classification return nil unless has_parent_id? @classification_normalizer ||= DarwinCore::ClassificationNormalizer. new(self) @classification_normalizer.normalize end def has_parent_id? !!@core.fields.join('|').downcase.match(/highertaxonid|parentnameusageid/) end def checksum Digest::SHA1.hexdigest(open(@dwc_path).read) end private def get_extensions res = [] root_key = @archive.meta.keys[0] ext = @archive.meta[root_key][:extension] return [] unless ext ext = [ext] if ext.class != Array ext.map { |e| DarwinCore::Extension.new(self, e) } end end