Sha256: adb3aa5b1d4e2af555b1b9e178c415197fdbcfe6cbec3b03dd284d9e506eedfc
Contents?: true
Size: 1.7 KB
Versions: 1
Compression:
Stored size: 1.7 KB
Contents
require 'csv'

# Cevennes computes a row-by-row diff between two CSV documents, pairing
# rows through the value found in a shared "id" column.
module Cevennes

  VERSION = '0.10.0'

  # Source encodings tried, in order, when converting input to UTF-8.
  #
  # NOTE(review): ISO-8859-1 appears to map every byte, so the trailing
  # UTF-8 entry looks unreachable and UTF-8 input containing multi-byte
  # characters is read as Windows-1252. The order is kept as is for
  # backward compatibility -- confirm whether this is intended.
  ENCODINGS = %w[ Windows-1252 ISO-8859-1 UTF-8 ].freeze

  class << self

    # Diffs two CSV documents.
    #
    # Each diff entry has the shape `[ op, lnum0, row0, lnum1, row1 ]`:
    #
    # * `'='` row present in both and identical (`row1` is nil)
    # * `'!'` row present in both but different
    # * `'-'` row only in csv0 (`lnum1` is -1, `row1` is nil)
    # * `'+'` row only in csv1 (`lnum0` is -1, `row0` is nil)
    #
    # @param id [String] header cell naming the column used to pair rows
    # @param csv0 [String] the "before" CSV text (not modified)
    # @param csv1 [String] the "after" CSV text (not modified)
    # @return [Array] `[ 'keys', header0, header1 ]`, then
    #   `[ 'stats', counts ]`, then the diff entries; `counts` maps each
    #   op to its number of occurrences, plus 'l0' and 'l1', the number of
    #   keyed rows in csv0 and csv1
    # @raise [ArgumentError] when no row of a document contains `id`
    def diff(id, csv0, csv1)

      h0 = index_rows(id, csv0)
      h1 = index_rows(id, csv1)

      ks0 = h0.delete(:keys)
      ks1 = h1.delete(:keys)

      d = h0.map do |k, v|
        v1 = h1[k]
        if v1.nil?
          [ '-', *v, -1, nil ]
        elsif v1[1] == v[1]
          # Report the row's position in csv1 (not csv0): the insertion
          # of '+' entries below orders itself on this csv1 line number.
          [ '=', *v, v1[0], nil ]
        else
          [ '!', *v, *v1 ]
        end
      end

      # Slot each added row in front of the first entry that sits further
      # down in csv1. Walking the additions backwards keeps consecutive
      # additions in ascending order.
      (h1.keys - h0.keys)
        .map { |k| h1[k] }
        .reverse_each do |lnum, line|
          i = d.index { |_, _, _, l1, _| l1 > lnum } || d.length
          d.insert(i, [ '+', -1, nil, lnum, line ])
        end

      s = d.each_with_object({}) { |(op, *), h| h[op] = (h[op] || 0) + 1 }

      # :keys has already been removed from both hashes, so their lengths
      # are exactly the keyed row counts (no further adjustment needed).
      s['l0'] = h0.length
      s['l1'] = h1.length

      [ [ 'keys', ks0, ks1 ], [ 'stats', s ] ] + d
    end

    protected

    # Parses `csv` and indexes its rows by the value of the `id` column.
    #
    # Blank rows are ignored, as is everything before the first row that
    # contains `id` (that row is the header). Rows with at most one
    # non-nil cell, or with a nil id cell, are skipped. When an id value
    # repeats, the last row wins.
    #
    # (Deliberately not named `hash`: that would shadow `Object#hash` on
    # the module and break e.g. using `Cevennes` as a Hash key.)
    #
    # @param id [String] header cell naming the id column
    # @param csv [String] raw CSV text
    # @return [Hash] `{ keys: [ lnum, header_row ], id => [ lnum, row ] }`
    #   where `lnum` is the 1-based index of the parsed row
    # @raise [ArgumentError] when the text cannot be reencoded or when no
    #   row contains `id`
    def index_rows(id, csv)

      text = reencode(csv)
      raise ArgumentError, 'could not reencode CSV data to UTF-8' unless text

      rows = ::CSV.parse(text)
        .each_with_index.map { |row, i| [ i + 1, row ] }
        .reject { |_, row| row.compact.empty? }
        .drop_while { |_, row| !row.include?(id) }

      header = rows.first
      raise ArgumentError, "id column #{id.inspect} not found in CSV" unless header

      idi = header[1].index(id)

      rows.drop(1).each_with_object({ keys: header }) do |(lnum, row), h|
        next unless row.compact.length > 1
        k = row[idi]
        h[k] = [ lnum, row ] if k
      end
    end

    #def deflate(row)
    #  ::CSV.generate(encoding: 'UTF-8') { |csv| csv << row }.strip
    #end

    # Returns a UTF-8 copy of `s`, interpreting its bytes with the first
    # of ENCODINGS that transcodes cleanly.
    #
    # Works on a copy so that the caller's string keeps its encoding and
    # frozen strings are accepted.
    #
    # @param s [String] raw text
    # @return [String, nil] the UTF-8 text, or nil if no encoding fits
    def reencode(s)

      #s = unzip(s) if s[0, 2] == 'PK'
        # no dependency on rubyzip

      ENCODINGS.each do |e|
        begin
          return s.dup.force_encoding(e).encode('UTF-8')
        rescue EncodingError
          next
        end
      end

      nil
    end
  end
end
Version data entries
1 entries across 1 versions & 1 rubygems
Version | Path |
---|---|
cevennes-0.10.0 | lib/cevennes.rb |