Sha256: ba4db21db58b490ee8c4acd49e70353a955a7fd2f53a44ab0fa1288ac10b3480

Contents?: true

Size: 826 Bytes

Versions: 46

Compression:

Stored size: 826 Bytes

Contents

#!/usr/bin/env ruby

require 'utils'
include Utils::MD5

def find_same(*pathes)
  files = Hash.new { |h,k| h[k] = {} }
  Utils::Find.find(*pathes) do |filename|
    file_stat = File.stat(filename)
    if file_stat.file?
      size = file_stat.size
      $DEBUG and warn "Encountered '#{filename}' (#{size} bytes)."
      files[size][filename] = true
    end
  end

  files = files.inject({}) do |h, (_,fs)|
    keys = fs.keys
    if keys.size >= 2
      keys.each { |k| h[k] = true }
    end
    h
  end.keys

  md5s = Hash.new { |h,k| h[k] = [] }
  for filename in files
    md5sum = md5 filename
    md5s[md5sum] << filename
  end
  files = md5s.values
  files.reject! { |fs| fs.size < 2 }
  files
end

puts find_same(*ARGV).map { |fs| [ fs.size, fs ] }.sort.map { |c, fs|
  "#{c}\t#{fs.sort.map { |f| "'#{f}'" } * "\t"}"
}

Version data entries

46 entries across 46 versions & 1 rubygems

Version Path
utils-0.0.48 bin/same_files
utils-0.0.47 bin/same_files
utils-0.0.46 bin/same_files
utils-0.0.45 bin/same_files
utils-0.0.44 bin/same_files
utils-0.0.43 bin/same_files
utils-0.0.42 bin/same_files
utils-0.0.41 bin/same_files
utils-0.0.40 bin/same_files
utils-0.0.39 bin/same_files
utils-0.0.38 bin/same_files
utils-0.0.37 bin/same_files
utils-0.0.36 bin/same_files
utils-0.0.35 bin/same_files
utils-0.0.34 bin/same_files
utils-0.0.33 bin/same_files
utils-0.0.32 bin/same_files
utils-0.0.31 bin/same_files
utils-0.0.30 bin/same_files
utils-0.0.29 bin/same_files