dfm 0.0.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +15 -0
- data/LICENSE +21 -0
- data/README.md +4 -0
- data/bin/dfm +43 -0
- data/lib/dfm.rb +76 -0
- data/lib/dfm/version.rb +6 -0
- metadata +49 -0
checksums.yaml
ADDED
@@ -0,0 +1,15 @@
|
|
1
|
+
---
|
2
|
+
!binary "U0hBMQ==":
|
3
|
+
metadata.gz: !binary |-
|
4
|
+
YTg4NWZlYWEwYWMxZTI4ZmE3YmUwZTljYzVjNmI3NTljZjBhYTQ2MA==
|
5
|
+
data.tar.gz: !binary |-
|
6
|
+
NjhjOTFjNGM4NTBjZTc3YmM5NmU4NTE2ZWM1NjI5YjMxODNlOGJhMA==
|
7
|
+
SHA512:
|
8
|
+
metadata.gz: !binary |-
|
9
|
+
ZmU2ZTZjMDBkMjAzYmJiMTcxNjhkMmE5YmFiZTViNzRkZTUwNmY0MjEzOGI2
|
10
|
+
M2U3NDY5NGI4ZGNiMmMwODgxOTU3MDM5NWVhZDQ2MzE1YzY1ZTJkNjZkZWE2
|
11
|
+
ZDRmN2RiY2EyZmJlNmZkYWI1NWI2MmU4YWRmOWUzYTYyZDY2ZDU=
|
12
|
+
data.tar.gz: !binary |-
|
13
|
+
NTIzZmNiZjczZmQxNmQ0NTEzOGU1NDM0Y2Y0ZDcxMjVkZjJjNTkyNDdkYzBi
|
14
|
+
MWE2YjhkM2I0MTNkOTZjYWZjZmJmYTEzYmVkNDg2MmY2YTM0OGE1NjhhMGYw
|
15
|
+
ODliNWE1Njg0NzM2ODU5ZWUyMWI1YmFiZmQyZTAyYWI4YzYyMDg=
|
data/LICENSE
ADDED
@@ -0,0 +1,21 @@
|
|
1
|
+
The MIT License (MIT)
|
2
|
+
|
3
|
+
Copyright (c) 2014 Daniel P. Clark
|
4
|
+
|
5
|
+
Permission is hereby granted, free of charge, to any person obtaining a copy
|
6
|
+
of this software and associated documentation files (the "Software"), to deal
|
7
|
+
in the Software without restriction, including without limitation the rights
|
8
|
+
to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
|
9
|
+
copies of the Software, and to permit persons to whom the Software is
|
10
|
+
furnished to do so, subject to the following conditions:
|
11
|
+
|
12
|
+
The above copyright notice and this permission notice shall be included in all
|
13
|
+
copies or substantial portions of the Software.
|
14
|
+
|
15
|
+
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
16
|
+
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
17
|
+
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
|
18
|
+
AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
19
|
+
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
|
20
|
+
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
|
21
|
+
SOFTWARE.
|
data/README.md
ADDED
data/bin/dfm
ADDED
@@ -0,0 +1,43 @@
|
|
1
|
+
#!/usr/bin/env ruby
|
2
|
+
|
3
|
+
begin
|
4
|
+
require 'dfm'
|
5
|
+
rescue LoadError
|
6
|
+
require 'rubygems'
|
7
|
+
require 'dfm'
|
8
|
+
end
|
9
|
+
require 'optparse'
|
10
|
+
|
11
|
+
|
12
|
+
options = {}
|
13
|
+
printers = Array.new
|
14
|
+
|
15
|
+
OptionParser.new do |opts|
|
16
|
+
opts.banner = "Usage: dfm [options] [path]\nDefaults: dfm -x -d ." + File::SEPARATOR
|
17
|
+
opts.on("-f", "--filters FILTERS", Array, "File extension filters") do |filters|
|
18
|
+
options[:filters] = filters
|
19
|
+
end
|
20
|
+
opts.on("-x", "--duplicates-hex", "Prints duplicate files by MD5 hexdigest") do |dh|
|
21
|
+
printers << "dh"
|
22
|
+
end
|
23
|
+
opts.on("-d", "--duplicates-name", "Prints duplicate files by file name") do |dh|
|
24
|
+
printers << "dn"
|
25
|
+
end
|
26
|
+
opts.on("-s", "--singles-hex", "Prints non-duplicate files by MD5 hexdigest") do |dh|
|
27
|
+
printers << "sh"
|
28
|
+
end
|
29
|
+
opts.on("-n", "--singles-name", "Prints non-duplicate files by file name") do |dh|
|
30
|
+
printers << "sn"
|
31
|
+
end
|
32
|
+
end.parse!
|
33
|
+
path = ARGV.select {|i| File.directory? i }[0]
|
34
|
+
program = DFM.new( options.update( { :path => path } ) )
|
35
|
+
if printers.empty?
|
36
|
+
program.print_duplicates
|
37
|
+
program.print_duplicates( "name" )
|
38
|
+
else
|
39
|
+
if printers.include? "dh"; program.print_duplicates; end
|
40
|
+
if printers.include? "dn"; program.print_duplicates( "name" ); end
|
41
|
+
if printers.include? "sh"; program.print_singles; end
|
42
|
+
if printers.include? "sn"; program.print_singles( "name" ); end
|
43
|
+
end
|
data/lib/dfm.rb
ADDED
@@ -0,0 +1,76 @@
|
|
1
|
+
require 'digest'
|
2
|
+
require 'json'
|
3
|
+
require 'dfm/version'
|
4
|
+
|
5
|
+
class DFM
|
6
|
+
attr_accessor :filters
|
7
|
+
|
8
|
+
def initialize( params = {} )
|
9
|
+
@files_by_hexdigest = {}
|
10
|
+
@files_by_name = {}
|
11
|
+
@filters = Array( params.fetch( :filters, nil ) )
|
12
|
+
@path = ( ( params.fetch( :path, '.' ) ) || '.' ) + File::SEPARATOR
|
13
|
+
@hashFunc = Digest::MD5.new
|
14
|
+
recurse_path( @path )
|
15
|
+
end
|
16
|
+
|
17
|
+
def print_singles( opt = "hex" )
|
18
|
+
print_match( { :type => opt, :duplicates => false } )
|
19
|
+
end
|
20
|
+
|
21
|
+
def print_duplicates( opt = "hex" )
|
22
|
+
print_match( { :type => opt } )
|
23
|
+
end
|
24
|
+
|
25
|
+
def hex( duplicates = true )
|
26
|
+
select_duplicates( { :hash => @files_by_hexdigest, :duplicates => duplicates } )
|
27
|
+
end
|
28
|
+
|
29
|
+
def name( duplicates = true )
|
30
|
+
select_duplicates( { :hash => @files_by_name, :duplicates => duplicates } )
|
31
|
+
end
|
32
|
+
|
33
|
+
def recurse( path )
|
34
|
+
@files_by_hexdigest = {}
|
35
|
+
@files_by_name = {}
|
36
|
+
recurse_path( path )
|
37
|
+
end
|
38
|
+
|
39
|
+
private
|
40
|
+
|
41
|
+
def insert_file( file )
|
42
|
+
# hex
|
43
|
+
file_io = File.open( file, "rb" ) { |io| io.read }
|
44
|
+
hex_file = @hashFunc.hexdigest( file_io )
|
45
|
+
@files_by_hexdigest[ hex_file ] = Array( @files_by_hexdigest[ hex_file ] ) << file
|
46
|
+
# name
|
47
|
+
@files_by_name[ File.basename( file ) ] = Array( @files_by_name[ File.basename( file ) ] ) << file
|
48
|
+
end
|
49
|
+
|
50
|
+
def recurse_path( path = @path )
|
51
|
+
@filters.empty? ? ( filters = "" ) : ( filters = @filters.join( "," ).prepend( ".{" ).<<( "}" ) )
|
52
|
+
Dir.glob( path + '**' + File::SEPARATOR + '*' + filters ).each { |file|
|
53
|
+
if File.file? file
|
54
|
+
insert_file file
|
55
|
+
end
|
56
|
+
}
|
57
|
+
end
|
58
|
+
|
59
|
+
def select_duplicates( opt = { :hash => @files_by_hexdigest, :duplicates => true } )
|
60
|
+
if opt[ :duplicates ]
|
61
|
+
opt[ :hash ].select { |k,v| v.length > 2 }
|
62
|
+
else
|
63
|
+
opt[ :hash ].select { |k,v| v.length == 1 }
|
64
|
+
end
|
65
|
+
end
|
66
|
+
|
67
|
+
def print_match( opt = { :type => "hex", :duplicates => true } )
|
68
|
+
if !!opt[ :type ][ "hex" ] or !!opt[ :type ][ "name" ]
|
69
|
+
print_json send( opt[ :type ], *Array( opt[ :duplicates ] ) )
|
70
|
+
end
|
71
|
+
end
|
72
|
+
|
73
|
+
def print_json( hash )
|
74
|
+
puts JSON.pretty_generate( hash )
|
75
|
+
end
|
76
|
+
end
|
data/lib/dfm/version.rb
ADDED
metadata
ADDED
@@ -0,0 +1,49 @@
|
|
1
|
+
--- !ruby/object:Gem::Specification
|
2
|
+
name: dfm
|
3
|
+
version: !ruby/object:Gem::Version
|
4
|
+
version: 0.0.1
|
5
|
+
platform: ruby
|
6
|
+
authors:
|
7
|
+
- Daniel P. Clark / 6ftDan(TM)
|
8
|
+
autorequire:
|
9
|
+
bindir: bin
|
10
|
+
cert_chain: []
|
11
|
+
date: 2014-06-16 00:00:00.000000000 Z
|
12
|
+
dependencies: []
|
13
|
+
description: Parse duplicate files to process!
|
14
|
+
email: webmaster@6ftdan.com
|
15
|
+
executables:
|
16
|
+
- dfm
|
17
|
+
extensions: []
|
18
|
+
extra_rdoc_files: []
|
19
|
+
files:
|
20
|
+
- LICENSE
|
21
|
+
- README.md
|
22
|
+
- bin/dfm
|
23
|
+
- lib/dfm.rb
|
24
|
+
- lib/dfm/version.rb
|
25
|
+
homepage: https://github.com/danielpclark/dfm
|
26
|
+
licenses:
|
27
|
+
- The MIT License (MIT)
|
28
|
+
metadata: {}
|
29
|
+
post_install_message:
|
30
|
+
rdoc_options: []
|
31
|
+
require_paths:
|
32
|
+
- lib
|
33
|
+
required_ruby_version: !ruby/object:Gem::Requirement
|
34
|
+
requirements:
|
35
|
+
- - ! '>='
|
36
|
+
- !ruby/object:Gem::Version
|
37
|
+
version: '0'
|
38
|
+
required_rubygems_version: !ruby/object:Gem::Requirement
|
39
|
+
requirements:
|
40
|
+
- - ! '>='
|
41
|
+
- !ruby/object:Gem::Version
|
42
|
+
version: '0'
|
43
|
+
requirements: []
|
44
|
+
rubyforge_project:
|
45
|
+
rubygems_version: 2.2.2
|
46
|
+
signing_key:
|
47
|
+
specification_version: 4
|
48
|
+
summary: Duplicate File Manager!
|
49
|
+
test_files: []
|