-
Notifications
You must be signed in to change notification settings - Fork 11
/
Copy pathfile-remove-duplicates
executable file
·62 lines (54 loc) · 1.3 KB
/
file-remove-duplicates
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
#!/usr/bin/env perl
use v5.12;
use strict;
use warnings;
use Digest::SHA;
use File::Next;
use Getopt::Long qw(GetOptions);
# Compute the SHA-512 digest of a file's contents.
#
# $file - path of the file to hash; it is passed to Digest::SHA's addfile
#         with mode 'b'.
#
# Returns the digest as a Base64-encoded string.
sub file_digest {
    my $path = shift;

    # addfile() returns the digest object itself, so the calls can be chained.
    return Digest::SHA->new("512")->addfile($path, 'b')->b64digest;
}
# Find files with identical content under the given directories and remove
# all but one copy of each.
#
# Arguments:
#   $opts - hashref of parsed options:
#             i   => arrayref of input paths; entries that are not
#                    directories are skipped with a warning
#             yes => true to actually delete; otherwise the duplicates are
#                    only listed
#   $args - arrayref of the remaining command-line arguments (unused)
#
# Files are first grouped by size so that only files sharing a size get
# hashed. Within a group the file with the shortest path is kept; every
# other file with the same digest is printed as "rm FILE; # dup: KEPT" and,
# when `yes` is set, unlinked.
#
# Returns 0.
sub main {
    my ($opts, $args) = @_;

    require Cwd;    # core module, loaded locally to resolve real paths

    my @input;
    for my $dir (@{ $opts->{i} // [] }) {
        if (-d $dir) {
            push @input, $dir;
        } else {
            warn "Skipping '$dir': not a directory\n";
        }
    }
    if (!@input) {
        warn "No input directories given (use -i DIR)\n";
        return 0;
    }

    # Index candidate files by size. Each file is tracked by its resolved
    # path so that overlapping or repeated -i directories, or symlinks,
    # cannot make one file look like a duplicate of itself -- which would
    # otherwise delete the only copy when `yes` is set.
    my %files_of_size;
    my %seen;
    my $iter = File::Next::files(@input);
    while (defined( my $file = $iter->() )) {
        my $size = (stat($file))[7];
        if (!defined $size) {
            warn "Skipping '$file': cannot stat: $!\n";
            next;
        }
        my $real = eval { Cwd::realpath($file) } // $file;
        next if $seen{$real}++;
        push @{ $files_of_size{$size} }, $file;
    }

    # Sizes are visited in numeric order so the output is reproducible.
    for my $size (sort { $a <=> $b } keys %files_of_size) {
        my @files = @{ $files_of_size{$size} };

        # A file whose size is unique cannot have a duplicate: skip hashing.
        next unless @files > 1;

        my %kept_for;    # digest => path of the copy that is kept
        my @to_be_deleted;

        # Shortest path wins; ties are broken by name so the choice does not
        # depend on directory read order.
        for my $f (sort { length($a) <=> length($b) or $a cmp $b } @files) {
            # file_digest dies on unreadable files; skip those instead of
            # aborting the whole run.
            my $d = eval { file_digest($f) };
            if (!defined $d) {
                my $err = $@ || "unknown error\n";
                warn "Skipping '$f': cannot compute digest: $err";
                next;
            }
            if (exists $kept_for{$d}) {
                push @to_be_deleted, $f;
                say "rm $f; # dup: $kept_for{$d}";
            } else {
                $kept_for{$d} = $f;
            }
        }

        next unless @to_be_deleted;

        if ($opts->{yes}) {
            for my $f (@to_be_deleted) {
                unlink($f) or warn "Could not remove '$f': $!\n";
            }
        } else {
            say "Not removing anything without `--yes`";
        }
        say "";
    }

    return 0;
}
# Command-line entry point.
#   -i DIR     directory to scan for duplicates; may be given several times
#   --yes, -y  actually delete the duplicates instead of only listing them
my %opts;
GetOptions(
    \%opts,
    'i=s@',
    'yes|y',
) or die "Usage: $0 -i DIR [-i DIR ...] [--yes]\n";

# Use main's return value as the process exit status.
exit main(\%opts, [@ARGV]);