let fsck ignore the recent files
[rersyncrecent.git] / bin / rrr-fsck
blobb413a518f11006d4142657d1e39344c5489939c4
1 #!/usr/bin/perl
3 =head1 NAME
5 rrr-fsck - compare disk contents with index contents
7 =head1 SYNOPSIS
9 rrr-fsck [options] principalfile
11 =head1 OPTIONS
13 =over 8
15 =cut
# Collect the option specifications straight from the POD: the here-doc
# swallows every following line up to the one reading "=back", and the
# global match returns the text inside each B<--...> item as a list.
17 my @opt = <<'=back' =~ /B<--(\S+)>/g;
19 =item B<--dry-run|n>
21 Does nothing, only prints what it would do.
23 =item B<--help|h>
25 Prints a brief message and exits.
27 =item B<--remoteroot=s>
29 If provided fsck will try to mirror missing files from this location.
30 For remote locations requiring authentication you may need to set the
31 environment variables USER and RSYNC_PASSWORD as well.
33 =item B<--verbose|v+>
35 More feedback.
37 =item B<--yes|y>
39 Consider all answers to asked questions to be I<yes>.
41 =back
43 =head1 DESCRIPTION
45 Compares disk contents with index contents and gathers files missing
46 on local disk and files missing in local index.
48 If remoteroot is given missing files are fetched from remote.
50 If remoteroot is given, files on the local disk that have no counterpart
51 in the index are considered obsolete and the user is asked for each file
52 whether it should be deleted; if the user confirms, it is deleted. Without remoteroot such files are added to the index instead.
54 =head1 BUGS
56 There is a race condition when the tree or the index is manipulated
57 while we are running. This implies that the result is only 100%
58 correct if disk and index are not changed while we are running.
60 There should be an option to declare the files on disk authoritative
61 so that they are added to the index.
63 =cut
66 use strict;
67 use warnings;
69 use lib "/home/k/sources/rersyncrecent/lib";
71 use File::Basename qw(dirname);
72 use File::Find qw(find);
73 use ExtUtils::MakeMaker qw(prompt);
74 use File::Rsync::Mirror::Recent;
75 use File::Spec;
76 use Getopt::Long;
77 use List::Util qw(max);
78 use Pod::Usage qw(pod2usage);
79 use Time::HiRes qw(time sleep);
# Parse the command line into %Opt, using the option specifications held
# in @opt. A parse error prints the usage and exits with status 1.
our %Opt;
GetOptions(\%Opt, @opt)
    or pod2usage(1);

# --help: print the usage and exit with status 0.
pod2usage(0) if $Opt{help};

# Exactly one positional argument is required.
pod2usage(1) unless @ARGV == 1;
# The single positional argument names the principal file; its directory
# is handed to the mirror object as the local root.
my($principal) = @ARGV;
my $recc = File::Rsync::Mirror::Recent->new(
    local     => $principal,
    localroot => dirname($principal),
);

# Forward the options the mirror object has accessors of the same name
# for, but only when they were given (and true) on the command line.
for my $passthrough (qw(remoteroot verbose)) {
    my $opt = $Opt{$passthrough} or next;
    $recc->$passthrough($opt);
}

my $root = $recc->localroot;
defined $root or die "Alert: Root not defined, giving up";

my $prf = $recc->principal_recentfile;
my $filenameroot = $prf->filenameroot;
my $serializer_suffix = $prf->serializer_suffix;

# Names (relative to $root) that the disk scan must not count:
#   <filenameroot>-<digits><one of smhdWMQYZ><suffix>
#   the same name followed by ".lock", optionally with anything below it
#   <filenameroot>.recent
my $ignore_rx = qr((?x:
  ^ \Q$filenameroot\E (?: - [0-9]*[smhdWMQYZ] \Q$serializer_suffix\E (?: \.lock (?: /.* )? )? | \.recent ) \z
  ));
# Walk the tree below $root and record every plain file and symlink in
# %diskfiles (full path => mtime as reported by lstat). Names matching
# $ignore_rx are skipped. With --verbose a progress line is rewritten in
# place, at most about six times per second.
my %diskfiles;
# Start the counter at 0: if the scan counts nothing, the summary printf
# below would otherwise receive undef and emit an "uninitialized" warning.
my $i = 0;
my $last_verbosity = 0;
$|=1;   # unbuffered STDOUT so the "\r" progress line shows up immediately
if ($Opt{verbose}) {
    print "\n";
}
find({
      wanted => sub {
          my @lstat = lstat $_;
          # "_" reuses the result of the lstat above
          return unless -l _ or -f _;
          # path relative to $root, used only for the ignore check
          my($reportname) = $File::Find::name =~ m{^\Q$root\E/*(.*)};
          return if $reportname =~ $ignore_rx;
          $i++;
          if ($Opt{verbose} && time - $last_verbosity > 0.166666) {
              printf "\r%8d files and symlinks checked on disk ", $i;
              $last_verbosity = time;
          }
          $diskfiles{$File::Find::name} = $lstat[9];
      },
      # no chdir into each directory, so $_ holds the same path as
      # $File::Find::name
      no_chdir => 1,
     },
     $root
    );
if ($Opt{verbose}) {
    printf "\r%8d files and symlinks checked on disk\n", $i;
}
# The counter is reused for the index progress display.
$i = 0;
# Read the events from the index via news(). With --verbose a callback is
# passed along that receives an array reference, stores its current size
# in $i and prints it, at most about six times per second.
my @newsargs = ();
if ($Opt{verbose}) {
    print "\rChecking index";
    @newsargs = (
        callback => sub {
            my($entries) = @_;
            $i = scalar @$entries;
            if (time - $last_verbosity > 0.166666) {
                printf "\r%8d entries read from index ", $i;
                $last_verbosity = time;
            }
        },
    );
}
my $indexfiles = $recc->news(@newsargs);
if ($Opt{verbose}) {
    my $entries_read = scalar @$indexfiles;
    printf "\r%8d entries read from index\n", $entries_read;
}
# Reduce the event list to the set of files the index claims to exist:
# for each path only the first event in the list returned by news() is
# considered, and it counts only if it is a "new" event. Keys are full
# paths ("$root/<path>"), values the epoch recorded in the index.
my %seen;
my %indexfiles =
    map  { ("$root/$_->{path}" => $_->{epoch}) }
    grep { !$seen{$_->{path}}++ && $_->{type} eq "new" }
    @$indexfiles;
# Every recentfile must be present on disk, but the recentfiles are NOT
# entered into %indexfiles. The disk scan leaves out names matching
# $ignore_rx, so an entry made here could never find its counterpart in
# %diskfiles and each recentfile would be reported as missing on disk on
# every run (and then be fetched or queued for removal from the index).
for my $rf (@{$recc->recentfiles}) {
    my $rfrfile = $rf->rfile;
    stat($rfrfile) or die "Could not stat '$rfrfile': $!";
}
if ($Opt{verbose}) {
    printf "\r%8d file objects found in index\n", scalar keys %indexfiles;
}
# Report the size of both sets. The field width is the number of digits
# of the larger of the raw event count and the number of files on disk.
my $n_diskfiles  = keys %diskfiles;
my $n_indexfiles = keys %indexfiles;
my $sprintfd = length(max(scalar @$indexfiles, $n_diskfiles));
warn sprintf(
    "diskfiles: %*d\n" .
    "indexfiles: %*d\n",
    $sprintfd, $n_diskfiles,
    $sprintfd, $n_indexfiles,
);

# Index entries without a file on disk, highest index epoch first.
my @diskmisses =
    sort { $indexfiles{$b} <=> $indexfiles{$a} }
    grep { !exists $diskfiles{$_} }
    keys %indexfiles;

# Files on disk without an index entry, lowest mtime first.
my @indexmisses =
    sort { $diskfiles{$a} <=> $diskfiles{$b} }
    grep { !exists $indexfiles{$_} }
    keys %diskfiles;

warn sprintf(
    "missing on disk: %*d\n" .
    "missing in index: %*d\n",
    $sprintfd, scalar @diskmisses,
    $sprintfd, scalar @indexmisses,
);
# Debugger hook: a true $DB::single makes "perl -d" stop at the next
# statement; it has no effect outside the debugger.
$DB::single++;
my $rf = $recc->principal_recentfile;
# Not read by any active code in this script; kept from a per-file
# update/aggregate variant that is disabled.
my $last_aggregate_call = time;
# Index changes are queued here and applied later in one go.
my @batch;

# Index entries whose file is missing on disk:
#   --dry-run      only say what would happen
#   --remoteroot   fetch the file through the principal recentfile
#   otherwise      queue a "delete" event for the index
for my $dm (@diskmisses) {
    if ($Opt{"dry-run"}) {
        warn $Opt{remoteroot}
            ? "Would fetch $dm\n"
            : "Would remove from indexfile $dm\n";
        next;
    }
    if ($Opt{remoteroot}) {
        # cut off "$root" plus one separator character to get the
        # path relative to the root
        $rf->get_remotefile(substr($dm, 1 + length $root));
        next;
    }
    warn "Removing from indexfile: $dm\n";
    push @batch, {path => $dm, type => "delete"};
}
# Files on disk that the index does not know about:
#   --dry-run      only say what would happen
#   --remoteroot   offer to unlink the file (--yes answers "y" without
#                  asking; the prompt's default answer is "y" as well)
#   otherwise      queue a "new" event carrying the file's mtime
for my $im (@indexmisses) {
    if ($Opt{"dry-run"}) {
        if ($Opt{remoteroot}) {
            warn "Would remove $im\n";
        } else {
            warn "Would add to indexfile $im\n";
        }
    } elsif ($Opt{remoteroot}) {
        my $ans;
        if ($Opt{yes}) {
            warn "Going to unlink '$im'\n";
            $ans = "y";
        } else {
            $ans = prompt("Unlink '$im'?", "y");
        }
        if ($ans =~ /^y/i) {
            unlink $im or die "Could not unlink '$im': $!";
        }
    } else {
        # Stat before announcing anything: a file that cannot be
        # stat'ed is skipped, and the skip is reported with its reason
        # rather than after a misleading "Adding" message.
        my @stat = stat $im;
        unless (@stat) {
            warn "Skipping '$im', could not stat it: $!\n";
            next;
        }
        warn "Adding to indexfile: $im\n";
        push @batch, {epoch => $stat[9], path => $im, type => "new"};
    }
}
# Hand all queued index changes to the principal recentfile in a single
# call; nothing happens in dry-run mode or when the queue is empty.
if (!$Opt{"dry-run"} && @batch) {
    $rf->batch_update(\@batch);
}
249 __END__
252 # Local Variables:
253 # mode: cperl
254 # coding: utf-8
255 # cperl-indent-level: 4
256 # End: