/[BackupPC]/trunk/bin/BackupPC_incPartsUpdate
This is a repository of my old source code, which isn't updated any more. Go to git.rot13.org for current projects!
ViewVC logotype

Contents of /trunk/bin/BackupPC_incPartsUpdate

Parent Directory Parent Directory | Revision Log Revision Log


Revision 215 - (show annotations)
Sun Oct 16 16:18:12 2005 UTC (18 years, 7 months ago) by dpavlin
File size: 6284 byte(s)
 r8613@llin:  dpavlin | 2005-10-16 18:18:05 +0200
 use Archive::Tar::Streamed to prevent OOM killer when working with
 huge tars

1 #!/usr/local/bin/perl -w
2
3 use strict;
4 use lib "__INSTALLDIR__/lib";
5
6 use DBI;
7 use BackupPC::Lib;
8 use BackupPC::View;
9 use BackupPC::Attrib qw/:all/;
10 use Data::Dumper;
11 use Time::HiRes qw/time/;
12 use POSIX qw/strftime/;
13 use BackupPC::SearchLib;
14 use Cwd qw/abs_path/;
15 use File::Which;
16 use Archive::Tar::Streamed;
17 use Algorithm::Diff;
18 use Getopt::Std;
19
# ---- script setup ----
# Locate helper programs, parse command-line options, load the BackupPC
# configuration and connect to the search database. Any missing
# prerequisite is fatal.

# Directory this script lives in (with trailing slash); the
# BackupPC_tarIncCreate helper is expected to sit next to it.
my $path = abs_path($0);
$path =~ s#/[^/]+$#/#;
# plain concatenation, so $path keeps holding the directory only
my $tarIncCreate = $path . 'BackupPC_tarIncCreate';

die "can't find $tarIncCreate: $!\n" unless (-x $tarIncCreate);

# Full paths of the external tools, keyed by program name.
my $bin;
foreach my $c (qw/gzip split/) {
	$bin->{$c} = which($c) || die "$0 needs $c, install it\n";
}

# Options:
#   -c  force a content check of every archive against the database
#   -d  print debugging output to STDERR
my %opt;
getopts("cd", \%opt );

my $debug = $opt{d};
my $check = $opt{c};
print STDERR "NOTICE: tar archive check forced\n" if ($check);

# unbuffered output, so progress is visible while long commands run
$|=1;

my $start_t = time();

# strftime() pattern used by curr_time()
my $t_fmt = '%Y-%m-%d %H:%M:%S';

my $hosts;
my $bpc = BackupPC::Lib->new || die;
my %Conf = $bpc->Conf();
my $TopDir = $bpc->TopDir();
my $beenThere = {};

my $dsn = $Conf{SearchDSN} || die "Need SearchDSN in config.pl\n";
my $user = $Conf{SearchUser} || '';

# AutoCommit is off: the main loop commits explicitly after each backup.
my $dbh = DBI->connect($dsn, $user, "", { RaiseError => 1, AutoCommit => 0 });

# Directory holding the gzipped incremental archives.
my $tar_dir = $Conf{InstallDir}.'/'.$Conf{GzipTempDir};

die "problem with $tar_dir, check GzipTempDir in configuration\n" unless (-d $tar_dir && -w $tar_dir);
57
58 #---- subs ----
59
# Format a duration given in seconds as "MM:SS", prefixed with "<H>h" when
# it lasts an hour or more (e.g. 3723 -> "1h02:03").
#
# Hours are computed arithmetically instead of through gmtime(), so a
# duration of a day or more is reported in full (90000 -> "25h00:00")
# rather than wrapping around at 24 hours. Fractional seconds are
# truncated and negative values are treated as zero.
#
# Returns nothing (undef / empty list) when called without a defined value.
sub fmt_time {
	my $t = shift;
	return unless defined $t;

	my $secs = int($t);
	$secs = 0 if ($secs < 0);

	my $hh = int($secs / 3600);
	my $mm = int(($secs % 3600) / 60);
	my $ss = $secs % 60;

	my $out = "";
	$out .= "${hh}h" if ($hh);
	$out .= sprintf("%02d:%02d", $mm, $ss);
	return $out;
}
68
# Return the current local time as a string, formatted according to the
# file-level $t_fmt strftime() pattern.
sub curr_time {
	my @now = localtime();
	return strftime($t_fmt, @now);
}
72
# Re-assemble a split archive in place.
#
# $filename is expected to be a directory holding the pieces of an archive
# in files named part*. The pieces are concatenated into "$filename.tmp",
# the directory is removed, and the temporary file is moved to $filename,
# so that on success $filename is a single regular file.
#
# Both paths are single-quoted for the shell, so names containing spaces
# or shell metacharacters can neither break the command nor redirect the
# `rm -Rf` to an unintended target.
#
# Dies if the shell command exits with a non-zero status.
sub tar_join($) {
	my $filename = shift;

	my $in = my $out = $filename;
	$out .= '.tmp';

	# quote a string so /bin/sh treats it as one literal word
	my $sh_quote = sub {
		my $word = shift;
		$word =~ s/'/'\\''/g;
		return "'$word'";
	};
	my ($q_in, $q_out) = map { $sh_quote->($_) } ($in, $out);

	# The part* glob stays outside the quotes so the shell still expands it.
	# The shell expands it in lexical order; the main loop creates the parts
	# with fixed-width numeric suffixes (split -d -a), which keeps that
	# order correct.
	# FIXME I should really order parts manually!
	system("cat $q_in/part* > $q_out && rm -Rf $q_in && mv $q_out $q_in") == 0
		or die "can't join $in: $?";

}
83
# Verify that a gzipped tar archive contains exactly the files recorded in
# the database for one backup.
#
# Arguments:
#   $host, $share, $num - identify the backup (host name, share name,
#                         backup number) looked up in the files table
#   $filename           - path of the gzipped tar archive; if it is a
#                         directory of split parts it is joined first
#
# Returns 1 when the sorted list of archive member names equals the sorted
# list of database paths, 0 otherwise. Differences are printed to STDOUT
# as "< name" (archive only) and "> name" (database only).
#
# Dies if gzip cannot be started or a database row has no path.
sub tar_check($$$$) {
	my ($host,$share,$num,$filename) = @_;

	if ($debug) {
		print STDERR " {{ CHECK: ${host}:${share}#${num} and $filename";
	} else {
		print " check";
	}

	if (-d $filename) {
		print STDERR ", joining";
		tar_join($filename);
	}

	print STDERR ", opening" if ($debug);
	# List-form pipe open: gzip is run directly, without a shell, so the
	# file name is passed verbatim whatever characters it contains.
	open(my $fh, '-|', 'gzip', '-cd', $filename) or die "can't open $filename: $!";
	binmode($fh);
	my $tar = Archive::Tar::Streamed->new($fh);

	print STDERR ", tar" if ($debug);
	# Only the member names are kept; entries are read one at a time so a
	# huge archive never has to fit in memory.
	my @tar_files;
	while(my $entry = $tar->next) {
		push @tar_files, $entry->name;
	}
	# Reap gzip now. Its exit status is deliberately not checked: a damaged
	# or truncated archive shows up as a difference in the comparison below.
	close($fh);

	@tar_files = sort @tar_files;
	print STDERR " ",scalar(@tar_files), " files" if ($debug);

	print STDERR ", database" if ($debug);

	my $sth = $dbh->prepare(qq{
		SELECT path,type
		FROM files
		JOIN shares on shares.id = shareid
		JOIN hosts on hosts.id = shares.hostid
		WHERE hosts.name = ? and shares.name = ? and backupnum = ?
	});
	$sth->execute($host, $share, $num);
	my @db_files;
	while( my $row = $sth->fetchrow_hashref ) {

		my $path = $row->{'path'} || die "no path?";
		# rewrite database paths into the form compared against tar member
		# names: leading "/" becomes "./", directories get a trailing "/"
		$path =~ s#^/#./#;
		$path .= '/' if ($row->{'type'} == BPC_FTYPE_DIR);
		push @db_files, $path;
	}

	print STDERR " ",scalar(@db_files), " files, diff" if ($debug);

	@db_files = sort @db_files;

	my $same = 1;
	if (scalar(@tar_files) != scalar(@db_files)) {
		# different number of entries: no need for a detailed diff
		$same = 0;
		print STDERR " NUMBER" if ($debug);
	} else {
		my $diff = Algorithm::Diff->new(\@tar_files, \@db_files);
		while ( $diff->Next() ) {
			next if $diff->Same();
			$same = 0;
			print "< $_\n" for $diff->Items(1);
			print "> $_\n" for $diff->Items(2);
		}
	}

	print STDERR " ",($same ? 'ok' : 'DIFFERENT');
	print STDERR " }} " if ($debug);

	return $same;
}
153
154
155 #----- main
156
# Walk over every backup whose incremental archive is not marked as
# deleted (oldest first), (re)create its gzipped tar archive when needed,
# split or join it according to MaxArchiveSize, and record the resulting
# size and number of parts in the database.
my $sth = $dbh->prepare( qq{

	select
		backups.id	as backup_id,
		hosts.name	as host,
		shares.name	as share,
		backups.num	as num,
		inc_size,
		parts
	from backups
		join shares on backups.hostid = shares.hostid
			and shares.id = backups.shareid
		join hosts on shares.hostid = hosts.id
	where not inc_deleted
	order by backups.date

} );

my $sth_inc_size = $dbh->prepare(qq{ update backups set inc_size = ?, parts = ? where id = ? });
my $sth_inc_deleted = $dbh->prepare(qq{ update backups set inc_deleted = ? where id = ? });

# hand the loaded configuration to the SearchLib helpers used below
%BackupPC::SearchLib::Conf = %Conf;

# quote a string so /bin/sh treats it as one literal word
my $sh_quote = sub {
	my $word = shift;
	$word =~ s/'/'\\''/g;
	return "'$word'";
};

$sth->execute();
# NOTE: DBI does not guarantee rows() for SELECT statements before all
# rows have been fetched; it is used here for the progress counter only.
my $num_backups = $sth->rows;
my $curr_backup = 1;

while (my $row = $sth->fetchrow_hashref) {
	my $tar_file = BackupPC::SearchLib::getGzipName($row->{'host'}, $row->{'share'}, $row->{'num'});
	my $archive = "$tar_dir/$tar_file";

	# this will return -1 if file doesn't exist
	my $size = BackupPC::SearchLib::get_tgz_size_by_name($tar_file);

	print curr_time, " $curr_backup/$num_backups ", $row->{'host'}, ":", $row->{'share'}, " #", $row->{'num'}, " -> $tar_file";
	$curr_backup++;

	my $t = time();

	# re-create archive? Yes when the database has no size yet, the file is
	# missing, the sizes disagree, or a forced check (-c) finds differences.
	if ($row->{'inc_size'} == -1 || $size == -1 ||
		$row->{'inc_size'} != $size ||
		($check && ! tar_check($row->{'host'}, $row->{'share'}, $row->{'num'}, $archive))
	) {
		# Every value interpolated into the shell command is quoted, so
		# names with spaces or metacharacters cannot alter the command.
		# $Conf{GzipLevel} is left unquoted on purpose: it is an option
		# string for gzip and may be empty.
		# NOTE: the pipeline's exit status is that of gzip, so a failure of
		# BackupPC_tarIncCreate alone is not detected here.
		my $cmd = join(' ',
			'rm -Rf', $sh_quote->($archive), '&&',
			$sh_quote->($tarIncCreate),
				'-h', $sh_quote->($row->{'host'}),
				'-s', $sh_quote->($row->{'share'}),
				'-n', $sh_quote->($row->{'num'}),
			'|', $sh_quote->($bin->{'gzip'}), $Conf{GzipLevel},
			'>', $sh_quote->("${archive}.tmp"),
		);
		print STDERR "## $cmd\n" if ($debug);

		system($cmd) == 0 or die "failed: $?";

		# the archive is written under a temporary name and only moved
		# into place once the command above has succeeded
		rename("${archive}.tmp", $archive) or die "can't rename $archive: $!";

		$size = (stat( $archive ))[7];
	}

	# 45 bytes is presumably the size of an empty gzipped tar; anything
	# that small is treated as an archive without content -- TODO confirm
	if ($size > 45) {

		my $max_size = $Conf{'MaxArchiveSize'} || die "problem with MaxArchiveSize parametar";
		$max_size *= 1024;	# convert to bytes

		# number of pieces needed, rounding up
		my $parts = int( ($size + $max_size - 1) / $max_size );

		# already split, but into a different number of parts than
		# recorded: join it back so it can be split again below
		if (-d $archive && $parts != $row->{'parts'}) {
			print " join";
			tar_join($archive);
		}

		if ($size > $max_size && ! -d $archive) {
			print " split/$parts";
			my $in = my $out = $archive;
			$out .= '.tmp';
			# `or` (not `||`) so that the failure check applies to the
			# call itself rather than to its last argument
			rename($in, $out) or die "can't rename $in: $!";
			mkdir($in) or die "can't mkdir $in: $!";

			# fixed-width numeric suffixes keep part* in lexical order
			my $suffix_len = length("$parts");
			# list form: split is run without a shell
			system($bin->{'split'}, '-d', '-b', $max_size, '-a', $suffix_len, $out, "$in/part") == 0
				or die "can't split $out: $?";
			unlink($out) or die "can't unlink $out: $!";
		}

		$sth_inc_size->execute($size, $parts, $row->{'backup_id'});
		$sth_inc_deleted->execute(0, $row->{'backup_id'});

		printf(" %1.2f MB", ($size / 1024 / 1024));

	} else {
		# nothing worth keeping: flag the backup and remove the archive
		$sth_inc_deleted->execute(1, $row->{'backup_id'});
		if (-e $archive) {
			unlink($archive) or die "can't delete $archive: $!\n";
		}
		print " EMPTY";
	}
	print ", dur: ",fmt_time(time() - $t), "\n";

	# one transaction per backup (the connection has AutoCommit off)
	$dbh->commit;

}

undef $sth;
$dbh->disconnect;

Properties

Name Value
svn:executable *

  ViewVC Help
Powered by ViewVC 1.1.26