Mention the latest new options.
[rsync/rsync.git] / generator.c
... / ...
CommitLineData
1/* -*- c-file-style: "linux" -*-
2
3 rsync -- fast file replication program
4
5 Copyright (C) 1996-2000 by Andrew Tridgell
6 Copyright (C) Paul Mackerras 1996
7 Copyright (C) 2002 by Martin Pool <mbp@samba.org>
8
9 This program is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 2 of the License, or
12 (at your option) any later version.
13
14 This program is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
18
19 You should have received a copy of the GNU General Public License
20 along with this program; if not, write to the Free Software
21 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
22*/
23
24#include "rsync.h"
25
26extern int verbose;
27extern int dry_run;
28extern int relative_paths;
29extern int keep_dirlinks;
30extern int preserve_links;
31extern int am_root;
32extern int preserve_devices;
33extern int preserve_hard_links;
34extern int preserve_perms;
35extern int preserve_uid;
36extern int preserve_gid;
37extern int preserve_times;
38extern int omit_dir_times;
39extern int delete_during;
40extern int update_only;
41extern int opt_ignore_existing;
42extern int inplace;
43extern int make_backups;
44extern int csum_length;
45extern int ignore_times;
46extern int size_only;
47extern OFF_T max_size;
48extern int io_timeout;
49extern int protocol_version;
50extern int always_checksum;
51extern char *partial_dir;
52extern char *basis_dir[];
53extern int compare_dest;
54extern int link_dest;
55extern int whole_file;
56extern int local_server;
57extern int list_only;
58extern int read_batch;
59extern int only_existing;
60extern int orig_umask;
61extern int safe_symlinks;
62extern long block_size; /* "long" because popt can't set an int32. */
63
64extern struct exclude_list_struct server_exclude_list;
65
66static int unchanged_attrs(struct file_struct *file, STRUCT_STAT *st)
67{
68 if (preserve_perms
69 && (st->st_mode & CHMOD_BITS) != (file->mode & CHMOD_BITS))
70 return 0;
71
72 if (am_root && preserve_uid && st->st_uid != file->uid)
73 return 0;
74
75 if (preserve_gid && file->gid != GID_NONE && st->st_gid != file->gid)
76 return 0;
77
78 return 1;
79}
80
81/* Perform our quick-check heuristic for determining if a file is unchanged. */
82static int unchanged_file(char *fn, struct file_struct *file, STRUCT_STAT *st)
83{
84 if (st->st_size != file->length)
85 return 0;
86
87 /* if always checksum is set then we use the checksum instead
88 of the file time to determine whether to sync */
89 if (always_checksum && S_ISREG(st->st_mode)) {
90 char sum[MD4_SUM_LENGTH];
91 file_checksum(fn, sum, st->st_size);
92 return memcmp(sum, file->u.sum, protocol_version < 21 ? 2
93 : MD4_SUM_LENGTH) == 0;
94 }
95
96 if (size_only)
97 return 1;
98
99 if (ignore_times)
100 return 0;
101
102 return cmp_modtime(st->st_mtime, file->modtime) == 0;
103}
104
105
106/*
107 * set (initialize) the size entries in the per-file sum_struct
108 * calculating dynamic block and checksum sizes.
109 *
110 * This is only called from generate_and_send_sums() but is a separate
111 * function to encapsulate the logic.
112 *
113 * The block size is a rounded square root of file length.
114 *
115 * The checksum size is determined according to:
116 * blocksum_bits = BLOCKSUM_EXP + 2*log2(file_len) - log2(block_len)
117 * provided by Donovan Baarda which gives a probability of rsync
118 * algorithm corrupting data and falling back using the whole md4
119 * checksums.
120 *
121 * This might be made one of several selectable heuristics.
122 */
123static void sum_sizes_sqroot(struct sum_struct *sum, int64 len)
124{
125 int32 blength;
126 int s2length;
127
128 if (block_size)
129 blength = block_size;
130 else if (len <= BLOCK_SIZE * BLOCK_SIZE)
131 blength = BLOCK_SIZE;
132 else {
133 int32 c;
134 int64 l;
135 int cnt;
136 for (c = 1, l = len, cnt = 0; l >>= 2; c <<= 1, cnt++) {}
137 if (cnt >= 31 || c >= MAX_BLOCK_SIZE)
138 blength = MAX_BLOCK_SIZE;
139 else {
140 blength = 0;
141 do {
142 blength |= c;
143 if (len < (int64)blength * blength)
144 blength &= ~c;
145 c >>= 1;
146 } while (c >= 8); /* round to multiple of 8 */
147 blength = MAX(blength, BLOCK_SIZE);
148 }
149 }
150
151 if (protocol_version < 27) {
152 s2length = csum_length;
153 } else if (csum_length == SUM_LENGTH) {
154 s2length = SUM_LENGTH;
155 } else {
156 int32 c;
157 int64 l;
158 int b = BLOCKSUM_BIAS;
159 for (l = len; l >>= 1; b += 2) {}
160 for (c = blength; c >>= 1 && b; b--) {}
161 /* add a bit, subtract rollsum, round up. */
162 s2length = (b + 1 - 32 + 7) / 8; /* --optimize in compiler-- */
163 s2length = MAX(s2length, csum_length);
164 s2length = MIN(s2length, SUM_LENGTH);
165 }
166
167 sum->flength = len;
168 sum->blength = blength;
169 sum->s2length = s2length;
170 sum->count = (len + (blength - 1)) / blength;
171 sum->remainder = (len % blength);
172
173 if (sum->count && verbose > 2) {
174 rprintf(FINFO,
175 "count=%.0f rem=%ld blength=%ld s2length=%d flength=%.0f\n",
176 (double)sum->count, (long)sum->remainder, (long)sum->blength,
177 sum->s2length, (double)sum->flength);
178 }
179}
180
181
182/*
183 * Generate and send a stream of signatures/checksums that describe a buffer
184 *
185 * Generate approximately one checksum every block_len bytes.
186 */
187static void generate_and_send_sums(int fd, OFF_T len, int f_out, int f_copy)
188{
189 size_t i;
190 struct map_struct *mapbuf;
191 struct sum_struct sum;
192 OFF_T offset = 0;
193
194 sum_sizes_sqroot(&sum, len);
195
196 if (len > 0)
197 mapbuf = map_file(fd, len, MAX_MAP_SIZE, sum.blength);
198 else
199 mapbuf = NULL;
200
201 write_sum_head(f_out, &sum);
202
203 for (i = 0; i < sum.count; i++) {
204 int32 n1 = (int32)MIN(len, (OFF_T)sum.blength);
205 char *map = map_ptr(mapbuf, offset, n1);
206 uint32 sum1 = get_checksum1(map, n1);
207 char sum2[SUM_LENGTH];
208
209 if (f_copy >= 0)
210 full_write(f_copy, map, n1);
211
212 get_checksum2(map, n1, sum2);
213
214 if (verbose > 3) {
215 rprintf(FINFO,
216 "chunk[%.0f] offset=%.0f len=%ld sum1=%08lx\n",
217 (double)i, (double)offset, (long)n1,
218 (unsigned long)sum1);
219 }
220 write_int(f_out, sum1);
221 write_buf(f_out, sum2, sum.s2length);
222 len -= n1;
223 offset += n1;
224 }
225
226 if (mapbuf)
227 unmap_file(mapbuf);
228}
229
230
231/*
232 * Acts on file number @p i from @p flist, whose name is @p fname.
233 *
234 * First fixes up permissions, then generates checksums for the file.
235 *
236 * @note This comment was added later by mbp who was trying to work it
237 * out. It might be wrong.
238 */
239static void recv_generator(char *fname, struct file_list *flist,
240 struct file_struct *file, int i,
241 int f_out, int f_out_name)
242{
243 int fd = -1, f_copy = -1;
244 STRUCT_STAT st, partial_st;
245 struct file_struct *back_file = NULL;
246 int statret, stat_errno;
247 char *fnamecmp, *partialptr, *backupptr = NULL;
248 char fnamecmpbuf[MAXPATHLEN];
249 uchar fnamecmp_type;
250
251 if (list_only)
252 return;
253
254 if (verbose > 2)
255 rprintf(FINFO, "recv_generator(%s,%d)\n", safe_fname(fname), i);
256
257 if (server_exclude_list.head
258 && check_exclude(&server_exclude_list, fname,
259 S_ISDIR(file->mode)) < 0) {
260 if (verbose) {
261 rprintf(FINFO, "skipping server-excluded file \"%s\"\n",
262 safe_fname(fname));
263 }
264 return;
265 }
266
267 if (dry_run > 1) {
268 statret = -1;
269 stat_errno = ENOENT;
270 } else {
271 statret = link_stat(fname, &st,
272 keep_dirlinks && S_ISDIR(file->mode));
273 stat_errno = errno;
274 }
275
276 if (only_existing && statret == -1 && stat_errno == ENOENT) {
277 /* we only want to update existing files */
278 if (verbose > 1) {
279 rprintf(FINFO, "not creating new file \"%s\"\n",
280 safe_fname(fname));
281 }
282 return;
283 }
284
285 if (statret == 0 && !preserve_perms
286 && S_ISDIR(st.st_mode) == S_ISDIR(file->mode)) {
287 /* if the file exists already and we aren't perserving
288 * permissions then act as though the remote end sent
289 * us the file permissions we already have */
290 file->mode = (file->mode & ~CHMOD_BITS)
291 | (st.st_mode & CHMOD_BITS);
292 }
293
294 if (S_ISDIR(file->mode)) {
295 /* The file to be received is a directory, so we need
296 * to prepare appropriately. If there is already a
297 * file of that name and it is *not* a directory, then
298 * we need to delete it. If it doesn't exist, then
299 * (perhaps recursively) create it. */
300 if (statret == 0 && !S_ISDIR(st.st_mode)) {
301 delete_file(fname, DEL_TERSE);
302 statret = -1;
303 }
304 if (statret != 0 && do_mkdir(fname,file->mode) != 0 && errno != EEXIST) {
305 if (!relative_paths || errno != ENOENT
306 || create_directory_path(fname, orig_umask) < 0
307 || do_mkdir(fname, file->mode) < 0) {
308 rsyserr(FERROR, errno,
309 "recv_generator: mkdir %s failed",
310 full_fname(fname));
311 }
312 }
313 /* f_out is set to -1 when doing final directory-permission
314 * and modification-time repair. */
315 if (set_perms(fname, file, statret ? NULL : &st, 0)
316 && verbose && f_out != -1)
317 rprintf(FINFO, "%s/\n", safe_fname(fname));
318 if (delete_during && f_out != -1
319 && (file->flags & FLAG_DEL_START))
320 delete_in_dir(flist, fname);
321 return;
322 } else if (max_size && file->length > max_size) {
323 if (verbose > 1)
324 rprintf(FINFO, "%s is over max-size\n", fname);
325 return;
326 }
327
328 if (preserve_links && S_ISLNK(file->mode)) {
329#if SUPPORT_LINKS
330 if (safe_symlinks && unsafe_symlink(file->u.link, fname)) {
331 if (verbose) {
332 rprintf(FINFO, "ignoring unsafe symlink %s -> \"%s\"\n",
333 full_fname(fname), file->u.link);
334 }
335 return;
336 }
337 if (statret == 0) {
338 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
339 char lnk[MAXPATHLEN];
340 int len;
341
342 if (!dflag
343 && (len = readlink(fname, lnk, MAXPATHLEN-1)) > 0) {
344 lnk[len] = 0;
345 /* A link already pointing to the
346 * right place -- no further action
347 * required. */
348 if (strcmp(lnk, file->u.link) == 0) {
349 set_perms(fname, file, &st,
350 PERMS_REPORT);
351 return;
352 }
353 }
354 /* Not the right symlink (or not a symlink), so
355 * delete it. */
356 delete_file(fname, dflag | DEL_TERSE);
357 }
358 if (do_symlink(file->u.link,fname) != 0) {
359 rsyserr(FERROR, errno, "symlink %s -> \"%s\" failed",
360 full_fname(fname), safe_fname(file->u.link));
361 } else {
362 set_perms(fname,file,NULL,0);
363 if (verbose) {
364 rprintf(FINFO, "%s -> %s\n", safe_fname(fname),
365 safe_fname(file->u.link));
366 }
367 }
368#endif
369 return;
370 }
371
372 if (am_root && preserve_devices && IS_DEVICE(file->mode)) {
373 if (statret != 0 ||
374 st.st_mode != file->mode ||
375 st.st_rdev != file->u.rdev) {
376 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
377 delete_file(fname, dflag | DEL_TERSE);
378 if (verbose > 2) {
379 rprintf(FINFO,"mknod(%s,0%o,0x%x)\n",
380 safe_fname(fname),
381 (int)file->mode, (int)file->u.rdev);
382 }
383 if (do_mknod(fname,file->mode,file->u.rdev) != 0) {
384 rsyserr(FERROR, errno, "mknod %s failed",
385 full_fname(fname));
386 } else {
387 set_perms(fname,file,NULL,0);
388 if (verbose) {
389 rprintf(FINFO, "%s\n",
390 safe_fname(fname));
391 }
392 }
393 } else {
394 set_perms(fname, file, &st, PERMS_REPORT);
395 }
396 return;
397 }
398
399 if (preserve_hard_links && hard_link_check(file, HL_CHECK_MASTER))
400 return;
401
402 if (!S_ISREG(file->mode)) {
403 rprintf(FINFO, "skipping non-regular file \"%s\"\n",
404 safe_fname(fname));
405 return;
406 }
407
408 fnamecmp = fname;
409 fnamecmp_type = FNAMECMP_FNAME;
410
411 if (statret == -1 && basis_dir[0] != NULL) {
412 int fallback_match = -1;
413 int match_level = 0;
414 int i = 0;
415 do {
416 pathjoin(fnamecmpbuf, sizeof fnamecmpbuf,
417 basis_dir[i], fname);
418 if (link_stat(fnamecmpbuf, &st, 0) == 0
419 && S_ISREG(st.st_mode)) {
420 statret = 0;
421 if (link_dest) {
422 if (!match_level) {
423 fallback_match = i;
424 match_level = 1;
425 } else if (match_level == 2
426 && !unchanged_attrs(file, &st))
427 continue;
428 if (!unchanged_file(fnamecmpbuf, file, &st))
429 continue;
430 fallback_match = i;
431 match_level = 2;
432 if (!unchanged_attrs(file, &st))
433 continue;
434 }
435 match_level = 3;
436 break;
437 }
438 } while (basis_dir[++i] != NULL);
439 if (statret == 0) {
440 if (match_level < 3) {
441 i = fallback_match;
442 pathjoin(fnamecmpbuf, sizeof fnamecmpbuf,
443 basis_dir[i], fname);
444 }
445#if HAVE_LINK
446 if (link_dest && match_level == 3 && !dry_run) {
447 if (do_link(fnamecmpbuf, fname) < 0) {
448 if (verbose) {
449 rsyserr(FINFO, errno,
450 "link %s => %s",
451 fnamecmpbuf,
452 safe_fname(fname));
453 }
454 fnamecmp = fnamecmpbuf;
455 fnamecmp_type = i;
456 }
457 } else
458#endif
459 {
460 fnamecmp = fnamecmpbuf;
461 fnamecmp_type = i;
462 }
463 }
464 }
465
466 if (statret == 0 && !S_ISREG(st.st_mode)) {
467 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
468 if (delete_file(fname, dflag | DEL_TERSE) != 0)
469 return;
470 statret = -1;
471 stat_errno = ENOENT;
472 }
473
474 if (partial_dir && (partialptr = partial_dir_fname(fname)) != NULL
475 && link_stat(partialptr, &partial_st, 0) == 0
476 && S_ISREG(partial_st.st_mode)) {
477 if (statret == -1)
478 goto prepare_to_open;
479 } else
480 partialptr = NULL;
481
482 if (statret == -1) {
483 if (preserve_hard_links && hard_link_check(file, HL_SKIP))
484 return;
485 if (stat_errno == ENOENT)
486 goto notify_others;
487 if (verbose > 1) {
488 rsyserr(FERROR, stat_errno,
489 "recv_generator: failed to stat %s",
490 full_fname(fname));
491 }
492 return;
493 }
494
495 if (opt_ignore_existing && fnamecmp_type == FNAMECMP_FNAME) {
496 if (verbose > 1)
497 rprintf(FINFO, "%s exists\n", safe_fname(fname));
498 return;
499 }
500
501 if (update_only && fnamecmp_type == FNAMECMP_FNAME
502 && cmp_modtime(st.st_mtime, file->modtime) > 0) {
503 if (verbose > 1)
504 rprintf(FINFO, "%s is newer\n", safe_fname(fname));
505 return;
506 }
507
508 if (!compare_dest && fnamecmp_type <= FNAMECMP_BASIS_DIR_HIGH)
509 ;
510 else if (unchanged_file(fnamecmp, file, &st)) {
511 if (fnamecmp_type == FNAMECMP_FNAME)
512 set_perms(fname, file, &st, PERMS_REPORT);
513 return;
514 }
515
516prepare_to_open:
517 if (partialptr) {
518 st = partial_st;
519 fnamecmp = partialptr;
520 fnamecmp_type = FNAMECMP_PARTIAL_DIR;
521 statret = 0;
522 }
523
524 if (dry_run || whole_file > 0) {
525 statret = -1;
526 goto notify_others;
527 }
528 if (read_batch)
529 goto notify_others;
530
531 /* open the file */
532 fd = do_open(fnamecmp, O_RDONLY, 0);
533
534 if (fd == -1) {
535 rsyserr(FERROR, errno, "failed to open %s, continuing",
536 full_fname(fnamecmp));
537 pretend_missing:
538 /* pretend the file didn't exist */
539 if (preserve_hard_links && hard_link_check(file, HL_SKIP))
540 return;
541 statret = -1;
542 goto notify_others;
543 }
544
545 if (inplace && make_backups) {
546 if (!(backupptr = get_backup_name(fname))) {
547 close(fd);
548 return;
549 }
550 if (!(back_file = make_file(fname, NULL, NO_EXCLUDES))) {
551 close(fd);
552 goto pretend_missing;
553 }
554 if (robust_unlink(backupptr) && errno != ENOENT) {
555 rsyserr(FERROR, errno, "unlink %s",
556 full_fname(backupptr));
557 free(back_file);
558 close(fd);
559 return;
560 }
561 if ((f_copy = do_open(backupptr,
562 O_WRONLY | O_CREAT | O_TRUNC | O_EXCL, 0600)) < 0) {
563 rsyserr(FERROR, errno, "open %s",
564 full_fname(backupptr));
565 free(back_file);
566 close(fd);
567 return;
568 }
569 fnamecmp_type = FNAMECMP_BACKUP;
570 }
571
572 if (verbose > 3) {
573 rprintf(FINFO, "gen mapped %s of size %.0f\n",
574 safe_fname(fnamecmp), (double)st.st_size);
575 }
576
577 if (verbose > 2)
578 rprintf(FINFO, "generating and sending sums for %d\n", i);
579
580notify_others:
581 write_int(f_out, i);
582 if (protocol_version >= 29 && inplace && !read_batch)
583 write_byte(f_out, fnamecmp_type);
584 if (f_out_name >= 0)
585 write_byte(f_out_name, fnamecmp_type);
586
587 if (dry_run || read_batch)
588 return;
589
590 if (statret == 0) {
591 generate_and_send_sums(fd, st.st_size, f_out, f_copy);
592
593 if (f_copy >= 0) {
594 close(f_copy);
595 set_perms(backupptr, back_file, NULL, 0);
596 if (verbose > 1) {
597 rprintf(FINFO, "backed up %s to %s\n",
598 fname, backupptr);
599 }
600 free(back_file);
601 }
602
603 close(fd);
604 } else
605 write_sum_head(f_out, NULL);
606}
607
608
609void generate_files(int f_out, struct file_list *flist, char *local_name,
610 int f_out_name)
611{
612 int i;
613 int phase = 0;
614 char fbuf[MAXPATHLEN];
615 int need_retouch_dir_times = preserve_times && !omit_dir_times;
616 int need_retouch_dir_perms = 0;
617
618 if (verbose > 2) {
619 rprintf(FINFO, "generator starting pid=%ld count=%d\n",
620 (long)getpid(), flist->count);
621 }
622
623 if (verbose >= 2) {
624 rprintf(FINFO,
625 whole_file > 0
626 ? "delta-transmission disabled for local transfer or --whole-file\n"
627 : "delta transmission enabled\n");
628 }
629
630 /* we expect to just sit around now, so don't exit on a
631 timeout. If we really get a timeout then the other process should
632 exit */
633 io_timeout = 0;
634
635 for (i = 0; i < flist->count; i++) {
636 struct file_struct *file = flist->files[i];
637 struct file_struct copy;
638
639 if (!file->basename)
640 continue;
641 /* we need to ensure that any directories we create have writeable
642 permissions initially so that we can create the files within
643 them. This is then fixed after the files are transferred */
644 if (!am_root && S_ISDIR(file->mode) && !(file->mode & S_IWUSR)) {
645 copy = *file;
646 copy.mode |= S_IWUSR; /* user write */
647 file = &copy;
648 need_retouch_dir_perms = 1;
649 }
650
651 recv_generator(local_name ? local_name : f_name_to(file, fbuf),
652 flist, file, i, f_out, f_out_name);
653 }
654
655 phase++;
656 csum_length = SUM_LENGTH;
657 ignore_times = 1;
658
659 if (verbose > 2)
660 rprintf(FINFO,"generate_files phase=%d\n",phase);
661
662 write_int(f_out, -1);
663
664 /* files can cycle through the system more than once
665 * to catch initial checksum errors */
666 while ((i = get_redo_num()) != -1) {
667 struct file_struct *file = flist->files[i];
668 recv_generator(local_name ? local_name : f_name_to(file, fbuf),
669 flist, file, i, f_out, f_out_name);
670 }
671
672 phase++;
673 if (verbose > 2)
674 rprintf(FINFO,"generate_files phase=%d\n",phase);
675
676 write_int(f_out, -1);
677
678 /* Read post-redo-phase MSG_DONE and any prior messages. */
679 get_redo_num();
680
681 if (preserve_hard_links)
682 do_hard_links();
683
684 if (need_retouch_dir_perms || need_retouch_dir_times) {
685 /* Now we need to fix any directory permissions that were
686 * modified during the transfer and/or re-set any tweaked
687 * modified-time values. */
688 for (i = 0; i < flist->count; i++) {
689 struct file_struct *file = flist->files[i];
690 if (!file->basename || !S_ISDIR(file->mode))
691 continue;
692 if (!need_retouch_dir_times && file->mode & S_IWUSR)
693 continue;
694 recv_generator(local_name ? local_name : f_name(file),
695 flist, file, i, -1, -1);
696 }
697 }
698
699 if (verbose > 2)
700 rprintf(FINFO,"generate_files finished\n");
701}