In hlink_compare(), call f_name_cmp() directly instead of using
[rsync/rsync.git] / generator.c
... / ...
CommitLineData
1/* -*- c-file-style: "linux" -*-
2
3 rsync -- fast file replication program
4
5 Copyright (C) 1996-2000 by Andrew Tridgell
6 Copyright (C) Paul Mackerras 1996
7 Copyright (C) 2002 by Martin Pool <mbp@samba.org>
8
9 This program is free software; you can redistribute it and/or modify
10 it under the terms of the GNU General Public License as published by
11 the Free Software Foundation; either version 2 of the License, or
12 (at your option) any later version.
13
14 This program is distributed in the hope that it will be useful,
15 but WITHOUT ANY WARRANTY; without even the implied warranty of
16 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 GNU General Public License for more details.
18
19 You should have received a copy of the GNU General Public License
20 along with this program; if not, write to the Free Software
21 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
22*/
23
24#include "rsync.h"
25
26extern int verbose;
27extern int dry_run;
28extern int relative_paths;
29extern int keep_dirlinks;
30extern int preserve_links;
31extern int am_root;
32extern int preserve_devices;
33extern int preserve_hard_links;
34extern int preserve_perms;
35extern int preserve_uid;
36extern int preserve_gid;
37extern int preserve_times;
38extern int omit_dir_times;
39extern int delete_during;
40extern int update_only;
41extern int opt_ignore_existing;
42extern int inplace;
43extern int make_backups;
44extern int csum_length;
45extern int ignore_times;
46extern int size_only;
47extern OFF_T max_size;
48extern int io_timeout;
49extern int protocol_version;
50extern int always_checksum;
51extern char *partial_dir;
52extern char *basis_dir[];
53extern int compare_dest;
54extern int link_dest;
55extern int whole_file;
56extern int local_server;
57extern int list_only;
58extern int read_batch;
59extern int only_existing;
60extern int orig_umask;
61extern int safe_symlinks;
62extern long block_size; /* "long" because popt can't set an int32. */
63
64extern struct filter_list_struct server_filter_list;
65
66static int unchanged_attrs(struct file_struct *file, STRUCT_STAT *st)
67{
68 if (preserve_perms
69 && (st->st_mode & CHMOD_BITS) != (file->mode & CHMOD_BITS))
70 return 0;
71
72 if (am_root && preserve_uid && st->st_uid != file->uid)
73 return 0;
74
75 if (preserve_gid && file->gid != GID_NONE && st->st_gid != file->gid)
76 return 0;
77
78 return 1;
79}
80
81/* Perform our quick-check heuristic for determining if a file is unchanged. */
82static int unchanged_file(char *fn, struct file_struct *file, STRUCT_STAT *st)
83{
84 if (st->st_size != file->length)
85 return 0;
86
87 /* if always checksum is set then we use the checksum instead
88 of the file time to determine whether to sync */
89 if (always_checksum && S_ISREG(st->st_mode)) {
90 char sum[MD4_SUM_LENGTH];
91 file_checksum(fn, sum, st->st_size);
92 return memcmp(sum, file->u.sum, protocol_version < 21 ? 2
93 : MD4_SUM_LENGTH) == 0;
94 }
95
96 if (size_only)
97 return 1;
98
99 if (ignore_times)
100 return 0;
101
102 return cmp_modtime(st->st_mtime, file->modtime) == 0;
103}
104
105
106/*
107 * set (initialize) the size entries in the per-file sum_struct
108 * calculating dynamic block and checksum sizes.
109 *
110 * This is only called from generate_and_send_sums() but is a separate
111 * function to encapsulate the logic.
112 *
113 * The block size is a rounded square root of file length.
114 *
115 * The checksum size is determined according to:
116 * blocksum_bits = BLOCKSUM_EXP + 2*log2(file_len) - log2(block_len)
117 * provided by Donovan Baarda which gives a probability of rsync
118 * algorithm corrupting data and falling back using the whole md4
119 * checksums.
120 *
121 * This might be made one of several selectable heuristics.
122 */
123static void sum_sizes_sqroot(struct sum_struct *sum, int64 len)
124{
125 int32 blength;
126 int s2length;
127
128 if (block_size)
129 blength = block_size;
130 else if (len <= BLOCK_SIZE * BLOCK_SIZE)
131 blength = BLOCK_SIZE;
132 else {
133 int32 c;
134 int64 l;
135 int cnt;
136 for (c = 1, l = len, cnt = 0; l >>= 2; c <<= 1, cnt++) {}
137 if (cnt >= 31 || c >= MAX_BLOCK_SIZE)
138 blength = MAX_BLOCK_SIZE;
139 else {
140 blength = 0;
141 do {
142 blength |= c;
143 if (len < (int64)blength * blength)
144 blength &= ~c;
145 c >>= 1;
146 } while (c >= 8); /* round to multiple of 8 */
147 blength = MAX(blength, BLOCK_SIZE);
148 }
149 }
150
151 if (protocol_version < 27) {
152 s2length = csum_length;
153 } else if (csum_length == SUM_LENGTH) {
154 s2length = SUM_LENGTH;
155 } else {
156 int32 c;
157 int64 l;
158 int b = BLOCKSUM_BIAS;
159 for (l = len; l >>= 1; b += 2) {}
160 for (c = blength; c >>= 1 && b; b--) {}
161 /* add a bit, subtract rollsum, round up. */
162 s2length = (b + 1 - 32 + 7) / 8; /* --optimize in compiler-- */
163 s2length = MAX(s2length, csum_length);
164 s2length = MIN(s2length, SUM_LENGTH);
165 }
166
167 sum->flength = len;
168 sum->blength = blength;
169 sum->s2length = s2length;
170 sum->count = (len + (blength - 1)) / blength;
171 sum->remainder = (len % blength);
172
173 if (sum->count && verbose > 2) {
174 rprintf(FINFO,
175 "count=%.0f rem=%ld blength=%ld s2length=%d flength=%.0f\n",
176 (double)sum->count, (long)sum->remainder, (long)sum->blength,
177 sum->s2length, (double)sum->flength);
178 }
179}
180
181
182/*
183 * Generate and send a stream of signatures/checksums that describe a buffer
184 *
185 * Generate approximately one checksum every block_len bytes.
186 */
187static void generate_and_send_sums(int fd, OFF_T len, int f_out, int f_copy)
188{
189 size_t i;
190 struct map_struct *mapbuf;
191 struct sum_struct sum;
192 OFF_T offset = 0;
193
194 sum_sizes_sqroot(&sum, len);
195
196 if (len > 0)
197 mapbuf = map_file(fd, len, MAX_MAP_SIZE, sum.blength);
198 else
199 mapbuf = NULL;
200
201 write_sum_head(f_out, &sum);
202
203 for (i = 0; i < sum.count; i++) {
204 int32 n1 = (int32)MIN(len, (OFF_T)sum.blength);
205 char *map = map_ptr(mapbuf, offset, n1);
206 uint32 sum1 = get_checksum1(map, n1);
207 char sum2[SUM_LENGTH];
208
209 if (f_copy >= 0)
210 full_write(f_copy, map, n1);
211
212 get_checksum2(map, n1, sum2);
213
214 if (verbose > 3) {
215 rprintf(FINFO,
216 "chunk[%.0f] offset=%.0f len=%ld sum1=%08lx\n",
217 (double)i, (double)offset, (long)n1,
218 (unsigned long)sum1);
219 }
220 write_int(f_out, sum1);
221 write_buf(f_out, sum2, sum.s2length);
222 len -= n1;
223 offset += n1;
224 }
225
226 if (mapbuf)
227 unmap_file(mapbuf);
228}
229
230
231/* Acts on flist->file's ndx'th item, whose name is fname. If a directory,
232 * make sure it exists, and has the right permissions/timestamp info. For
233 * all other non-regular files (symlinks, etc.) we create them here. For
234 * regular files that have changed, we try to find a basis file and then
235 * start sending checksums.
236 *
237 * Note that f_out is set to -1 when doing final directory-permission and
238 * modification-time repair. */
239static void recv_generator(char *fname, struct file_list *flist,
240 struct file_struct *file, int ndx,
241 int f_out, int f_out_name)
242{
243 int fd = -1, f_copy = -1;
244 STRUCT_STAT st, partial_st;
245 struct file_struct *back_file = NULL;
246 int statret, stat_errno;
247 char *fnamecmp, *partialptr, *backupptr = NULL;
248 char fnamecmpbuf[MAXPATHLEN];
249 uchar fnamecmp_type;
250
251 if (list_only)
252 return;
253
254 if (verbose > 2)
255 rprintf(FINFO, "recv_generator(%s,%d)\n", safe_fname(fname), ndx);
256
257 if (server_filter_list.head
258 && check_filter(&server_filter_list, fname,
259 S_ISDIR(file->mode)) < 0) {
260 if (verbose) {
261 rprintf(FINFO, "skipping server-excluded file \"%s\"\n",
262 safe_fname(fname));
263 }
264 return;
265 }
266
267 if (dry_run > 1) {
268 statret = -1;
269 stat_errno = ENOENT;
270 } else {
271 statret = link_stat(fname, &st,
272 keep_dirlinks && S_ISDIR(file->mode));
273 stat_errno = errno;
274 }
275
276 if (only_existing && statret == -1 && stat_errno == ENOENT) {
277 /* we only want to update existing files */
278 if (verbose > 1) {
279 rprintf(FINFO, "not creating new file \"%s\"\n",
280 safe_fname(fname));
281 }
282 return;
283 }
284
285 if (statret == 0 && !preserve_perms
286 && S_ISDIR(st.st_mode) == S_ISDIR(file->mode)) {
287 /* if the file exists already and we aren't perserving
288 * permissions then act as though the remote end sent
289 * us the file permissions we already have */
290 file->mode = (file->mode & ~CHMOD_BITS)
291 | (st.st_mode & CHMOD_BITS);
292 }
293
294 if (S_ISDIR(file->mode)) {
295 /* The file to be received is a directory, so we need
296 * to prepare appropriately. If there is already a
297 * file of that name and it is *not* a directory, then
298 * we need to delete it. If it doesn't exist, then
299 * (perhaps recursively) create it. */
300 if (statret == 0 && !S_ISDIR(st.st_mode)) {
301 delete_file(fname, DEL_TERSE);
302 statret = -1;
303 }
304 if (statret != 0 && do_mkdir(fname,file->mode) != 0 && errno != EEXIST) {
305 if (!relative_paths || errno != ENOENT
306 || create_directory_path(fname, orig_umask) < 0
307 || do_mkdir(fname, file->mode) < 0) {
308 rsyserr(FERROR, errno,
309 "recv_generator: mkdir %s failed",
310 full_fname(fname));
311 }
312 }
313 if (set_perms(fname, file, statret ? NULL : &st, 0)
314 && verbose && f_out != -1)
315 rprintf(FINFO, "%s/\n", safe_fname(fname));
316 if (delete_during && f_out != -1 && csum_length != SUM_LENGTH
317 && (file->flags & FLAG_DEL_START)) {
318 delete_in_dir(flist, fname, strlen(fname),
319 file->dir.depth);
320 }
321 return;
322 } else if (max_size && file->length > max_size) {
323 if (verbose > 1)
324 rprintf(FINFO, "%s is over max-size\n", fname);
325 return;
326 }
327
328 if (preserve_links && S_ISLNK(file->mode)) {
329#if SUPPORT_LINKS
330 if (safe_symlinks && unsafe_symlink(file->u.link, fname)) {
331 if (verbose) {
332 rprintf(FINFO, "ignoring unsafe symlink %s -> \"%s\"\n",
333 full_fname(fname), file->u.link);
334 }
335 return;
336 }
337 if (statret == 0) {
338 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
339 char lnk[MAXPATHLEN];
340 int len;
341
342 if (!dflag
343 && (len = readlink(fname, lnk, MAXPATHLEN-1)) > 0) {
344 lnk[len] = 0;
345 /* A link already pointing to the
346 * right place -- no further action
347 * required. */
348 if (strcmp(lnk, file->u.link) == 0) {
349 set_perms(fname, file, &st,
350 PERMS_REPORT);
351 return;
352 }
353 }
354 /* Not the right symlink (or not a symlink), so
355 * delete it. */
356 delete_file(fname, dflag | DEL_TERSE);
357 }
358 if (do_symlink(file->u.link,fname) != 0) {
359 rsyserr(FERROR, errno, "symlink %s -> \"%s\" failed",
360 full_fname(fname), safe_fname(file->u.link));
361 } else {
362 set_perms(fname,file,NULL,0);
363 if (verbose) {
364 rprintf(FINFO, "%s -> %s\n", safe_fname(fname),
365 safe_fname(file->u.link));
366 }
367 }
368#endif
369 return;
370 }
371
372 if (am_root && preserve_devices && IS_DEVICE(file->mode)) {
373 if (statret != 0 ||
374 st.st_mode != file->mode ||
375 st.st_rdev != file->u.rdev) {
376 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
377 delete_file(fname, dflag | DEL_TERSE);
378 if (verbose > 2) {
379 rprintf(FINFO,"mknod(%s,0%o,0x%x)\n",
380 safe_fname(fname),
381 (int)file->mode, (int)file->u.rdev);
382 }
383 if (do_mknod(fname,file->mode,file->u.rdev) != 0) {
384 rsyserr(FERROR, errno, "mknod %s failed",
385 full_fname(fname));
386 } else {
387 set_perms(fname,file,NULL,0);
388 if (verbose) {
389 rprintf(FINFO, "%s\n",
390 safe_fname(fname));
391 }
392 }
393 } else {
394 set_perms(fname, file, &st, PERMS_REPORT);
395 }
396 return;
397 }
398
399 if (preserve_hard_links && hard_link_check(file, HL_CHECK_MASTER))
400 return;
401
402 if (!S_ISREG(file->mode)) {
403 rprintf(FINFO, "skipping non-regular file \"%s\"\n",
404 safe_fname(fname));
405 return;
406 }
407
408 fnamecmp = fname;
409 fnamecmp_type = FNAMECMP_FNAME;
410
411 if (statret == -1 && basis_dir[0] != NULL) {
412 int fallback_match = -1;
413 int match_level = 0;
414 int i = 0;
415 do {
416 pathjoin(fnamecmpbuf, sizeof fnamecmpbuf,
417 basis_dir[i], fname);
418 if (link_stat(fnamecmpbuf, &st, 0) == 0
419 && S_ISREG(st.st_mode)) {
420 statret = 0;
421 if (link_dest) {
422 if (!match_level) {
423 fallback_match = i;
424 match_level = 1;
425 } else if (match_level == 2
426 && !unchanged_attrs(file, &st))
427 continue;
428 if (!unchanged_file(fnamecmpbuf, file, &st))
429 continue;
430 fallback_match = i;
431 match_level = 2;
432 if (!unchanged_attrs(file, &st))
433 continue;
434 }
435 match_level = 3;
436 break;
437 }
438 } while (basis_dir[++i] != NULL);
439 if (statret == 0) {
440 if (match_level < 3) {
441 i = fallback_match;
442 pathjoin(fnamecmpbuf, sizeof fnamecmpbuf,
443 basis_dir[i], fname);
444 }
445#if HAVE_LINK
446 if (link_dest && match_level == 3 && !dry_run) {
447 if (do_link(fnamecmpbuf, fname) < 0) {
448 if (verbose) {
449 rsyserr(FINFO, errno,
450 "link %s => %s",
451 fnamecmpbuf,
452 safe_fname(fname));
453 }
454 fnamecmp = fnamecmpbuf;
455 fnamecmp_type = i;
456 }
457 } else
458#endif
459 {
460 fnamecmp = fnamecmpbuf;
461 fnamecmp_type = i;
462 }
463 }
464 }
465
466 if (statret == 0 && !S_ISREG(st.st_mode)) {
467 int dflag = S_ISDIR(st.st_mode) ? DEL_DIR : 0;
468 if (delete_file(fname, dflag | DEL_TERSE) != 0)
469 return;
470 statret = -1;
471 stat_errno = ENOENT;
472 }
473
474 if (partial_dir && (partialptr = partial_dir_fname(fname)) != NULL
475 && link_stat(partialptr, &partial_st, 0) == 0
476 && S_ISREG(partial_st.st_mode)) {
477 if (statret == -1)
478 goto prepare_to_open;
479 } else
480 partialptr = NULL;
481
482 if (statret == -1) {
483 if (preserve_hard_links && hard_link_check(file, HL_SKIP))
484 return;
485 if (stat_errno == ENOENT)
486 goto notify_others;
487 if (verbose > 1) {
488 rsyserr(FERROR, stat_errno,
489 "recv_generator: failed to stat %s",
490 full_fname(fname));
491 }
492 return;
493 }
494
495 if (opt_ignore_existing && fnamecmp_type == FNAMECMP_FNAME) {
496 if (verbose > 1)
497 rprintf(FINFO, "%s exists\n", safe_fname(fname));
498 return;
499 }
500
501 if (update_only && fnamecmp_type == FNAMECMP_FNAME
502 && cmp_modtime(st.st_mtime, file->modtime) > 0) {
503 if (verbose > 1)
504 rprintf(FINFO, "%s is newer\n", safe_fname(fname));
505 return;
506 }
507
508 if (!compare_dest && fnamecmp_type <= FNAMECMP_BASIS_DIR_HIGH)
509 ;
510 else if (unchanged_file(fnamecmp, file, &st)) {
511 if (fnamecmp_type == FNAMECMP_FNAME)
512 set_perms(fname, file, &st, PERMS_REPORT);
513 return;
514 }
515
516prepare_to_open:
517 if (partialptr) {
518 st = partial_st;
519 fnamecmp = partialptr;
520 fnamecmp_type = FNAMECMP_PARTIAL_DIR;
521 statret = 0;
522 }
523
524 if (dry_run || whole_file > 0) {
525 statret = -1;
526 goto notify_others;
527 }
528 if (read_batch)
529 goto notify_others;
530
531 /* open the file */
532 fd = do_open(fnamecmp, O_RDONLY, 0);
533
534 if (fd == -1) {
535 rsyserr(FERROR, errno, "failed to open %s, continuing",
536 full_fname(fnamecmp));
537 pretend_missing:
538 /* pretend the file didn't exist */
539 if (preserve_hard_links && hard_link_check(file, HL_SKIP))
540 return;
541 statret = -1;
542 goto notify_others;
543 }
544
545 if (inplace && make_backups) {
546 if (!(backupptr = get_backup_name(fname))) {
547 close(fd);
548 return;
549 }
550 if (!(back_file = make_file(fname, NULL, NO_FILTERS))) {
551 close(fd);
552 goto pretend_missing;
553 }
554 if (robust_unlink(backupptr) && errno != ENOENT) {
555 rsyserr(FERROR, errno, "unlink %s",
556 full_fname(backupptr));
557 free(back_file);
558 close(fd);
559 return;
560 }
561 if ((f_copy = do_open(backupptr,
562 O_WRONLY | O_CREAT | O_TRUNC | O_EXCL, 0600)) < 0) {
563 rsyserr(FERROR, errno, "open %s",
564 full_fname(backupptr));
565 free(back_file);
566 close(fd);
567 return;
568 }
569 fnamecmp_type = FNAMECMP_BACKUP;
570 }
571
572 if (verbose > 3) {
573 rprintf(FINFO, "gen mapped %s of size %.0f\n",
574 safe_fname(fnamecmp), (double)st.st_size);
575 }
576
577 if (verbose > 2)
578 rprintf(FINFO, "generating and sending sums for %d\n", ndx);
579
580notify_others:
581 write_int(f_out, ndx);
582 if (protocol_version >= 29 && inplace && !read_batch)
583 write_byte(f_out, fnamecmp_type);
584 if (f_out_name >= 0)
585 write_byte(f_out_name, fnamecmp_type);
586
587 if (dry_run || read_batch)
588 return;
589
590 if (statret == 0) {
591 generate_and_send_sums(fd, st.st_size, f_out, f_copy);
592
593 if (f_copy >= 0) {
594 close(f_copy);
595 set_perms(backupptr, back_file, NULL, 0);
596 if (verbose > 1) {
597 rprintf(FINFO, "backed up %s to %s\n",
598 fname, backupptr);
599 }
600 free(back_file);
601 }
602
603 close(fd);
604 } else
605 write_sum_head(f_out, NULL);
606}
607
608
609void generate_files(int f_out, struct file_list *flist, char *local_name,
610 int f_out_name)
611{
612 int i;
613 int phase = 0;
614 char fbuf[MAXPATHLEN];
615 int need_retouch_dir_times = preserve_times && !omit_dir_times;
616 int need_retouch_dir_perms = 0;
617 int save_only_existing = only_existing;
618 int save_opt_ignore_existing = opt_ignore_existing;
619
620 if (verbose > 2) {
621 rprintf(FINFO, "generator starting pid=%ld count=%d\n",
622 (long)getpid(), flist->count);
623 }
624
625 if (verbose >= 2) {
626 rprintf(FINFO,
627 whole_file > 0
628 ? "delta-transmission disabled for local transfer or --whole-file\n"
629 : "delta transmission enabled\n");
630 }
631
632 /* We expect to just sit around now, so don't exit on a timeout.
633 * If we really get a timeout then the other process should exit. */
634 io_timeout = 0;
635
636 for (i = 0; i < flist->count; i++) {
637 struct file_struct *file = flist->files[i];
638 struct file_struct copy;
639
640 if (!file->basename)
641 continue;
642
643 /* We need to ensure that any dirs we create have writeable
644 * permissions during the time we are putting files within
645 * them. This is then fixed after the transfer is done. */
646 if (!am_root && S_ISDIR(file->mode) && !(file->mode & S_IWUSR)) {
647 copy = *file;
648 copy.mode |= S_IWUSR; /* user write */
649 file = &copy;
650 need_retouch_dir_perms = 1;
651 }
652
653 recv_generator(local_name ? local_name : f_name_to(file, fbuf),
654 flist, file, i, f_out, f_out_name);
655 }
656 if (delete_during)
657 delete_in_dir(NULL, NULL, 0, 0);
658
659 phase++;
660 csum_length = SUM_LENGTH;
661 only_existing = max_size = opt_ignore_existing = 0;
662 update_only = always_checksum = size_only = 0;
663 ignore_times = 1;
664
665 if (verbose > 2)
666 rprintf(FINFO,"generate_files phase=%d\n",phase);
667
668 write_int(f_out, -1);
669
670 /* files can cycle through the system more than once
671 * to catch initial checksum errors */
672 while ((i = get_redo_num()) != -1) {
673 struct file_struct *file = flist->files[i];
674 recv_generator(local_name ? local_name : f_name_to(file, fbuf),
675 flist, file, i, f_out, f_out_name);
676 }
677
678 phase++;
679 only_existing = save_only_existing;
680 opt_ignore_existing = save_opt_ignore_existing;
681
682 if (verbose > 2)
683 rprintf(FINFO,"generate_files phase=%d\n",phase);
684
685 write_int(f_out, -1);
686
687 /* Read post-redo-phase MSG_DONE and any prior messages. */
688 get_redo_num();
689
690 if (preserve_hard_links)
691 do_hard_links();
692
693 if ((need_retouch_dir_perms || need_retouch_dir_times)
694 && !list_only && !local_name && !dry_run) {
695 /* Now we need to fix any directory permissions that were
696 * modified during the transfer and/or re-set any tweaked
697 * modified-time values. */
698 for (i = 0; i < flist->count; i++) {
699 struct file_struct *file = flist->files[i];
700 if (!file->basename || !S_ISDIR(file->mode))
701 continue;
702 if (!need_retouch_dir_times && file->mode & S_IWUSR)
703 continue;
704 recv_generator(local_name ? local_name : f_name(file),
705 flist, file, i, -1, -1);
706 }
707 }
708
709 if (verbose > 2)
710 rprintf(FINFO,"generate_files finished\n");
711}