If a partial-dir file is present but the main file is up-to-date,
[rsync/rsync.git] / flist.c
... / ...
CommitLineData
1/*
2 Copyright (C) Andrew Tridgell 1996
3 Copyright (C) Paul Mackerras 1996
4 Copyright (C) 2001, 2002 by Martin Pool <mbp@samba.org>
5
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 2 of the License, or
9 (at your option) any later version.
10
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
15
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, write to the Free Software
18 Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
19*/
20
21/** @file flist.c
22 * Generate and receive file lists
23 *
24 * @sa http://lists.samba.org/pipermail/rsync/2000-June/002351.html
25 *
26 **/
27
28#include "rsync.h"
29
30extern int verbose;
31extern int dry_run;
32extern int list_only;
33extern int am_root;
34extern int am_server;
35extern int am_daemon;
36extern int am_sender;
37extern int do_progress;
38extern int always_checksum;
39extern int module_id;
40extern int ignore_errors;
41extern int numeric_ids;
42extern int recurse;
43extern int xfer_dirs;
44extern int filesfrom_fd;
45extern int one_file_system;
46extern int keep_dirlinks;
47extern int preserve_links;
48extern int preserve_hard_links;
49extern int preserve_perms;
50extern int preserve_devices;
51extern int preserve_uid;
52extern int preserve_gid;
53extern int relative_paths;
54extern int implied_dirs;
55extern int copy_links;
56extern int copy_unsafe_links;
57extern int protocol_version;
58extern int sanitize_paths;
59extern int orig_umask;
60extern struct stats stats;
61extern struct file_list *the_file_list;
62
63extern char curr_dir[MAXPATHLEN];
64
65extern struct chmod_mode_struct *chmod_modes;
66
67extern struct filter_list_struct filter_list;
68extern struct filter_list_struct server_filter_list;
69
70int io_error;
71dev_t filesystem_dev; /* used to implement -x */
72
73static char empty_sum[MD4_SUM_LENGTH];
74static int flist_count_offset;
75static unsigned int file_struct_len;
76static struct file_list *sorting_flist;
77
78static void clean_flist(struct file_list *flist, int strip_root, int no_dups);
79static void output_flist(struct file_list *flist);
80
81void init_flist(void)
82{
83 struct file_struct f;
84
85 /* Figure out how big the file_struct is without trailing padding */
86 file_struct_len = offsetof(struct file_struct, flags) + sizeof f.flags;
87}
88
89static int show_filelist_p(void)
90{
91 return verbose && xfer_dirs && !am_server;
92}
93
94static void start_filelist_progress(char *kind)
95{
96 rprintf(FINFO, "%s ... ", kind);
97 if (verbose > 1 || do_progress)
98 rprintf(FINFO, "\n");
99 rflush(FINFO);
100}
101
102static void emit_filelist_progress(int count)
103{
104 rprintf(FINFO, " %d files...\r", count);
105}
106
107static void maybe_emit_filelist_progress(int count)
108{
109 if (do_progress && show_filelist_p() && (count % 100) == 0)
110 emit_filelist_progress(count);
111}
112
113static void finish_filelist_progress(const struct file_list *flist)
114{
115 if (do_progress) {
116 /* This overwrites the progress line */
117 rprintf(FINFO, "%d file%sto consider\n",
118 flist->count, flist->count == 1 ? " " : "s ");
119 } else
120 rprintf(FINFO, "done\n");
121}
122
/* Placeholder: no file-list statistics are reported yet. */
void show_flist_stats(void)
{
}
127
128static void list_file_entry(struct file_struct *f)
129{
130 char perms[11];
131
132 if (!f->basename) {
133 /* this can happen if duplicate names were removed */
134 return;
135 }
136
137 permstring(perms, f->mode);
138
139#ifdef SUPPORT_LINKS
140 if (preserve_links && S_ISLNK(f->mode)) {
141 rprintf(FINFO, "%s %11.0f %s %s -> %s\n",
142 perms,
143 (double)f->length, timestring(f->modtime),
144 safe_fname(f_name(f)), safe_fname(f->u.link));
145 } else
146#endif
147 {
148 rprintf(FINFO, "%s %11.0f %s %s\n",
149 perms,
150 (double)f->length, timestring(f->modtime),
151 safe_fname(f_name(f)));
152 }
153}
154
155/**
156 * Stat either a symlink or its referent, depending on the settings of
157 * copy_links, copy_unsafe_links, etc.
158 *
159 * @retval -1 on error
160 *
161 * @retval 0 for success
162 *
163 * @post If @p path is a symlink, then @p linkbuf (of size @c
164 * MAXPATHLEN) contains the symlink target.
165 *
166 * @post @p buffer contains information about the link or the
167 * referrent as appropriate, if they exist.
168 **/
169static int readlink_stat(const char *path, STRUCT_STAT *buffer, char *linkbuf)
170{
171#ifdef SUPPORT_LINKS
172 if (copy_links)
173 return do_stat(path, buffer);
174 if (link_stat(path, buffer, 0) < 0)
175 return -1;
176 if (S_ISLNK(buffer->st_mode)) {
177 int l = readlink((char *)path, linkbuf, MAXPATHLEN - 1);
178 if (l == -1)
179 return -1;
180 linkbuf[l] = 0;
181 if (copy_unsafe_links && unsafe_symlink(linkbuf, path)) {
182 if (verbose > 1) {
183 rprintf(FINFO,"copying unsafe symlink \"%s\" -> \"%s\"\n",
184 safe_fname(path), safe_fname(linkbuf));
185 }
186 return do_stat(path, buffer);
187 }
188 }
189 return 0;
190#else
191 return do_stat(path, buffer);
192#endif
193}
194
195int link_stat(const char *path, STRUCT_STAT *buffer, int follow_dirlinks)
196{
197#ifdef SUPPORT_LINKS
198 if (copy_links)
199 return do_stat(path, buffer);
200 if (do_lstat(path, buffer) < 0)
201 return -1;
202 if (follow_dirlinks && S_ISLNK(buffer->st_mode)) {
203 STRUCT_STAT st;
204 if (do_stat(path, &st) == 0 && S_ISDIR(st.st_mode))
205 *buffer = st;
206 }
207 return 0;
208#else
209 return do_stat(path, buffer);
210#endif
211}
212
213/* This function is used to check if a file should be included/excluded
214 * from the list of files based on its name and type etc. The value of
215 * filter_level is set to either SERVER_FILTERS or ALL_FILTERS. */
216static int is_excluded(char *fname, int is_dir, int filter_level)
217{
218#if 0 /* This currently never happens, so avoid a useless compare. */
219 if (filter_level == NO_FILTERS)
220 return 0;
221#endif
222 if (fname) {
223 /* never exclude '.', even if somebody does --exclude '*' */
224 if (fname[0] == '.' && !fname[1])
225 return 0;
226 /* Handle the -R version of the '.' dir. */
227 if (fname[0] == '/') {
228 int len = strlen(fname);
229 if (fname[len-1] == '.' && fname[len-2] == '/')
230 return 0;
231 }
232 }
233 if (server_filter_list.head
234 && check_filter(&server_filter_list, fname, is_dir) < 0)
235 return 1;
236 if (filter_level != ALL_FILTERS)
237 return 0;
238 if (filter_list.head
239 && check_filter(&filter_list, fname, is_dir) < 0)
240 return 1;
241 return 0;
242}
243
/* Convert a local mode to its wire form: when the local symlink type
 * bits differ from 0120000, a symlink's type bits are replaced by
 * 0120000. Every other mode is passed through unchanged. */
static int to_wire_mode(mode_t mode)
{
#ifdef SUPPORT_LINKS
	const int needs_remap = _S_IFLNK != 0120000;

	if (needs_remap && S_ISLNK(mode))
		return (mode & ~(_S_IFMT)) | 0120000;
#endif
	return (int)mode;
}
252
253static mode_t from_wire_mode(int mode)
254{
255 if ((mode & (_S_IFMT)) == 0120000 && (_S_IFLNK != 0120000))
256 return (mode & ~(_S_IFMT)) | _S_IFLNK;
257 return (mode_t)mode;
258}
259
260static void send_directory(int f, struct file_list *flist,
261 char *fbuf, int len);
262
263static char *flist_dir;
264static int flist_dir_len;
265
266
267/**
268 * Make sure @p flist is big enough to hold at least @p flist->count
269 * entries.
270 **/
271void flist_expand(struct file_list *flist)
272{
273 struct file_struct **new_ptr;
274
275 if (flist->count < flist->malloced)
276 return;
277
278 if (flist->malloced < FLIST_START)
279 flist->malloced = FLIST_START;
280 else if (flist->malloced >= FLIST_LINEAR)
281 flist->malloced += FLIST_LINEAR;
282 else
283 flist->malloced *= 2;
284
285 /*
286 * In case count jumped or we are starting the list
287 * with a known size just set it.
288 */
289 if (flist->malloced < flist->count)
290 flist->malloced = flist->count;
291
292 new_ptr = realloc_array(flist->files, struct file_struct *,
293 flist->malloced);
294
295 if (verbose >= 2 && flist->malloced != FLIST_START) {
296 rprintf(FINFO, "[%s] expand file_list to %.0f bytes, did%s move\n",
297 who_am_i(),
298 (double)sizeof flist->files[0] * flist->malloced,
299 (new_ptr == flist->files) ? " not" : "");
300 }
301
302 flist->files = new_ptr;
303
304 if (!flist->files)
305 out_of_memory("flist_expand");
306}
307
308void send_file_entry(struct file_struct *file, int f, unsigned short base_flags)
309{
310 unsigned short flags;
311 static time_t modtime;
312 static mode_t mode;
313 static int64 dev;
314 static dev_t rdev;
315 static uint32 rdev_major;
316 static uid_t uid;
317 static gid_t gid;
318 static char lastname[MAXPATHLEN];
319 char fname[MAXPATHLEN];
320 int l1, l2;
321
322 if (f < 0)
323 return;
324
325 if (!file) {
326 write_byte(f, 0);
327 modtime = 0, mode = 0;
328 dev = 0, rdev = makedev(0, 0);
329 rdev_major = 0;
330 uid = 0, gid = 0;
331 *lastname = '\0';
332 return;
333 }
334
335 io_write_phase = "send_file_entry";
336
337 f_name_to(file, fname);
338
339 flags = base_flags;
340
341 if (file->mode == mode)
342 flags |= XMIT_SAME_MODE;
343 else
344 mode = file->mode;
345 if (preserve_devices) {
346 if (protocol_version < 28) {
347 if (IS_DEVICE(mode)) {
348 if (file->u.rdev == rdev)
349 flags |= XMIT_SAME_RDEV_pre28;
350 else
351 rdev = file->u.rdev;
352 } else
353 rdev = makedev(0, 0);
354 } else if (IS_DEVICE(mode)) {
355 rdev = file->u.rdev;
356 if ((uint32)major(rdev) == rdev_major)
357 flags |= XMIT_SAME_RDEV_MAJOR;
358 else
359 rdev_major = major(rdev);
360 if ((uint32)minor(rdev) <= 0xFFu)
361 flags |= XMIT_RDEV_MINOR_IS_SMALL;
362 }
363 }
364 if (file->uid == uid)
365 flags |= XMIT_SAME_UID;
366 else
367 uid = file->uid;
368 if (file->gid == gid)
369 flags |= XMIT_SAME_GID;
370 else
371 gid = file->gid;
372 if (file->modtime == modtime)
373 flags |= XMIT_SAME_TIME;
374 else
375 modtime = file->modtime;
376
377#ifdef SUPPORT_HARD_LINKS
378 if (file->link_u.idev) {
379 if (file->F_DEV == dev) {
380 if (protocol_version >= 28)
381 flags |= XMIT_SAME_DEV;
382 } else
383 dev = file->F_DEV;
384 flags |= XMIT_HAS_IDEV_DATA;
385 }
386#endif
387
388 for (l1 = 0;
389 lastname[l1] && (fname[l1] == lastname[l1]) && (l1 < 255);
390 l1++) {}
391 l2 = strlen(fname+l1);
392
393 if (l1 > 0)
394 flags |= XMIT_SAME_NAME;
395 if (l2 > 255)
396 flags |= XMIT_LONG_NAME;
397
398 /* We must make sure we don't send a zero flag byte or the
399 * other end will terminate the flist transfer. Note that
400 * the use of XMIT_TOP_DIR on a non-dir has no meaning, so
401 * it's harmless way to add a bit to the first flag byte. */
402 if (protocol_version >= 28) {
403 if (!flags && !S_ISDIR(mode))
404 flags |= XMIT_TOP_DIR;
405 if ((flags & 0xFF00) || !flags) {
406 flags |= XMIT_EXTENDED_FLAGS;
407 write_byte(f, flags);
408 write_byte(f, flags >> 8);
409 } else
410 write_byte(f, flags);
411 } else {
412 if (!(flags & 0xFF))
413 flags |= S_ISDIR(mode) ? XMIT_LONG_NAME : XMIT_TOP_DIR;
414 write_byte(f, flags);
415 }
416 if (flags & XMIT_SAME_NAME)
417 write_byte(f, l1);
418 if (flags & XMIT_LONG_NAME)
419 write_int(f, l2);
420 else
421 write_byte(f, l2);
422 write_buf(f, fname + l1, l2);
423
424 write_longint(f, file->length);
425 if (!(flags & XMIT_SAME_TIME))
426 write_int(f, modtime);
427 if (!(flags & XMIT_SAME_MODE))
428 write_int(f, to_wire_mode(mode));
429 if (preserve_uid && !(flags & XMIT_SAME_UID)) {
430 if (!numeric_ids)
431 add_uid(uid);
432 write_int(f, uid);
433 }
434 if (preserve_gid && !(flags & XMIT_SAME_GID)) {
435 if (!numeric_ids)
436 add_gid(gid);
437 write_int(f, gid);
438 }
439 if (preserve_devices && IS_DEVICE(mode)) {
440 if (protocol_version < 28) {
441 if (!(flags & XMIT_SAME_RDEV_pre28))
442 write_int(f, (int)rdev);
443 } else {
444 if (!(flags & XMIT_SAME_RDEV_MAJOR))
445 write_int(f, major(rdev));
446 if (flags & XMIT_RDEV_MINOR_IS_SMALL)
447 write_byte(f, minor(rdev));
448 else
449 write_int(f, minor(rdev));
450 }
451 }
452
453#ifdef SUPPORT_LINKS
454 if (preserve_links && S_ISLNK(mode)) {
455 int len = strlen(file->u.link);
456 write_int(f, len);
457 write_buf(f, file->u.link, len);
458 }
459#endif
460
461#ifdef SUPPORT_HARD_LINKS
462 if (flags & XMIT_HAS_IDEV_DATA) {
463 if (protocol_version < 26) {
464 /* 32-bit dev_t and ino_t */
465 write_int(f, dev);
466 write_int(f, file->F_INODE);
467 } else {
468 /* 64-bit dev_t and ino_t */
469 if (!(flags & XMIT_SAME_DEV))
470 write_longint(f, dev);
471 write_longint(f, file->F_INODE);
472 }
473 }
474#endif
475
476 if (always_checksum && (S_ISREG(mode) || protocol_version < 28)) {
477 char *sum;
478 int slen = protocol_version < 21 ? 2 : MD4_SUM_LENGTH;
479 if (S_ISREG(mode))
480 sum = file->u.sum;
481 else {
482 /* Prior to 28, we sent a useless set of nulls. */
483 sum = empty_sum;
484 }
485 write_buf(f, sum, slen);
486 }
487
488 strlcpy(lastname, fname, MAXPATHLEN);
489
490 io_write_phase = "unknown";
491}
492
493static struct file_struct *receive_file_entry(struct file_list *flist,
494 unsigned short flags, int f)
495{
496 static time_t modtime;
497 static mode_t mode;
498 static int64 dev;
499 static dev_t rdev;
500 static uint32 rdev_major;
501 static uid_t uid;
502 static gid_t gid;
503 static char lastname[MAXPATHLEN], *lastdir;
504 static int lastdir_depth, lastdir_len = -1;
505 static unsigned int del_hier_name_len = 0;
506 static int in_del_hier = 0;
507 char thisname[MAXPATHLEN];
508 unsigned int l1 = 0, l2 = 0;
509 int alloc_len, basename_len, dirname_len, linkname_len, sum_len;
510 OFF_T file_length;
511 char *basename, *dirname, *bp;
512 struct file_struct *file;
513
514 if (!flist) {
515 modtime = 0, mode = 0;
516 dev = 0, rdev = makedev(0, 0);
517 rdev_major = 0;
518 uid = 0, gid = 0;
519 *lastname = '\0';
520 lastdir_len = -1;
521 in_del_hier = 0;
522 return NULL;
523 }
524
525 if (flags & XMIT_SAME_NAME)
526 l1 = read_byte(f);
527
528 if (flags & XMIT_LONG_NAME)
529 l2 = read_int(f);
530 else
531 l2 = read_byte(f);
532
533 if (l2 >= MAXPATHLEN - l1) {
534 rprintf(FERROR,
535 "overflow: flags=0x%x l1=%d l2=%d lastname=%s\n",
536 flags, l1, l2, safe_fname(lastname));
537 overflow_exit("receive_file_entry");
538 }
539
540 strlcpy(thisname, lastname, l1 + 1);
541 read_sbuf(f, &thisname[l1], l2);
542 thisname[l1 + l2] = 0;
543
544 strlcpy(lastname, thisname, MAXPATHLEN);
545
546 clean_fname(thisname, 0);
547
548 if (sanitize_paths)
549 sanitize_path(thisname, thisname, "", 0);
550
551 if ((basename = strrchr(thisname, '/')) != NULL) {
552 dirname_len = ++basename - thisname; /* counts future '\0' */
553 if (lastdir_len == dirname_len - 1
554 && strncmp(thisname, lastdir, lastdir_len) == 0) {
555 dirname = lastdir;
556 dirname_len = 0; /* indicates no copy is needed */
557 } else
558 dirname = thisname;
559 } else {
560 basename = thisname;
561 dirname = NULL;
562 dirname_len = 0;
563 }
564 basename_len = strlen(basename) + 1; /* count the '\0' */
565
566 file_length = read_longint(f);
567 if (!(flags & XMIT_SAME_TIME))
568 modtime = (time_t)read_int(f);
569 if (!(flags & XMIT_SAME_MODE))
570 mode = from_wire_mode(read_int(f));
571
572 if (preserve_uid && !(flags & XMIT_SAME_UID))
573 uid = (uid_t)read_int(f);
574 if (preserve_gid && !(flags & XMIT_SAME_GID))
575 gid = (gid_t)read_int(f);
576
577 if (preserve_devices) {
578 if (protocol_version < 28) {
579 if (IS_DEVICE(mode)) {
580 if (!(flags & XMIT_SAME_RDEV_pre28))
581 rdev = (dev_t)read_int(f);
582 } else
583 rdev = makedev(0, 0);
584 } else if (IS_DEVICE(mode)) {
585 uint32 rdev_minor;
586 if (!(flags & XMIT_SAME_RDEV_MAJOR))
587 rdev_major = read_int(f);
588 if (flags & XMIT_RDEV_MINOR_IS_SMALL)
589 rdev_minor = read_byte(f);
590 else
591 rdev_minor = read_int(f);
592 rdev = makedev(rdev_major, rdev_minor);
593 }
594 }
595
596#ifdef SUPPORT_LINKS
597 if (preserve_links && S_ISLNK(mode)) {
598 linkname_len = read_int(f) + 1; /* count the '\0' */
599 if (linkname_len <= 0 || linkname_len > MAXPATHLEN) {
600 rprintf(FERROR, "overflow: linkname_len=%d\n",
601 linkname_len - 1);
602 overflow_exit("receive_file_entry");
603 }
604 }
605 else
606#endif
607 linkname_len = 0;
608
609 sum_len = always_checksum && S_ISREG(mode) ? MD4_SUM_LENGTH : 0;
610
611 alloc_len = file_struct_len + dirname_len + basename_len
612 + linkname_len + sum_len;
613 bp = pool_alloc(flist->file_pool, alloc_len, "receive_file_entry");
614
615 file = (struct file_struct *)bp;
616 memset(bp, 0, file_struct_len);
617 bp += file_struct_len;
618
619 file->flags = 0;
620 file->modtime = modtime;
621 file->length = file_length;
622 file->mode = mode;
623 file->uid = uid;
624 file->gid = gid;
625
626 if (dirname_len) {
627 file->dirname = lastdir = bp;
628 lastdir_len = dirname_len - 1;
629 memcpy(bp, dirname, dirname_len - 1);
630 bp += dirname_len;
631 bp[-1] = '\0';
632 lastdir_depth = count_dir_elements(lastdir);
633 file->dir.depth = lastdir_depth + 1;
634 } else if (dirname) {
635 file->dirname = dirname; /* we're reusing lastname */
636 file->dir.depth = lastdir_depth + 1;
637 } else
638 file->dir.depth = 1;
639
640 if (S_ISDIR(mode)) {
641 if (basename_len == 1+1 && *basename == '.') /* +1 for '\0' */
642 file->dir.depth--;
643 if (flags & XMIT_TOP_DIR) {
644 in_del_hier = recurse;
645 del_hier_name_len = file->dir.depth == 0 ? 0 : l1 + l2;
646 if (relative_paths && del_hier_name_len > 2
647 && basename_len == 1+1 && *basename == '.')
648 del_hier_name_len -= 2;
649 file->flags |= FLAG_TOP_DIR | FLAG_DEL_HERE;
650 } else if (in_del_hier) {
651 if (!relative_paths || !del_hier_name_len
652 || (l1 >= del_hier_name_len
653 && thisname[del_hier_name_len] == '/'))
654 file->flags |= FLAG_DEL_HERE;
655 else
656 in_del_hier = 0;
657 }
658 }
659
660 file->basename = bp;
661 memcpy(bp, basename, basename_len);
662 bp += basename_len;
663
664 if (preserve_devices && IS_DEVICE(mode))
665 file->u.rdev = rdev;
666
667#ifdef SUPPORT_LINKS
668 if (linkname_len) {
669 file->u.link = bp;
670 read_sbuf(f, bp, linkname_len - 1);
671 if (sanitize_paths)
672 sanitize_path(bp, bp, "", lastdir_depth);
673 bp += linkname_len;
674 }
675#endif
676
677#ifdef SUPPORT_HARD_LINKS
678 if (preserve_hard_links && protocol_version < 28 && S_ISREG(mode))
679 flags |= XMIT_HAS_IDEV_DATA;
680 if (flags & XMIT_HAS_IDEV_DATA) {
681 int64 inode;
682 if (protocol_version < 26) {
683 dev = read_int(f);
684 inode = read_int(f);
685 } else {
686 if (!(flags & XMIT_SAME_DEV))
687 dev = read_longint(f);
688 inode = read_longint(f);
689 }
690 if (flist->hlink_pool) {
691 file->link_u.idev = pool_talloc(flist->hlink_pool,
692 struct idev, 1, "inode_table");
693 file->F_INODE = inode;
694 file->F_DEV = dev;
695 }
696 }
697#endif
698
699 if (always_checksum && (sum_len || protocol_version < 28)) {
700 char *sum;
701 int slen = protocol_version < 21 ? 2 : MD4_SUM_LENGTH;
702 if (sum_len) {
703 file->u.sum = sum = bp;
704 /*bp += sum_len;*/
705 } else {
706 /* Prior to 28, we get a useless set of nulls. */
707 sum = empty_sum;
708 }
709 read_buf(f, sum, slen);
710 }
711
712 if (!preserve_perms) {
713 /* set an appropriate set of permissions based on original
714 * permissions and umask. This emulates what GNU cp does */
715 file->mode &= ~orig_umask;
716 }
717
718 return file;
719}
720
721/**
722 * Create a file_struct for a named file by reading its stat()
723 * information and performing extensive checks against global
724 * options.
725 *
726 * @return the new file, or NULL if there was an error or this file
727 * should be excluded.
728 *
729 * @todo There is a small optimization opportunity here to avoid
730 * stat()ing the file in some circumstances, which has a certain cost.
731 * We are called immediately after doing readdir(), and so we may
732 * already know the d_type of the file. We could for example avoid
733 * statting directories if we're not recursing, but this is not a very
734 * important case. Some systems may not have d_type.
735 **/
736struct file_struct *make_file(char *fname, struct file_list *flist,
737 int filter_level)
738{
739 static char *lastdir;
740 static int lastdir_len = -1;
741 struct file_struct *file;
742 STRUCT_STAT st;
743 char sum[SUM_LENGTH];
744 char thisname[MAXPATHLEN];
745 char linkname[MAXPATHLEN];
746 int alloc_len, basename_len, dirname_len, linkname_len, sum_len;
747 char *basename, *dirname, *bp;
748 unsigned short flags = 0;
749
750 if (!flist || !flist->count) /* Ignore lastdir when invalid. */
751 lastdir_len = -1;
752
753 if (strlcpy(thisname, fname, sizeof thisname)
754 >= sizeof thisname - flist_dir_len) {
755 rprintf(FINFO, "skipping overly long name: %s\n",
756 safe_fname(fname));
757 return NULL;
758 }
759 clean_fname(thisname, 0);
760 if (sanitize_paths)
761 sanitize_path(thisname, thisname, "", 0);
762
763 memset(sum, 0, SUM_LENGTH);
764
765 if (readlink_stat(thisname, &st, linkname) != 0) {
766 int save_errno = errno;
767 /* See if file is excluded before reporting an error. */
768 if (filter_level != NO_FILTERS
769 && is_excluded(thisname, 0, filter_level))
770 return NULL;
771 if (save_errno == ENOENT) {
772#ifdef SUPPORT_LINKS
773 /* Avoid "vanished" error if symlink points nowhere. */
774 if (copy_links && do_lstat(thisname, &st) == 0
775 && S_ISLNK(st.st_mode)) {
776 io_error |= IOERR_GENERAL;
777 rprintf(FERROR, "symlink has no referent: %s\n",
778 full_fname(thisname));
779 } else
780#endif
781 {
782 enum logcode c = am_daemon && protocol_version < 28
783 ? FERROR : FINFO;
784 io_error |= IOERR_VANISHED;
785 rprintf(c, "file has vanished: %s\n",
786 full_fname(thisname));
787 }
788 } else {
789 io_error |= IOERR_GENERAL;
790 rsyserr(FERROR, save_errno, "readlink %s failed",
791 full_fname(thisname));
792 }
793 return NULL;
794 }
795
796 /* backup.c calls us with filter_level set to NO_FILTERS. */
797 if (filter_level == NO_FILTERS)
798 goto skip_filters;
799
800 if (S_ISDIR(st.st_mode) && !xfer_dirs) {
801 rprintf(FINFO, "skipping directory %s\n", safe_fname(thisname));
802 return NULL;
803 }
804
805 /* We only care about directories because we need to avoid recursing
806 * into a mount-point directory, not to avoid copying a symlinked
807 * file if -L (or similar) was specified. */
808 if (one_file_system && st.st_dev != filesystem_dev
809 && S_ISDIR(st.st_mode))
810 flags |= FLAG_MOUNT_POINT;
811
812 if (is_excluded(thisname, S_ISDIR(st.st_mode) != 0, filter_level))
813 return NULL;
814
815 if (lp_ignore_nonreadable(module_id)) {
816#ifdef SUPPORT_LINKS
817 if (!S_ISLNK(st.st_mode))
818#endif
819 if (access(thisname, R_OK) != 0)
820 return NULL;
821 }
822
823skip_filters:
824
825 if (verbose > 2) {
826 rprintf(FINFO, "[%s] make_file(%s,*,%d)\n",
827 who_am_i(), safe_fname(thisname), filter_level);
828 }
829
830 if ((basename = strrchr(thisname, '/')) != NULL) {
831 dirname_len = ++basename - thisname; /* counts future '\0' */
832 if (lastdir_len == dirname_len - 1
833 && strncmp(thisname, lastdir, lastdir_len) == 0) {
834 dirname = lastdir;
835 dirname_len = 0; /* indicates no copy is needed */
836 } else
837 dirname = thisname;
838 } else {
839 basename = thisname;
840 dirname = NULL;
841 dirname_len = 0;
842 }
843 basename_len = strlen(basename) + 1; /* count the '\0' */
844
845#ifdef SUPPORT_LINKS
846 linkname_len = S_ISLNK(st.st_mode) ? strlen(linkname) + 1 : 0;
847#else
848 linkname_len = 0;
849#endif
850
851 sum_len = always_checksum && S_ISREG(st.st_mode) ? MD4_SUM_LENGTH : 0;
852
853 alloc_len = file_struct_len + dirname_len + basename_len
854 + linkname_len + sum_len;
855 if (flist) {
856 bp = pool_alloc(flist->file_pool, alloc_len,
857 "receive_file_entry");
858 } else {
859 if (!(bp = new_array(char, alloc_len)))
860 out_of_memory("receive_file_entry");
861 }
862
863 file = (struct file_struct *)bp;
864 memset(bp, 0, file_struct_len);
865 bp += file_struct_len;
866
867 file->flags = flags;
868 file->modtime = st.st_mtime;
869 file->length = st.st_size;
870 if (chmod_modes && am_sender && (S_ISREG(st.st_mode) || S_ISDIR(st.st_mode)))
871 file->mode = tweak_mode(st.st_mode, chmod_modes);
872 else
873 file->mode = st.st_mode;
874 file->uid = st.st_uid;
875 file->gid = st.st_gid;
876
877#ifdef SUPPORT_HARD_LINKS
878 if (flist && flist->hlink_pool) {
879 if (protocol_version < 28) {
880 if (S_ISREG(st.st_mode))
881 file->link_u.idev = pool_talloc(
882 flist->hlink_pool, struct idev, 1,
883 "inode_table");
884 } else {
885 if (!S_ISDIR(st.st_mode) && st.st_nlink > 1)
886 file->link_u.idev = pool_talloc(
887 flist->hlink_pool, struct idev, 1,
888 "inode_table");
889 }
890 }
891 if (file->link_u.idev) {
892 file->F_DEV = st.st_dev;
893 file->F_INODE = st.st_ino;
894 }
895#endif
896
897 if (dirname_len) {
898 file->dirname = lastdir = bp;
899 lastdir_len = dirname_len - 1;
900 memcpy(bp, dirname, dirname_len - 1);
901 bp += dirname_len;
902 bp[-1] = '\0';
903 } else if (dirname)
904 file->dirname = dirname;
905
906 file->basename = bp;
907 memcpy(bp, basename, basename_len);
908 bp += basename_len;
909
910#ifdef HAVE_STRUCT_STAT_ST_RDEV
911 if (preserve_devices && IS_DEVICE(st.st_mode))
912 file->u.rdev = st.st_rdev;
913#endif
914
915#ifdef SUPPORT_LINKS
916 if (linkname_len) {
917 file->u.link = bp;
918 memcpy(bp, linkname, linkname_len);
919 bp += linkname_len;
920 }
921#endif
922
923 if (sum_len) {
924 file->u.sum = bp;
925 file_checksum(thisname, bp, st.st_size);
926 /*bp += sum_len;*/
927 }
928
929 file->dir.root = flist_dir;
930
931 /* This code is only used by the receiver when it is building
932 * a list of files for a delete pass. */
933 if (keep_dirlinks && linkname_len && flist) {
934 STRUCT_STAT st2;
935 int save_mode = file->mode;
936 file->mode = S_IFDIR; /* find a directory w/our name */
937 if (flist_find(the_file_list, file) >= 0
938 && do_stat(thisname, &st2) == 0 && S_ISDIR(st2.st_mode)) {
939 file->modtime = st2.st_mtime;
940 file->length = st2.st_size;
941 file->mode = st2.st_mode;
942 file->uid = st2.st_uid;
943 file->gid = st2.st_gid;
944 file->u.link = NULL;
945 } else
946 file->mode = save_mode;
947 }
948
949 if (S_ISREG(st.st_mode) || S_ISLNK(st.st_mode))
950 stats.total_size += st.st_size;
951
952 return file;
953}
954
955static struct file_struct *send_file_name(int f, struct file_list *flist,
956 char *fname, unsigned short base_flags)
957{
958 struct file_struct *file;
959
960 file = make_file(fname, flist, f == -2 ? SERVER_FILTERS : ALL_FILTERS);
961 if (!file)
962 return NULL;
963
964 maybe_emit_filelist_progress(flist->count + flist_count_offset);
965
966 flist_expand(flist);
967
968 if (file->basename[0]) {
969 flist->files[flist->count++] = file;
970 send_file_entry(file, f, base_flags);
971 }
972 return file;
973}
974
975static void send_if_directory(int f, struct file_list *flist,
976 struct file_struct *file,
977 char *fbuf, unsigned int ol)
978{
979 char is_dot_dir = fbuf[ol-1] == '.' && (ol == 1 || fbuf[ol-2] == '/');
980
981 if (S_ISDIR(file->mode)
982 && !(file->flags & FLAG_MOUNT_POINT) && f_name_to(file, fbuf)) {
983 void *save_filters;
984 unsigned int len = strlen(fbuf);
985 if (len > 1 && fbuf[len-1] == '/')
986 fbuf[--len] = '\0';
987 if (len >= MAXPATHLEN - 1) {
988 io_error |= IOERR_GENERAL;
989 rprintf(FERROR, "skipping long-named directory: %s\n",
990 full_fname(fbuf));
991 return;
992 }
993 save_filters = push_local_filters(fbuf, len);
994 send_directory(f, flist, fbuf, len);
995 pop_local_filters(save_filters);
996 fbuf[ol] = '\0';
997 if (is_dot_dir)
998 fbuf[ol-1] = '.';
999 }
1000}
1001
1002/* This function is normally called by the sender, but the receiving side also
1003 * calls it from get_dirlist() with f set to -1 so that we just construct the
1004 * file list in memory without sending it over the wire. Also, get_dirlist()
1005 * might call this with f set to -2, which also indicates that local filter
1006 * rules should be ignored. */
1007static void send_directory(int f, struct file_list *flist,
1008 char *fbuf, int len)
1009{
1010 struct dirent *di;
1011 unsigned remainder;
1012 char *p;
1013 DIR *d;
1014 int start = flist->count;
1015
1016 if (!(d = opendir(fbuf))) {
1017 io_error |= IOERR_GENERAL;
1018 rsyserr(FERROR, errno, "opendir %s failed", full_fname(fbuf));
1019 return;
1020 }
1021
1022 p = fbuf + len;
1023 if (len != 1 || *fbuf != '/')
1024 *p++ = '/';
1025 *p = '\0';
1026 remainder = MAXPATHLEN - (p - fbuf);
1027
1028 for (errno = 0, di = readdir(d); di; errno = 0, di = readdir(d)) {
1029 char *dname = d_name(di);
1030 if (dname[0] == '.' && (dname[1] == '\0'
1031 || (dname[1] == '.' && dname[2] == '\0')))
1032 continue;
1033 if (strlcpy(p, dname, remainder) < remainder)
1034 send_file_name(f, flist, fbuf, 0);
1035 else {
1036 io_error |= IOERR_GENERAL;
1037 rprintf(FINFO,
1038 "cannot send long-named file %s\n",
1039 full_fname(fbuf));
1040 }
1041 }
1042
1043 fbuf[len] = '\0';
1044
1045 if (errno) {
1046 io_error |= IOERR_GENERAL;
1047 rsyserr(FERROR, errno, "readdir(%s)", full_fname(fbuf));
1048 }
1049
1050 closedir(d);
1051
1052 if (recurse) {
1053 int i, end = flist->count - 1;
1054 for (i = start; i <= end; i++)
1055 send_if_directory(f, flist, flist->files[i], fbuf, len);
1056 }
1057}
1058
1059struct file_list *send_file_list(int f, int argc, char *argv[])
1060{
1061 int len;
1062 STRUCT_STAT st;
1063 char *p, *dir, olddir[sizeof curr_dir];
1064 char lastpath[MAXPATHLEN] = "";
1065 struct file_list *flist;
1066 struct timeval start_tv, end_tv;
1067 int64 start_write;
1068 int use_ff_fd = 0;
1069
1070 if (show_filelist_p())
1071 start_filelist_progress("building file list");
1072
1073 start_write = stats.total_written;
1074 gettimeofday(&start_tv, NULL);
1075
1076 flist = flist_new(WITH_HLINK, "send_file_list");
1077
1078 io_start_buffering_out();
1079 if (filesfrom_fd >= 0) {
1080 if (argv[0] && !push_dir(argv[0])) {
1081 rsyserr(FERROR, errno, "push_dir %s failed",
1082 full_fname(argv[0]));
1083 exit_cleanup(RERR_FILESELECT);
1084 }
1085 use_ff_fd = 1;
1086 }
1087
1088 while (1) {
1089 char fbuf[MAXPATHLEN];
1090 char *fn;
1091 int is_dot_dir;
1092
1093 if (use_ff_fd) {
1094 if (read_filesfrom_line(filesfrom_fd, fbuf) == 0)
1095 break;
1096 sanitize_path(fbuf, fbuf, "", 0);
1097 } else {
1098 if (argc-- == 0)
1099 break;
1100 strlcpy(fbuf, *argv++, MAXPATHLEN);
1101 if (sanitize_paths)
1102 sanitize_path(fbuf, fbuf, "", 0);
1103 }
1104
1105 len = strlen(fbuf);
1106 if (!len || fbuf[len - 1] == '/') {
1107 if (len == 2 && fbuf[0] == '.') {
1108 /* Turn "./" into just "." rather than "./." */
1109 fbuf[1] = '\0';
1110 } else {
1111 if (len + 1 >= MAXPATHLEN)
1112 overflow_exit("send_file_list");
1113 fbuf[len++] = '.';
1114 fbuf[len] = '\0';
1115 }
1116 is_dot_dir = 1;
1117 } else if (len > 1 && fbuf[len-1] == '.' && fbuf[len-2] == '.'
1118 && (len == 2 || fbuf[len-3] == '/')) {
1119 if (len + 2 >= MAXPATHLEN)
1120 overflow_exit("send_file_list");
1121 fbuf[len++] = '/';
1122 fbuf[len++] = '.';
1123 fbuf[len] = '\0';
1124 is_dot_dir = 1;
1125 } else {
1126 is_dot_dir = fbuf[len-1] == '.'
1127 && (len == 1 || fbuf[len-2] == '/');
1128 }
1129
1130 if (link_stat(fbuf, &st, keep_dirlinks) != 0) {
1131 io_error |= IOERR_GENERAL;
1132 rsyserr(FERROR, errno, "link_stat %s failed",
1133 full_fname(fbuf));
1134 continue;
1135 }
1136
1137 if (S_ISDIR(st.st_mode) && !xfer_dirs) {
1138 rprintf(FINFO, "skipping directory %s\n",
1139 safe_fname(fbuf));
1140 continue;
1141 }
1142
1143 dir = NULL;
1144 olddir[0] = '\0';
1145
1146 if (!relative_paths) {
1147 p = strrchr(fbuf, '/');
1148 if (p) {
1149 *p = '\0';
1150 if (p == fbuf)
1151 dir = "/";
1152 else
1153 dir = fbuf;
1154 len -= p - fbuf + 1;
1155 fn = p + 1;
1156 } else
1157 fn = fbuf;
1158 } else if ((p = strstr(fbuf, "/./")) != NULL) {
1159 *p = '\0';
1160 if (p == fbuf)
1161 dir = "/";
1162 else
1163 dir = fbuf;
1164 len -= p - fbuf + 3;
1165 fn = p + 3;
1166 } else
1167 fn = fbuf;
1168
1169 if (!*fn) {
1170 len = 1;
1171 fn = ".";
1172 }
1173
1174 if (dir && *dir) {
1175 static char *lastdir;
1176 static int lastdir_len;
1177
1178 strlcpy(olddir, curr_dir, sizeof olddir);
1179
1180 if (!push_dir(dir)) {
1181 io_error |= IOERR_GENERAL;
1182 rsyserr(FERROR, errno, "push_dir %s failed",
1183 full_fname(dir));
1184 continue;
1185 }
1186
1187 if (lastdir && strcmp(lastdir, dir) == 0) {
1188 flist_dir = lastdir;
1189 flist_dir_len = lastdir_len;
1190 } else {
1191 flist_dir = lastdir = strdup(dir);
1192 flist_dir_len = lastdir_len = strlen(dir);
1193 }
1194 }
1195
1196 if (fn != fbuf)
1197 memmove(fbuf, fn, len + 1);
1198
1199 if (implied_dirs && (p=strrchr(fbuf,'/')) && p != fbuf) {
1200 /* Send the implied directories at the start of the
1201 * source spec, so we get their permissions right. */
1202 char *lp = lastpath, *slash = fbuf;
1203 *p = '\0';
1204 /* Skip any initial directories in our path that we
1205 * have in common with lastpath. */
1206 for (fn = fbuf; *fn && *lp == *fn; lp++, fn++) {
1207 if (*fn == '/')
1208 slash = fn;
1209 }
1210 *p = '/';
1211 if (fn != p || (*lp && *lp != '/')) {
1212 int save_copy_links = copy_links;
1213 int save_xfer_dirs = xfer_dirs;
1214 copy_links = copy_unsafe_links;
1215 xfer_dirs = 1;
1216 while ((slash = strchr(slash+1, '/')) != 0) {
1217 *slash = '\0';
1218 send_file_name(f, flist, fbuf, 0);
1219 *slash = '/';
1220 }
1221 copy_links = save_copy_links;
1222 xfer_dirs = save_xfer_dirs;
1223 *p = '\0';
1224 strlcpy(lastpath, fbuf, sizeof lastpath);
1225 *p = '/';
1226 }
1227 }
1228
1229 if (one_file_system)
1230 filesystem_dev = st.st_dev;
1231
1232 if (recurse || (xfer_dirs && is_dot_dir)) {
1233 struct file_struct *file;
1234 if ((file = send_file_name(f, flist, fbuf, XMIT_TOP_DIR)))
1235 send_if_directory(f, flist, file, fbuf, len);
1236 } else
1237 send_file_name(f, flist, fbuf, 0);
1238
1239 if (olddir[0]) {
1240 flist_dir = NULL;
1241 flist_dir_len = 0;
1242 if (!pop_dir(olddir)) {
1243 rsyserr(FERROR, errno, "pop_dir %s failed",
1244 full_fname(olddir));
1245 exit_cleanup(RERR_FILESELECT);
1246 }
1247 }
1248 }
1249
1250 gettimeofday(&end_tv, NULL);
1251 stats.flist_buildtime = (int64)(end_tv.tv_sec - start_tv.tv_sec) * 1000
1252 + (end_tv.tv_usec - start_tv.tv_usec) / 1000;
1253 if (stats.flist_buildtime == 0)
1254 stats.flist_buildtime = 1;
1255 start_tv = end_tv;
1256
1257 send_file_entry(NULL, f, 0);
1258
1259 if (show_filelist_p())
1260 finish_filelist_progress(flist);
1261
1262 gettimeofday(&end_tv, NULL);
1263 stats.flist_xfertime = (int64)(end_tv.tv_sec - start_tv.tv_sec) * 1000
1264 + (end_tv.tv_usec - start_tv.tv_usec) / 1000;
1265
1266 if (flist->hlink_pool) {
1267 pool_destroy(flist->hlink_pool);
1268 flist->hlink_pool = NULL;
1269 }
1270
1271 /* Sort the list without removing any duplicates. This allows the
1272 * receiving side to ask for any name they like, which gives us the
1273 * flexibility to change the way we unduplicate names in the future
1274 * without causing a compatibility problem with older versions. */
1275 clean_flist(flist, 0, 0);
1276
1277 /* Now send the uid/gid list. This was introduced in
1278 * protocol version 15 */
1279 send_uid_list(f);
1280
1281 /* send the io_error flag */
1282 write_int(f, lp_ignore_errors(module_id) ? 0 : io_error);
1283
1284 io_end_buffering();
1285 stats.flist_size = stats.total_written - start_write;
1286 stats.num_files = flist->count;
1287
1288 if (verbose > 3)
1289 output_flist(flist);
1290
1291 if (verbose > 2)
1292 rprintf(FINFO, "send_file_list done\n");
1293
1294 return flist;
1295}
1296
1297struct file_list *recv_file_list(int f)
1298{
1299 struct file_list *flist;
1300 unsigned short flags;
1301 int64 start_read;
1302
1303 if (show_filelist_p())
1304 start_filelist_progress("receiving file list");
1305
1306 start_read = stats.total_read;
1307
1308 flist = flist_new(WITH_HLINK, "recv_file_list");
1309
1310 flist->count = 0;
1311 flist->malloced = 1000;
1312 flist->files = new_array(struct file_struct *, flist->malloced);
1313 if (!flist->files)
1314 goto oom;
1315
1316
1317 while ((flags = read_byte(f)) != 0) {
1318 struct file_struct *file;
1319
1320 flist_expand(flist);
1321
1322 if (protocol_version >= 28 && (flags & XMIT_EXTENDED_FLAGS))
1323 flags |= read_byte(f) << 8;
1324 file = receive_file_entry(flist, flags, f);
1325
1326 if (S_ISREG(file->mode))
1327 stats.total_size += file->length;
1328
1329 flist->files[flist->count++] = file;
1330
1331 maybe_emit_filelist_progress(flist->count);
1332
1333 if (verbose > 2) {
1334 rprintf(FINFO, "recv_file_name(%s)\n",
1335 safe_fname(f_name(file)));
1336 }
1337 }
1338 receive_file_entry(NULL, 0, 0); /* Signal that we're done. */
1339
1340 if (verbose > 2)
1341 rprintf(FINFO, "received %d names\n", flist->count);
1342
1343 if (show_filelist_p())
1344 finish_filelist_progress(flist);
1345
1346 clean_flist(flist, relative_paths, 1);
1347
1348 if (f >= 0) {
1349 /* Now send the uid/gid list. This was introduced in
1350 * protocol version 15 */
1351 recv_uid_list(f, flist);
1352
1353 /* Recv the io_error flag */
1354 if (lp_ignore_errors(module_id) || ignore_errors)
1355 read_int(f);
1356 else
1357 io_error |= read_int(f);
1358 }
1359
1360 if (verbose > 3)
1361 output_flist(flist);
1362
1363 if (list_only) {
1364 int i;
1365 for (i = 0; i < flist->count; i++)
1366 list_file_entry(flist->files[i]);
1367 }
1368
1369 if (verbose > 2)
1370 rprintf(FINFO, "recv_file_list done\n");
1371
1372 stats.flist_size = stats.total_read - start_read;
1373 stats.num_files = flist->count;
1374
1375 return flist;
1376
1377oom:
1378 out_of_memory("recv_file_list");
1379 return NULL; /* not reached */
1380}
1381
/* qsort() callback: order two file-list slots by entry name. */
static int file_compare(struct file_struct **file1, struct file_struct **file2)
{
	struct file_struct *lhs = *file1;
	struct file_struct *rhs = *file2;

	return f_name_cmp(lhs, rhs);
}
1386
1387/* Search for an identically-named item in the file list. Note that the
1388 * items must agree in their directory-ness, or no match is returned. */
1389int flist_find(struct file_list *flist, struct file_struct *f)
1390{
1391 int low = flist->low, high = flist->high;
1392 int ret, mid, mid_up;
1393
1394 while (low <= high) {
1395 mid = (low + high) / 2;
1396 for (mid_up = mid; !flist->files[mid_up]->basename; mid_up++) {}
1397 if (mid_up <= high)
1398 ret = f_name_cmp(flist->files[mid_up], f);
1399 else
1400 ret = 1;
1401 if (ret == 0) {
1402 if (protocol_version < 29
1403 && S_ISDIR(flist->files[mid_up]->mode)
1404 != S_ISDIR(f->mode))
1405 return -1;
1406 return mid_up;
1407 }
1408 if (ret > 0)
1409 high = mid - 1;
1410 else
1411 low = mid_up + 1;
1412 }
1413 return -1;
1414}
1415
1416/*
1417 * Free up any resources a file_struct has allocated
1418 * and clear the file.
1419 */
1420void clear_file(int i, struct file_list *flist)
1421{
1422 if (flist->hlink_pool && flist->files[i]->link_u.idev)
1423 pool_free(flist->hlink_pool, 0, flist->files[i]->link_u.idev);
1424 memset(flist->files[i], 0, file_struct_len);
1425}
1426
1427/*
1428 * allocate a new file list
1429 */
1430struct file_list *flist_new(int with_hlink, char *msg)
1431{
1432 struct file_list *flist;
1433
1434 flist = new(struct file_list);
1435 if (!flist)
1436 out_of_memory(msg);
1437
1438 memset(flist, 0, sizeof (struct file_list));
1439
1440 if (!(flist->file_pool = pool_create(FILE_EXTENT, 0,
1441 out_of_memory, POOL_INTERN)))
1442 out_of_memory(msg);
1443
1444#ifdef SUPPORT_HARD_LINKS
1445 if (with_hlink && preserve_hard_links) {
1446 if (!(flist->hlink_pool = pool_create(HLINK_EXTENT,
1447 sizeof (struct idev), out_of_memory, POOL_INTERN)))
1448 out_of_memory(msg);
1449 }
1450#endif
1451
1452 return flist;
1453}
1454
1455/*
1456 * free up all elements in a flist
1457 */
1458void flist_free(struct file_list *flist)
1459{
1460 pool_destroy(flist->file_pool);
1461 pool_destroy(flist->hlink_pool);
1462 free(flist->files);
1463 free(flist);
1464}
1465
1466/*
1467 * This routine ensures we don't have any duplicate names in our file list.
1468 * duplicate names can cause corruption because of the pipelining
1469 */
1470static void clean_flist(struct file_list *flist, int strip_root, int no_dups)
1471{
1472 int i, prev_i = 0;
1473
1474 if (!flist)
1475 return;
1476 if (flist->count == 0) {
1477 flist->high = -1;
1478 return;
1479 }
1480
1481 sorting_flist = flist;
1482 qsort(flist->files, flist->count,
1483 sizeof flist->files[0], (int (*)())file_compare);
1484 sorting_flist = NULL;
1485
1486 for (i = no_dups? 0 : flist->count; i < flist->count; i++) {
1487 if (flist->files[i]->basename) {
1488 prev_i = i;
1489 break;
1490 }
1491 }
1492 flist->low = prev_i;
1493 while (++i < flist->count) {
1494 int j;
1495 struct file_struct *file = flist->files[i];
1496
1497 if (!file->basename)
1498 continue;
1499 if (f_name_cmp(file, flist->files[prev_i]) == 0)
1500 j = prev_i;
1501 else if (protocol_version >= 29 && S_ISDIR(file->mode)) {
1502 int save_mode = file->mode;
1503 /* Make sure that this directory doesn't duplicate a
1504 * non-directory earlier in the list. */
1505 flist->high = prev_i;
1506 file->mode = S_IFREG;
1507 j = flist_find(flist, file);
1508 file->mode = save_mode;
1509 } else
1510 j = -1;
1511 if (j >= 0) {
1512 struct file_struct *fp = flist->files[j];
1513 int keep, drop;
1514 /* If one is a dir and the other is not, we want to
1515 * keep the dir because it might have contents in the
1516 * list. */
1517 if (S_ISDIR(file->mode) != S_ISDIR(fp->mode)) {
1518 if (S_ISDIR(file->mode))
1519 keep = i, drop = j;
1520 else
1521 keep = j, drop = i;
1522 } else
1523 keep = j, drop = i;
1524 if (verbose > 1 && !am_server) {
1525 rprintf(FINFO,
1526 "removing duplicate name %s from file list (%d)\n",
1527 safe_fname(f_name(file)), drop);
1528 }
1529 /* Make sure that if we unduplicate '.', that we don't
1530 * lose track of a user-specified top directory. */
1531 flist->files[keep]->flags |= flist->files[drop]->flags
1532 & (FLAG_TOP_DIR|FLAG_DEL_HERE);
1533
1534 clear_file(drop, flist);
1535
1536 if (keep == i) {
1537 if (flist->low == drop) {
1538 for (j = drop + 1;
1539 j < i && !flist->files[j]->basename;
1540 j++) {}
1541 flist->low = j;
1542 }
1543 prev_i = i;
1544 }
1545 } else
1546 prev_i = i;
1547 }
1548 flist->high = no_dups ? prev_i : flist->count - 1;
1549
1550 if (strip_root) {
1551 /* We need to strip off the leading slashes for relative
1552 * paths, but this must be done _after_ the sorting phase. */
1553 for (i = flist->low; i <= flist->high; i++) {
1554 struct file_struct *file = flist->files[i];
1555
1556 if (!file->dirname)
1557 continue;
1558 if (*file->dirname == '/') {
1559 char *s = file->dirname + 1;
1560 while (*s == '/') s++;
1561 memmove(file->dirname, s, strlen(s) + 1);
1562 }
1563
1564 if (!*file->dirname)
1565 file->dirname = NULL;
1566 }
1567 }
1568}
1569
1570static void output_flist(struct file_list *flist)
1571{
1572 char uidbuf[16], gidbuf[16], depthbuf[16];
1573 struct file_struct *file;
1574 const char *who = who_am_i();
1575 int i;
1576
1577 for (i = 0; i < flist->count; i++) {
1578 file = flist->files[i];
1579 if ((am_root || am_sender) && preserve_uid)
1580 sprintf(uidbuf, " uid=%ld", (long)file->uid);
1581 else
1582 *uidbuf = '\0';
1583 if (preserve_gid && file->gid != GID_NONE)
1584 sprintf(gidbuf, " gid=%ld", (long)file->gid);
1585 else
1586 *gidbuf = '\0';
1587 if (!am_sender)
1588 sprintf(depthbuf, "%d", file->dir.depth);
1589 rprintf(FINFO, "[%s] i=%d %s %s%s%s%s mode=0%o len=%.0f%s%s flags=%x\n",
1590 who, i, am_sender ? NS(file->dir.root) : depthbuf,
1591 file->dirname ? safe_fname(file->dirname) : "",
1592 file->dirname ? "/" : "", NS(file->basename),
1593 S_ISDIR(file->mode) ? "/" : "", (int)file->mode,
1594 (double)file->length, uidbuf, gidbuf, file->flags);
1595 }
1596}
1597
1598enum fnc_state { s_DIR, s_SLASH, s_BASE, s_TRAILING };
1599enum fnc_type { t_PATH, t_ITEM };
1600
1601/* Compare the names of two file_struct entities, similar to how strcmp()
1602 * would do if it were operating on the joined strings.
1603 *
1604 * Some differences beginning with protocol_version 29: (1) directory names
1605 * are compared with an assumed trailing slash so that they compare in a
1606 * way that would cause them to sort immediately prior to any content they
1607 * may have; (2) a directory of any name compares after a non-directory of
1608 * any name at the same depth; (3) a directory with name "." compares prior
1609 * to anything else. These changes mean that a directory and a non-dir
1610 * with the same name will not compare as equal (protocol_version >= 29).
1611 *
1612 * The dirname component can be an empty string, but the basename component
1613 * cannot (and never is in the current codebase). The basename component
1614 * may be NULL (for a removed item), in which case it is considered to be
1615 * after any existing item. */
1616int f_name_cmp(struct file_struct *f1, struct file_struct *f2)
1617{
1618 int dif;
1619 const uchar *c1, *c2;
1620 enum fnc_state state1, state2;
1621 enum fnc_type type1, type2;
1622 enum fnc_type t_path = protocol_version >= 29 ? t_PATH : t_ITEM;
1623
1624 if (!f1 || !f1->basename) {
1625 if (!f2 || !f2->basename)
1626 return 0;
1627 return -1;
1628 }
1629 if (!f2 || !f2->basename)
1630 return 1;
1631
1632 c1 = (uchar*)f1->dirname;
1633 c2 = (uchar*)f2->dirname;
1634 if (c1 == c2)
1635 c1 = c2 = NULL;
1636 if (!c1) {
1637 type1 = S_ISDIR(f1->mode) ? t_path : t_ITEM;
1638 c1 = (uchar*)f1->basename;
1639 if (type1 == t_PATH && *c1 == '.' && !c1[1]) {
1640 type1 = t_ITEM;
1641 state1 = s_TRAILING;
1642 c1 = (uchar*)"";
1643 } else
1644 state1 = s_BASE;
1645 } else if (!*c1) {
1646 type1 = t_path;
1647 state1 = s_SLASH;
1648 c1 = (uchar*)"/";
1649 } else {
1650 type1 = t_path;
1651 state1 = s_DIR;
1652 }
1653 if (!c2) {
1654 type2 = S_ISDIR(f2->mode) ? t_path : t_ITEM;
1655 c2 = (uchar*)f2->basename;
1656 if (type2 == t_PATH && *c2 == '.' && !c2[1]) {
1657 type2 = t_ITEM;
1658 state2 = s_TRAILING;
1659 c2 = (uchar*)"";
1660 } else
1661 state2 = s_BASE;
1662 } else if (!*c2) {
1663 type2 = t_path;
1664 state2 = s_SLASH;
1665 c2 = (uchar*)"/";
1666 } else {
1667 type2 = t_path;
1668 state2 = s_DIR;
1669 }
1670
1671 if (type1 != type2)
1672 return type1 == t_PATH ? 1 : -1;
1673
1674 while (1) {
1675 if ((dif = (int)*c1++ - (int)*c2++) != 0)
1676 break;
1677 if (!*c1) {
1678 switch (state1) {
1679 case s_DIR:
1680 state1 = s_SLASH;
1681 c1 = (uchar*)"/";
1682 break;
1683 case s_SLASH:
1684 type1 = S_ISDIR(f1->mode) ? t_path : t_ITEM;
1685 c1 = (uchar*)f1->basename;
1686 if (type1 == t_PATH && *c1 == '.' && !c1[1]) {
1687 type1 = t_ITEM;
1688 state1 = s_TRAILING;
1689 c1 = (uchar*)"";
1690 } else
1691 state1 = s_BASE;
1692 break;
1693 case s_BASE:
1694 state1 = s_TRAILING;
1695 if (type1 == t_PATH) {
1696 c1 = (uchar*)"/";
1697 break;
1698 }
1699 /* FALL THROUGH */
1700 case s_TRAILING:
1701 type1 = t_ITEM;
1702 break;
1703 }
1704 if (*c2 && type1 != type2)
1705 return type1 == t_PATH ? 1 : -1;
1706 }
1707 if (!*c2) {
1708 switch (state2) {
1709 case s_DIR:
1710 state2 = s_SLASH;
1711 c2 = (uchar*)"/";
1712 break;
1713 case s_SLASH:
1714 type2 = S_ISDIR(f2->mode) ? t_path : t_ITEM;
1715 c2 = (uchar*)f2->basename;
1716 if (type2 == t_PATH && *c2 == '.' && !c2[1]) {
1717 type2 = t_ITEM;
1718 state2 = s_TRAILING;
1719 c2 = (uchar*)"";
1720 } else
1721 state2 = s_BASE;
1722 break;
1723 case s_BASE:
1724 state2 = s_TRAILING;
1725 if (type2 == t_PATH) {
1726 c2 = (uchar*)"/";
1727 break;
1728 }
1729 /* FALL THROUGH */
1730 case s_TRAILING:
1731 if (!*c1)
1732 return 0;
1733 type2 = t_ITEM;
1734 break;
1735 }
1736 if (type1 != type2)
1737 return type1 == t_PATH ? 1 : -1;
1738 }
1739 }
1740
1741 return dif;
1742}
1743
1744/* Return a copy of the full filename of a flist entry, using the indicated
1745 * buffer. No size-checking is done because we checked the size when creating
1746 * the file_struct entry.
1747 */
1748char *f_name_to(struct file_struct *f, char *fbuf)
1749{
1750 if (!f || !f->basename)
1751 return NULL;
1752
1753 if (f->dirname) {
1754 int len = strlen(f->dirname);
1755 memcpy(fbuf, f->dirname, len);
1756 fbuf[len] = '/';
1757 strcpy(fbuf + len + 1, f->basename);
1758 } else
1759 strcpy(fbuf, f->basename);
1760 return fbuf;
1761}
1762
1763/* Like f_name_to(), but we rotate through 5 static buffers of our own. */
1764char *f_name(struct file_struct *f)
1765{
1766 static char names[5][MAXPATHLEN];
1767 static unsigned int n;
1768
1769 n = (n + 1) % (sizeof names / sizeof names[0]);
1770
1771 return f_name_to(f, names[n]);
1772}
1773
1774/* Do a non-recursive scan of the named directory, possibly ignoring all
1775 * exclude rules except for the daemon's. If "dlen" is >=0, it is the length
1776 * of the dirname string, and also indicates that "dirname" is a MAXPATHLEN
1777 * buffer (the functions we call will append names onto the end, but the old
1778 * dir value will be restored on exit). */
1779struct file_list *get_dirlist(char *dirname, int dlen,
1780 int ignore_filter_rules)
1781{
1782 struct file_list *dirlist;
1783 char dirbuf[MAXPATHLEN];
1784 int save_recurse = recurse;
1785
1786 if (dlen < 0) {
1787 dlen = strlcpy(dirbuf, dirname, MAXPATHLEN);
1788 if (dlen >= MAXPATHLEN)
1789 return NULL;
1790 dirname = dirbuf;
1791 }
1792
1793 dirlist = flist_new(WITHOUT_HLINK, "get_dirlist");
1794
1795 recurse = 0;
1796 send_directory(ignore_filter_rules ? -2 : -1, dirlist, dirname, dlen);
1797 recurse = save_recurse;
1798 if (do_progress)
1799 flist_count_offset += dirlist->count;
1800
1801 clean_flist(dirlist, 0, 0);
1802
1803 if (verbose > 3)
1804 output_flist(dirlist);
1805
1806 return dirlist;
1807}