X-Git-Url: https://mattmccutchen.net/rsync/rsync.git/blobdiff_plain/8824e2cee4ec33cb11b97f96b40aec15d5191e9b..4f5b0756df0dfc925b9576db47ecce949c378e18:/flist.c diff --git a/flist.c b/flist.c index 252b91a5..731ffee9 100644 --- a/flist.c +++ b/flist.c @@ -145,7 +145,7 @@ static void list_file_entry(struct file_struct *f) permstring(perms, f->mode); -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (preserve_links && S_ISLNK(f->mode)) { rprintf(FINFO, "%s %11.0f %s %s -> %s\n", perms, @@ -178,7 +178,7 @@ static void list_file_entry(struct file_struct *f) **/ static int readlink_stat(const char *path, STRUCT_STAT *buffer, char *linkbuf) { -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (copy_links) return do_stat(path, buffer); if (link_stat(path, buffer, 0) < 0) @@ -204,7 +204,7 @@ static int readlink_stat(const char *path, STRUCT_STAT *buffer, char *linkbuf) int link_stat(const char *path, STRUCT_STAT *buffer, int follow_dirlinks) { -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (copy_links) return do_stat(path, buffer); if (do_lstat(path, buffer) < 0) @@ -253,7 +253,7 @@ static int is_excluded(char *fname, int is_dir, int filter_level) static int to_wire_mode(mode_t mode) { -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (S_ISLNK(mode) && (_S_IFLNK != 0120000)) return (mode & ~(_S_IFMT)) | 0120000; #endif @@ -385,7 +385,7 @@ void send_file_entry(struct file_struct *file, int f, unsigned short base_flags) else modtime = file->modtime; -#if SUPPORT_HARD_LINKS +#ifdef SUPPORT_HARD_LINKS if (file->link_u.idev) { if (file->F_DEV == dev) { if (protocol_version >= 28) @@ -463,7 +463,7 @@ void send_file_entry(struct file_struct *file, int f, unsigned short base_flags) } } -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (preserve_links && S_ISLNK(mode)) { int len = strlen(file->u.link); write_int(f, len); @@ -471,7 +471,7 @@ void send_file_entry(struct file_struct *file, int f, unsigned short base_flags) } #endif -#if SUPPORT_HARD_LINKS +#ifdef SUPPORT_HARD_LINKS if (flags & XMIT_HAS_IDEV_DATA) { if (protocol_version < 26) { /* 32-bit dev_t and ino_t */ @@ -508,8 +508,8 @@ void send_file_entry(struct file_struct *file, int f, unsigned short base_flags) -static void receive_file_entry(struct file_list *flist, int ndx, - unsigned short flags, int f) +static struct file_struct *receive_file_entry(struct file_list *flist, + unsigned short flags, int f) { static time_t modtime; static mode_t mode; @@ -537,7 +537,7 @@ static void receive_file_entry(struct file_list *flist, int ndx, *lastname = '\0'; lastdir_len = -1; in_del_hier = 0; - return; + return NULL; } if (flags & XMIT_SAME_NAME) @@ -611,7 +611,7 @@ static void receive_file_entry(struct file_list *flist, int ndx, } } -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (preserve_links && S_ISLNK(mode)) { linkname_len = read_int(f) + 1; /* count the '\0' */ if (linkname_len <= 0 || linkname_len > MAXPATHLEN) { @@ -630,7 +630,7 @@ static void receive_file_entry(struct file_list *flist, int ndx, + linkname_len + sum_len; bp = pool_alloc(flist->file_pool, alloc_len, "receive_file_entry"); - file = flist->files[ndx] = (struct file_struct *)bp; + file = (struct file_struct *)bp; memset(bp, 0, file_struct_len); bp += file_struct_len; @@ -679,7 +679,7 @@ static void receive_file_entry(struct file_list *flist, int ndx, if (preserve_devices && IS_DEVICE(mode)) file->u.rdev = rdev; -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (linkname_len) { file->u.link = bp; read_sbuf(f, bp, linkname_len - 1); @@ -689,7 +689,7 @@ static void receive_file_entry(struct file_list *flist, int ndx, } #endif -#if SUPPORT_HARD_LINKS +#ifdef SUPPORT_HARD_LINKS if (preserve_hard_links && protocol_version < 28 && S_ISREG(mode)) flags |= XMIT_HAS_IDEV_DATA; if (flags & XMIT_HAS_IDEV_DATA) { @@ -732,6 +732,8 @@ static void receive_file_entry(struct file_list *flist, int ndx, * permissions and umask. This emulates what GNU cp does */ file->mode &= ~orig_umask; } + + return file; } @@ -786,7 +788,7 @@ struct file_struct *make_file(char *fname, struct file_list *flist, && is_excluded(thisname, 0, filter_level)) return NULL; if (save_errno == ENOENT) { -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS /* Avoid "vanished" error if symlink points nowhere. */ if (copy_links && do_lstat(thisname, &st) == 0 && S_ISLNK(st.st_mode)) { @@ -830,7 +832,7 @@ struct file_struct *make_file(char *fname, struct file_list *flist, return NULL; if (lp_ignore_nonreadable(module_id)) { -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (!S_ISLNK(st.st_mode)) #endif if (access(thisname, R_OK) != 0) @@ -859,7 +861,7 @@ skip_filters: } basename_len = strlen(basename) + 1; /* count the '\0' */ -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS linkname_len = S_ISLNK(st.st_mode) ? strlen(linkname) + 1 : 0; #else linkname_len = 0; @@ -888,7 +890,7 @@ skip_filters: file->uid = st.st_uid; file->gid = st.st_gid; -#if SUPPORT_HARD_LINKS +#ifdef SUPPORT_HARD_LINKS if (flist && flist->hlink_pool) { if (protocol_version < 28) { if (S_ISREG(st.st_mode)) @@ -921,12 +923,12 @@ skip_filters: memcpy(bp, basename, basename_len); bp += basename_len; -#if HAVE_STRUCT_STAT_ST_RDEV +#ifdef HAVE_STRUCT_STAT_ST_RDEV if (preserve_devices && IS_DEVICE(st.st_mode)) file->u.rdev = st.st_rdev; #endif -#if SUPPORT_LINKS +#ifdef SUPPORT_LINKS if (linkname_len) { file->u.link = bp; memcpy(bp, linkname, linkname_len); @@ -946,8 +948,9 @@ skip_filters: * a list of files for a delete pass. */ if (keep_dirlinks && linkname_len && flist) { STRUCT_STAT st2; - int i = flist_find(received_flist, file); - if (i >= 0 && S_ISDIR(received_flist->files[i]->mode) + int save_mode = file->mode; + file->mode = S_IFDIR; /* find a directory w/our name */ + if (flist_find(received_flist, file) >= 0 && do_stat(thisname, &st2) == 0 && S_ISDIR(st2.st_mode)) { file->modtime = st2.st_mtime; file->length = st2.st_size; @@ -955,11 +958,8 @@ skip_filters: file->uid = st2.st_uid; file->gid = st2.st_gid; file->u.link = NULL; - if (file->link_u.idev) { - pool_free(flist->hlink_pool, 0, file->link_u.idev); - file->link_u.idev = NULL; - } - } + } else + file->mode = save_mode; } if (!S_ISDIR(st.st_mode)) @@ -1236,6 +1236,10 @@ struct file_list *send_file_list(int f, int argc, char *argv[]) flist->hlink_pool = NULL; } + /* Sort the list without removing any duplicates. This allows the + * receiving side to ask for any name they like, which gives us the + * flexibility to change the way we unduplicate names in the future + * without causing a compatibility problem with older versions. */ clean_flist(flist, 0, 0); /* Now send the uid/gid list. This was introduced in @@ -1281,27 +1285,27 @@ struct file_list *recv_file_list(int f) while ((flags = read_byte(f)) != 0) { - int i = flist->count; + struct file_struct *file; flist_expand(flist); if (protocol_version >= 28 && (flags & XMIT_EXTENDED_FLAGS)) flags |= read_byte(f) << 8; - receive_file_entry(flist, i, flags, f); + file = receive_file_entry(flist, flags, f); - if (S_ISREG(flist->files[i]->mode)) - stats.total_size += flist->files[i]->length; + if (S_ISREG(file->mode)) + stats.total_size += file->length; - flist->count++; + flist->files[flist->count++] = file; maybe_emit_filelist_progress(flist); if (verbose > 2) { rprintf(FINFO, "recv_file_name(%s)\n", - safe_fname(f_name(flist->files[i]))); + safe_fname(f_name(file))); } } - receive_file_entry(NULL, 0, 0, 0); /* Signal that we're done. */ + receive_file_entry(NULL, 0, 0); /* Signal that we're done. */ if (verbose > 2) rprintf(FINFO, "received %d names\n", flist->count); @@ -1352,6 +1356,8 @@ static int file_compare(struct file_struct **file1, struct file_struct **file2) } +/* Search for an identically-named item in the file list. Note that the + * items must agree in their directory-ness, or no match is returned. */ int flist_find(struct file_list *flist, struct file_struct *f) { int low = flist->low, high = flist->high; @@ -1364,8 +1370,13 @@ int flist_find(struct file_list *flist, struct file_struct *f) ret = f_name_cmp(flist->files[mid_up], f); else ret = 1; - if (ret == 0) + if (ret == 0) { + if (protocol_version < 29 + && S_ISDIR(flist->files[mid_up]->mode) + != S_ISDIR(f->mode)) + return -1; return mid_up; + } if (ret > 0) high = mid - 1; else @@ -1374,6 +1385,7 @@ int flist_find(struct file_list *flist, struct file_struct *f) return -1; } + /* * Free up any resources a file_struct has allocated * and clear the file. @@ -1403,7 +1415,7 @@ struct file_list *flist_new(int with_hlink, char *msg) out_of_memory, POOL_INTERN))) out_of_memory(msg); -#if SUPPORT_HARD_LINKS +#ifdef SUPPORT_HARD_LINKS if (with_hlink && preserve_hard_links) { if (!(flist->hlink_pool = pool_create(HLINK_EXTENT, sizeof (struct idev), out_of_memory, POOL_INTERN))) @@ -1448,41 +1460,78 @@ static void clean_flist(struct file_list *flist, int strip_root, int no_dups) } flist->low = prev_i; while (++i < flist->count) { - if (!flist->files[i]->basename) + int j; + struct file_struct *file = flist->files[i]; + + if (!file->basename) continue; - if (f_name_cmp(flist->files[i], flist->files[prev_i]) == 0) { + if (f_name_cmp(file, flist->files[prev_i]) == 0) + j = prev_i; + else if (protocol_version >= 29 && S_ISDIR(file->mode)) { + int save_mode = file->mode; + /* Make sure that this directory doesn't duplicate a + * non-directory earlier in the list. */ + flist->high = prev_i; + file->mode = S_IFREG; + j = flist_find(flist, file); + file->mode = save_mode; + } else + j = -1; + if (j >= 0) { + struct file_struct *fp = flist->files[j]; + int keep, drop; + /* If one is a dir and the other is not, we want to + * keep the dir because it might have contents in the + * list. */ + if (S_ISDIR(file->mode) != S_ISDIR(fp->mode)) { + if (S_ISDIR(file->mode)) + keep = i, drop = j; + else + keep = j, drop = i; + } else + keep = j, drop = i; if (verbose > 1 && !am_server) { rprintf(FINFO, - "removing duplicate name %s from file list %d\n", - safe_fname(f_name(flist->files[i])), i); + "removing duplicate name %s from file list (%d)\n", + safe_fname(f_name(file)), drop); } /* Make sure that if we unduplicate '.', that we don't * lose track of a user-specified top directory. */ - if (flist->files[i]->flags & FLAG_TOP_DIR) - flist->files[prev_i]->flags |= FLAG_TOP_DIR; + if (flist->files[drop]->flags & FLAG_TOP_DIR) + flist->files[keep]->flags |= FLAG_TOP_DIR; - clear_file(i, flist); + clear_file(drop, flist); + + if (keep == i) { + if (flist->low == drop) { + for (j = drop + 1; + j < i && !flist->files[j]->basename; + j++) {} + flist->low = j; + } + prev_i = i; + } } else prev_i = i; } - flist->high = prev_i; + flist->high = no_dups ? prev_i : flist->count - 1; if (strip_root) { - /* we need to strip off the root directory in the case - of relative paths, but this must be done _after_ - the sorting phase */ - for (i = 0; i < flist->count; i++) { - if (flist->files[i]->dirname && - flist->files[i]->dirname[0] == '/') { - memmove(&flist->files[i]->dirname[0], - &flist->files[i]->dirname[1], - strlen(flist->files[i]->dirname)); - } + /* We need to strip off the leading slashes for relative + * paths, but this must be done _after_ the sorting phase. */ + for (i = flist->low; i <= flist->high; i++) { + struct file_struct *file = flist->files[i]; - if (flist->files[i]->dirname && - !flist->files[i]->dirname[0]) { - flist->files[i]->dirname = NULL; + if (!file->dirname) + continue; + if (*file->dirname == '/') { + char *s = file->dirname + 1; + while (*s == '/') s++; + memmove(file->dirname, s, strlen(s) + 1); } + + if (!*file->dirname) + file->dirname = NULL; } } } @@ -1516,23 +1565,30 @@ static void output_flist(struct file_list *flist, const char *whose_list) enum fnc_state { s_DIR, s_SLASH, s_BASE, s_TRAILING }; +enum fnc_type { t_PATH, t_ITEM }; /* Compare the names of two file_struct entities, similar to how strcmp() - * would do if it were operating on the joined strings. The only difference - * is that, beginning with protocol_version 29, a directory name will always - * sort immediately prior to its contents (previously "foo." would sort in - * between directory "foo" and "foo/bar"). We do this by assuming that a dir - * has a trailing slash for comparison purposes, but only if we aren't about - * to match a file of the same name (because we need all identically named - * items to match each other). The dirname component can be an empty string, - * but the basename component cannot (and never is in the current codebase). - * The basename component may be NULL, in which case it is sorted to the end - * of the list (as a removed item). */ + * would do if it were operating on the joined strings. + * + * Some differences beginning with protocol_version 29: (1) directory names + * are compared with an assumed trailing slash so that they compare in a + * way that would cause them to sort immediately prior to any content they + * may have; (2) a directory of any name compares after a non-directory of + * any name at the same depth; (3) a directory with name "." compares prior + * to anything else. These changes mean that a directory and a non-dir + * with the same name will not compare as equal (protocol_version >= 29). + * + * The dirname component can be an empty string, but the basename component + * cannot (and never is in the current codebase). The basename component + * may be NULL (for a removed item), in which case it is considered to be + * after any existing item. */ int f_name_cmp(struct file_struct *f1, struct file_struct *f2) { int dif; const uchar *c1, *c2; enum fnc_state state1, state2; + enum fnc_type type1, type2; + enum fnc_type t_path = protocol_version >= 29 ? t_PATH : t_ITEM; if (!f1 || !f1->basename) { if (!f2 || !f2->basename) @@ -1547,64 +1603,97 @@ int f_name_cmp(struct file_struct *f1, struct file_struct *f2) if (c1 == c2) c1 = c2 = NULL; if (!c1) { - state1 = s_BASE; + type1 = S_ISDIR(f1->mode) ? t_path : t_ITEM; c1 = (uchar*)f1->basename; + if (type1 == t_PATH && *c1 == '.' && !c1[1]) { + type1 = t_ITEM; + state1 = s_TRAILING; + c1 = (uchar*)""; + } else + state1 = s_BASE; } else if (!*c1) { + type1 = t_path; state1 = s_SLASH; c1 = (uchar*)"/"; - } else + } else { + type1 = t_path; state1 = s_DIR; + } if (!c2) { - state2 = s_BASE; + type2 = S_ISDIR(f2->mode) ? t_path : t_ITEM; c2 = (uchar*)f2->basename; + if (type2 == t_PATH && *c2 == '.' && !c2[1]) { + type2 = t_ITEM; + state2 = s_TRAILING; + c2 = (uchar*)""; + } else + state2 = s_BASE; } else if (!*c2) { + type2 = t_path; state2 = s_SLASH; c2 = (uchar*)"/"; - } else + } else { + type2 = t_path; state2 = s_DIR; + } + + if (type1 != type2) + return type1 == t_PATH ? 1 : -1; while (1) { - if ((dif = (int)*c1 - (int)*c2) != 0) + if ((dif = (int)*c1++ - (int)*c2++) != 0) break; - if (!*++c1) { + if (!*c1) { switch (state1) { case s_DIR: state1 = s_SLASH; c1 = (uchar*)"/"; break; case s_SLASH: + type1 = S_ISDIR(f1->mode) ? t_path : t_ITEM; state1 = s_BASE; c1 = (uchar*)f1->basename; break; case s_BASE: state1 = s_TRAILING; - if (protocol_version >= 29 && S_ISDIR(f1->mode)) + if (type1 == t_PATH) { c1 = (uchar*)"/"; - break; + break; + } + /* FALL THROUGH */ case s_TRAILING: + type1 = t_ITEM; break; } + if (*c2 && type1 != type2) + return type1 == t_PATH ? 1 : -1; } - if (!*++c2) { + if (!*c2) { switch (state2) { case s_DIR: state2 = s_SLASH; c2 = (uchar*)"/"; break; case s_SLASH: + type2 = S_ISDIR(f2->mode) ? t_path : t_ITEM; state2 = s_BASE; c2 = (uchar*)f2->basename; break; case s_BASE: - if (state1 == s_TRAILING) - return 0; state2 = s_TRAILING; - if (protocol_version >= 29 && S_ISDIR(f2->mode)) + if (type2 == t_PATH) { c2 = (uchar*)"/"; - break; + break; + } + /* FALL THROUGH */ case s_TRAILING: + if (!*c1) + return 0; + type2 = t_ITEM; break; } + if (type1 != type2) + return type1 == t_PATH ? 1 : -1; } } @@ -1720,7 +1809,7 @@ void delete_in_dir(struct file_list *flist, char *fbuf, void delete_missing(struct file_list *full_list, struct file_list *dir_list, const char *dirname) { - int i, j, mode; + int i, mode; if (max_delete && deletion_count >= max_delete) return; @@ -1732,8 +1821,7 @@ void delete_missing(struct file_list *full_list, struct file_list *dir_list, if (!dir_list->files[i]->basename) continue; mode = dir_list->files[i]->mode; - if ((j = flist_find(full_list, dir_list->files[i])) < 0 - || (S_ISDIR(mode) && !S_ISDIR(full_list->files[j]->mode))) { + if (flist_find(full_list, dir_list->files[i]) < 0) { char *f = f_name(dir_list->files[i]); if (make_backups && (backup_dir || !is_backup_file(f)) && !S_ISDIR(mode)) {