X-Git-Url: https://mattmccutchen.net/rsync/rsync-patches.git/blobdiff_plain/7bfcb297c3723a52c1a5ccc5662a9b856b004c1f..f1f4dbd128c05bca1b3a305f775aca7034f188d7:/detect-renamed.diff diff --git a/detect-renamed.diff b/detect-renamed.diff index 954dfad..4f927d9 100644 --- a/detect-renamed.diff +++ b/detect-renamed.diff @@ -34,23 +34,22 @@ TODO: --- old/compat.c +++ new/compat.c -@@ -49,6 +49,7 @@ extern int preserve_xattrs; - extern int need_messages_from_generator; - extern int delete_mode, delete_before, delete_during, delete_after; - extern int delete_excluded; +@@ -41,6 +41,7 @@ extern int checksum_seed; + extern int basis_dir_cnt; + extern int prune_empty_dirs; + extern int protocol_version; +extern int detect_renamed; - extern int make_backups; - extern char *shell_cmd; /* contains VER.SUB string if client is a pre-release */ - extern char *backup_dir, *backup_suffix; -@@ -221,7 +222,7 @@ void setup_protocol(int f_out,int f_in) - } else if (protocol_version >= 30) { - if (recurse && allow_inc_recurse - && !delete_before && !delete_after && !delay_updates -- && !use_qsort && !prune_empty_dirs) -+ && !use_qsort && !prune_empty_dirs && !detect_renamed) - inc_recurse = 1; - need_messages_from_generator = 1; - } + extern int protect_args; + extern int preserve_uid; + extern int preserve_gid; +@@ -108,6 +109,7 @@ void set_allow_inc_recurse(void) + allow_inc_recurse = 0; + else if (!am_sender + && (delete_before || delete_after ++ || detect_renamed + || delay_updates || prune_empty_dirs)) + allow_inc_recurse = 0; + else if (am_server && !local_server --- old/flist.c +++ new/flist.c @@ -61,6 +61,7 @@ extern int non_perishable_cnt; @@ -70,7 +69,7 @@ TODO: static char empty_sum[MAX_DIGEST_LEN]; static int flist_count_offset; /* for --delete --progress */ static int dir_count = 0; -@@ -281,6 +284,45 @@ static int is_excluded(char *fname, int +@@ -252,6 +255,45 @@ static int is_excluded(char *fname, int return 0; } @@ -116,9 +115,9 @@ TODO: static void send_directory(int f, struct file_list *flist, char *fbuf, int len, int flags); -@@ -1935,6 +1977,25 @@ struct file_list *send_file_list(int f, - if (verbose > 2) - rprintf(FINFO, "send_file_list done\n"); +@@ -2154,6 +2196,25 @@ struct file_list *recv_file_list(int f) + + clean_flist(flist, relative_paths); + if (detect_renamed) { + int j = flist->used; @@ -139,9 +138,9 @@ TODO: + the_fattr_list.high = j; + } + - if (inc_recurse) { - add_dirs_to_tree(-1, flist, dir_count); - flist_done_allocating(flist); + if (protocol_version < 30) { + /* Recv the io_error flag */ + if (ignore_errors) --- old/generator.c +++ new/generator.c @@ -79,6 +79,7 @@ extern char *basis_dir[]; @@ -178,7 +177,7 @@ TODO: #define DEL_RECURSE (1<<1) /* recurse */ #define DEL_DIR_IS_EMPTY (1<<2) /* internal delete_FUNCTIONS use only */ -@@ -136,11 +140,120 @@ static int is_backup_file(char *fn) +@@ -136,11 +140,121 @@ static int is_backup_file(char *fn) return k > 0 && strcmp(fn+k, backup_suffix) == 0; } @@ -264,7 +263,7 @@ TODO: + STRUCT_STAT st; + int ndx; + -+ if ((ndx = fattr_find(file, fname)) < 0) ++ if (!partial_dir || (ndx = fattr_find(file, fname)) < 0) + return; + + fp = the_fattr_list.files[ndx]; @@ -272,21 +271,22 @@ TODO: + /* We don't provide an alternate-basis file if there is a basis file. */ + if (link_stat(fn, &st, 0) == 0) + return; -+ if ((partialptr = partial_dir_fname(fn)) == NULL -+ || !handle_partial_dir(partialptr, PDIR_CREATE)) -+ return; + -+ /* We only use the file if we can hard-link it into our tmp dir. */ -+ if (link(fname, partialptr) == 0) { -+ if (verbose > 2) { -+ rprintf(FINFO, "found renamed: %s => %s\n", -+ fname, partialptr); ++ if (!dry_run) { ++ if ((partialptr = partial_dir_fname(fn)) == NULL ++ || !handle_partial_dir(partialptr, PDIR_CREATE)) ++ return; ++ /* We only use the file if we can hard-link it into our tmp dir. */ ++ if (link(fname, partialptr) != 0) { ++ if (errno != EEXIST) ++ handle_partial_dir(partialptr, PDIR_DELETE); ++ return; + } -+ return; + } + -+ if (errno != EEXIST) -+ handle_partial_dir(partialptr, PDIR_DELETE); ++ /* I think this falls into the -vv category with "%s is uptodate", etc. */ ++ if (verbose > 1) ++ rprintf(FINFO, "found renamed: %s => %s\n", fname, fn); +} + /* Delete a file or directory. If DEL_RECURSE is set in the flags, this will @@ -299,7 +299,7 @@ TODO: */ static enum delret delete_item(char *fbuf, int mode, char *replace, int flags) { -@@ -162,6 +275,8 @@ static enum delret delete_item(char *fbu +@@ -162,6 +276,8 @@ static enum delret delete_item(char *fbu goto check_ret; /* OK: try to delete the directory. */ } @@ -308,7 +308,7 @@ TODO: if (!replace && max_delete >= 0 && ++deletion_count > max_delete) return DR_AT_LIMIT; -@@ -208,6 +323,8 @@ static enum delret delete_item(char *fbu +@@ -208,6 +324,8 @@ static enum delret delete_item(char *fbu * its contents, otherwise just checks for content. Returns DR_SUCCESS or * DR_NOT_EMPTY. Note that fname must point to a MAXPATHLEN buffer! (The * buffer is used for recursion, but returned unchanged.) @@ -317,7 +317,7 @@ TODO: */ static enum delret delete_dir_contents(char *fname, int flags) { -@@ -227,7 +344,9 @@ static enum delret delete_dir_contents(c +@@ -227,7 +345,9 @@ static enum delret delete_dir_contents(c save_filters = push_local_filters(fname, dlen); non_perishable_cnt = 0; @@ -327,7 +327,7 @@ TODO: ret = non_perishable_cnt ? DR_NOT_EMPTY : DR_SUCCESS; if (!dirlist->used) -@@ -264,6 +383,8 @@ static enum delret delete_dir_contents(c +@@ -264,6 +384,8 @@ static enum delret delete_dir_contents(c if (S_ISDIR(fp->mode) && delete_dir_contents(fname, flags | DEL_RECURSE) != DR_SUCCESS) ret = DR_NOT_EMPTY; @@ -336,7 +336,7 @@ TODO: if (delete_item(fname, fp->mode, NULL, flags) != DR_SUCCESS) ret = DR_NOT_EMPTY; } -@@ -416,12 +537,17 @@ static void do_delayed_deletions(char *d +@@ -416,13 +538,18 @@ static void do_delayed_deletions(char *d * all the --delete-WHEN options. Note that the fbuf pointer must point to a * MAXPATHLEN buffer with the name of the directory in it (the functions we * call will append names onto the end, but the old dir value will be restored @@ -352,12 +352,14 @@ TODO: static int already_warned = 0; struct file_list *dirlist; - char delbuf[MAXPATHLEN]; +- int dlen, i; + char *p, delbuf[MAXPATHLEN]; + unsigned remainder; - int dlen, i; ++ int dlen, i, restore_dot = 0; if (!fbuf) { -@@ -432,21 +558,28 @@ static void delete_in_dir(char *fbuf, st + change_local_filter_dir(NULL, 0, 0); +@@ -432,21 +559,28 @@ static void delete_in_dir(char *fbuf, st if (verbose > 2) rprintf(FINFO, "delete_in_dir(%s)\n", fbuf); @@ -391,19 +393,22 @@ TODO: if (one_file_system) { if (file->flags & FLAG_TOP_DIR) filesystem_dev = *fs_dev; -@@ -456,6 +589,11 @@ static void delete_in_dir(char *fbuf, st +@@ -456,6 +590,14 @@ static void delete_in_dir(char *fbuf, st dirlist = get_dirlist(fbuf, dlen, 0); + p = fbuf + dlen; -+ if (dlen != 1 || *fbuf != '/') ++ if (dlen == 1 && *fbuf == '.') { ++ restore_dot = 1; ++ p = fbuf; ++ } else if (dlen != 1 || *fbuf != '/') + *p++ = '/'; + remainder = MAXPATHLEN - (p - fbuf); + /* If an item in dirlist is not found in flist, delete it * from the filesystem. */ for (i = dirlist->used; i--; ) { -@@ -468,16 +606,23 @@ static void delete_in_dir(char *fbuf, st +@@ -468,16 +610,25 @@ static void delete_in_dir(char *fbuf, st f_name(fp, NULL)); continue; } @@ -425,12 +430,14 @@ TODO: + unexplored_dirs++; } ++ if (restore_dot) ++ fbuf[0] = '.'; + fbuf[dlen] = '\0'; + flist_free(dirlist); } -@@ -507,9 +652,9 @@ static void do_delete_pass(void) +@@ -507,9 +658,9 @@ static void do_delete_pass(void) || !S_ISDIR(st.st_mode)) continue; @@ -442,21 +449,21 @@ TODO: if (do_progress && !am_server) rprintf(FINFO, " \r"); -@@ -1072,6 +1217,7 @@ static int try_dests_non(struct file_str - return j; +@@ -1106,6 +1257,7 @@ static void list_file_entry(struct file_ + } } +static struct bitbag *delayed_bits = NULL; static int phase = 0; static int dflt_perms; -@@ -1308,8 +1454,12 @@ static void recv_generator(char *fname, +@@ -1350,8 +1502,12 @@ static void recv_generator(char *fname, } } else if (delete_during && f_out != -1 && !phase && dry_run < 2 -- && (file->flags & FLAG_XFER_DIR)) +- && (file->flags & FLAG_CONTENT_DIR)) - delete_in_dir(fname, file, &real_sx.st.st_dev); -+ && (file->flags & FLAG_XFER_DIR)) { ++ && (file->flags & FLAG_CONTENT_DIR)) { + if (detect_renamed && real_ret != 0) + unexplored_dirs++; + delete_in_dir(fname, file, &real_sx.st.st_dev, @@ -465,7 +472,7 @@ TODO: goto cleanup; } -@@ -1587,8 +1737,14 @@ static void recv_generator(char *fname, +@@ -1629,8 +1785,14 @@ static void recv_generator(char *fname, goto cleanup; } #endif @@ -481,7 +488,7 @@ TODO: rsyserr(FERROR, stat_errno, "recv_generator: failed to stat %s", full_fname(fname)); goto cleanup; -@@ -1910,6 +2066,12 @@ void generate_files(int f_out, const cha +@@ -1966,6 +2128,12 @@ void generate_files(int f_out, const cha if (verbose > 2) rprintf(FINFO, "generator starting pid=%ld\n", (long)getpid()); @@ -494,7 +501,7 @@ TODO: if (delete_before && !solo_file && cur_flist->used > 0) do_delete_pass(); if (delete_during == 2) { -@@ -1920,7 +2082,7 @@ void generate_files(int f_out, const cha +@@ -1976,7 +2144,7 @@ void generate_files(int f_out, const cha } do_progress = 0; @@ -503,7 +510,7 @@ TODO: whole_file = 0; if (verbose >= 2) { rprintf(FINFO, "delta-transmission %s\n", -@@ -1958,7 +2120,7 @@ void generate_files(int f_out, const cha +@@ -2014,7 +2182,7 @@ void generate_files(int f_out, const cha dirdev = MAKEDEV(DEV_MAJOR(devp), DEV_MINOR(devp)); } else dirdev = MAKEDEV(0, 0); @@ -512,7 +519,7 @@ TODO: } } } -@@ -2003,7 +2165,21 @@ void generate_files(int f_out, const cha +@@ -2059,7 +2227,21 @@ void generate_files(int f_out, const cha } while ((cur_flist = cur_flist->next) != NULL); if (delete_during) @@ -537,7 +544,7 @@ TODO: rprintf(FINFO, "generate_files phase=%d\n", phase); --- old/options.c +++ new/options.c -@@ -79,6 +79,7 @@ int am_generator = 0; +@@ -80,6 +80,7 @@ int am_generator = 0; int am_starting_up = 1; int relative_paths = -1; int implied_dirs = 1; @@ -545,7 +552,7 @@ TODO: int numeric_ids = 0; int allow_8bit_chars = 0; int force_delete = 0; -@@ -382,6 +383,7 @@ void usage(enum logcode F) +@@ -383,6 +384,7 @@ void usage(enum logcode F) rprintf(F," --modify-window=NUM compare mod-times with reduced accuracy\n"); rprintf(F," -T, --temp-dir=DIR create temporary files in directory DIR\n"); rprintf(F," -y, --fuzzy find similar file for basis if no dest file\n"); @@ -561,7 +568,7 @@ TODO: {"fuzzy", 'y', POPT_ARG_NONE, &fuzzy_basis, 0, 0, 0 }, {"compress", 'z', POPT_ARG_NONE, 0, 'z', 0, 0 }, {"no-compress", 0, POPT_ARG_VAL, &do_compression, 0, 0, 0 }, -@@ -1531,7 +1534,7 @@ int parse_arguments(int *argc_p, const c +@@ -1532,7 +1535,7 @@ int parse_arguments(int *argc_p, const c inplace = 1; } @@ -570,7 +577,7 @@ TODO: partial_dir = tmp_partialdir; if (inplace) { -@@ -1540,6 +1543,7 @@ int parse_arguments(int *argc_p, const c +@@ -1541,6 +1544,7 @@ int parse_arguments(int *argc_p, const c snprintf(err_buf, sizeof err_buf, "--%s cannot be used with --%s\n", append_mode ? "append" : "inplace", @@ -578,7 +585,7 @@ TODO: delay_updates ? "delay-updates" : "partial-dir"); return 0; } -@@ -1887,6 +1891,8 @@ void server_options(char **args, int *ar +@@ -1885,6 +1889,8 @@ void server_options(char **args, int *ar args[ac++] = "--super"; if (size_only) args[ac++] = "--size-only"; @@ -589,7 +596,7 @@ TODO: if (asprintf(&arg, "--skip-compress=%s", skip_compress) < 0) --- old/rsync.yo +++ new/rsync.yo -@@ -389,6 +389,7 @@ to the detailed description below for a +@@ -384,6 +384,7 @@ to the detailed description below for a --modify-window=NUM compare mod-times with reduced accuracy -T, --temp-dir=DIR create temporary files in directory DIR -y, --fuzzy find similar file for basis if no dest file @@ -597,13 +604,19 @@ TODO: --compare-dest=DIR also compare received files relative to DIR --copy-dest=DIR ... and include copies of unchanged files --link-dest=DIR hardlink to files in DIR when unchanged -@@ -1394,6 +1395,15 @@ Note that the use of the bf(--delete) op +@@ -1430,6 +1431,21 @@ Note that the use of the bf(--delete) op fuzzy-match files, so either use bf(--delete-after) or specify some filename exclusions if you need to prevent this. -+dit(bf(--detect-renamed)) This option tells rsync to scan the receiving -+side for files that have been renamed, and to use any that are found as -+alternate basis files to help speed up the transfer. ++dit(bf(--detect-renamed)) With this option, for each new source file ++(call it em(src/S)), rsync looks for a file em(dest/D) anywhere in the ++destination that passes the quick check with em(src/S). If such a em(dest/D) ++is found, rsync uses it as an alternate basis for transferring em(S). The ++idea is that if em(src/S) was renamed from em(src/D) (as opposed to em(src/S) ++passing the quick check with em(dest/D) by coincidence), the delta-transfer ++algorithm will find that all the data matches between em(src/S) and em(dest/D), ++and the transfer will be really fast. ++ +By default, alternate-basis files are hard-linked into a directory named +".~tmp~" in each file's destination directory, but if you've specified +the bf(--partial-dir) option, that directory will be used instead. These @@ -615,7 +628,7 @@ TODO: files against doing transfers (if the files are missing in the destination --- old/util.c +++ new/util.c -@@ -1029,6 +1029,32 @@ int handle_partial_dir(const char *fname +@@ -1030,6 +1030,32 @@ int handle_partial_dir(const char *fname return 1; }