X-Git-Url: https://mattmccutchen.net/rsync/rsync.git/blobdiff_plain/375a4556c7a1ffb9a4e7117f33fc42ed2bc4c026..1a9ec1fd1c144e5f578ee3746bc1ea4a3c73a7cc:/generator.c diff --git a/generator.c b/generator.c index 99052220..453c6e07 100644 --- a/generator.c +++ b/generator.c @@ -1,17 +1,21 @@ -/* - Copyright (C) Andrew Tridgell 1996 +/* -*- c-file-style: "linux" -*- + + rsync -- fast file replication program + + Copyright (C) 1996-2000 by Andrew Tridgell Copyright (C) Paul Mackerras 1996 - + Copyright (C) 2002 by Martin Pool + This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. - + This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. - + You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. 
@@ -26,169 +30,303 @@ extern int preserve_links; extern int am_root; extern int preserve_devices; extern int preserve_hard_links; +extern int preserve_perms; +extern int preserve_uid; +extern int preserve_gid; extern int update_only; -extern int whole_file; -extern int block_size; +extern int opt_ignore_existing; extern int csum_length; extern int ignore_times; +extern int size_only; extern int io_timeout; -extern int remote_version; +extern int protocol_version; extern int always_checksum; +extern char *compare_dest; +extern int link_dest; /* choose whether to skip a particular file */ -static int skip_file(char *fname, - struct file_struct *file, STRUCT_STAT *st) +static int skip_file(char *fname, struct file_struct *file, STRUCT_STAT *st) { if (st->st_size != file->length) { return 0; } - - /* if always checksum is set then we use the checksum instead + if (link_dest) { + if (preserve_perms + && (st->st_mode & CHMOD_BITS) != (file->mode & CHMOD_BITS)) + return 0; + + if (am_root && preserve_uid && st->st_uid != file->uid) + return 0; + + if (preserve_gid && file->gid != GID_NONE + && st->st_gid != file->gid) + return 0; + } + + /* if always checksum is set then we use the checksum instead of the file time to determine whether to sync */ if (always_checksum && S_ISREG(st->st_mode)) { char sum[MD4_SUM_LENGTH]; + char fnamecmpdest[MAXPATHLEN]; + + if (compare_dest != NULL) { + if (access(fname, 0) != 0) { + pathjoin(fnamecmpdest, sizeof fnamecmpdest, + compare_dest, fname); + fname = fnamecmpdest; + } + } file_checksum(fname,sum,st->st_size); - return (memcmp(sum,file->sum,csum_length) == 0); + return memcmp(sum, file->u.sum, protocol_version < 21 ? 
2 + : MD4_SUM_LENGTH) == 0; + } + + if (size_only) { + return 1; } if (ignore_times) { return 0; } - return (st->st_mtime == file->modtime); + return (cmp_modtime(st->st_mtime,file->modtime) == 0); } -/* use a larger block size for really big files */ -static int adapt_block_size(struct file_struct *file, int bsize) +/* + * NULL sum_struct means we have no checksums + */ +void write_sum_head(int f, struct sum_struct *sum) { - int ret; + static struct sum_struct null_sum; - if (bsize != BLOCK_SIZE) return bsize; + if (sum == NULL) + sum = &null_sum; - ret = file->length / (10000); /* rough heuristic */ - ret = ret & ~15; /* multiple of 16 */ - if (ret < bsize) ret = bsize; - if (ret > CHUNK_SIZE/2) ret = CHUNK_SIZE/2; - return ret; + write_int(f, sum->count); + write_int(f, sum->blength); + if (protocol_version >= 27) + write_int(f, sum->s2length); + write_int(f, sum->remainder); } - -/* - send a sums struct down a fd - */ -static void send_sums(struct sum_struct *s,int f_out) +/* + * set (initialize) the size entries in the per-file sum_struct + * calulating dynamic block ans checksum sizes. + * + * This is only called from generate_and_send_sums() but is a seperate + * function to encapsulate the logic. + * + * The block size is a rounded square root of file length. + * + * The checksum size is determined according to: + * blocksum_bits = BLOCKSUM_EXP + 2*log2(file_len) - log2(block_len) + * provided by Donovan Baarda which gives a probability of rsync + * algorithm corrupting data and falling back using the whole md4 + * checksums. + * + * This might be made one of several selectable heuristics. 
+ */ + +static void sum_sizes_sqroot(struct sum_struct *sum, uint64 len) { - int i; + extern unsigned int block_size; + unsigned int blength; + int s2length; + uint32 c; + uint64 l; + + if (block_size) { + blength = block_size; + } else if (len <= BLOCK_SIZE * BLOCK_SIZE) { + blength = BLOCK_SIZE; + } else { + l = len; + c = 1; + while (l >>= 2) { + c <<= 1; + } + blength = 0; + do { + blength |= c; + if (len < (uint64)blength * blength) + blength &= ~c; + c >>= 1; + } while (c >= 8); /* round to multiple of 8 */ + blength = MAX(blength, BLOCK_SIZE); + } - /* tell the other guy how many we are going to be doing and how many - bytes there are in the last chunk */ - write_int(f_out,s?s->count:0); - write_int(f_out,s?s->n:block_size); - write_int(f_out,s?s->remainder:0); - if (s) - for (i=0;i<s->count;i++) { - write_int(f_out,s->sums[i].sum1); - write_buf(f_out,s->sums[i].sum2,csum_length); + if (protocol_version < 27) { + s2length = csum_length; + } else if (csum_length == SUM_LENGTH) { + s2length = SUM_LENGTH; + } else { + int b = BLOCKSUM_BIAS; + l = len; + while (l >>= 1) { + b += 2; } + c = blength; + while (c >>= 1 && b) { + b--; + } + s2length = (b + 1 - 32 + 7) / 8; /* add a bit, + * subtract rollsum, + * round up + * --optimize in compiler-- + */ + s2length = MAX(s2length, csum_length); + s2length = MIN(s2length, SUM_LENGTH); + } -} + sum->flength = len; + sum->blength = blength; + sum->s2length = s2length; + sum->count = (len + (blength - 1)) / blength; + sum->remainder = (len % blength); -/* - generate a stream of signatures/checksums that describe a buffer + if (sum->count && verbose > 2) { + rprintf(FINFO, "count=%.0f rem=%u blength=%u s2length=%d flength=%.0f\n", + (double)sum->count, sum->remainder, sum->blength, + sum->s2length, (double)sum->flength); + } +} - generate approximately one checksum every n bytes - */ -static struct sum_struct *generate_sums(struct map_struct *buf,OFF_T len,int n) +/** + * Perhaps we want to just send an empty checksum set for
this file, + * which will force the whole thing to be literally transferred. + * + * When do we do this? If the user's explicitly said they + * want the whole thing, or if { they haven't explicitly + * requested a delta, and it's local but not batch mode.} + * + * Whew. */ +static BOOL disable_deltas_p(void) { - int i; - struct sum_struct *s; - int count; - int block_len = n; - int remainder = (len%block_len); - OFF_T offset = 0; - - count = (len+(block_len-1))/block_len; - - s = (struct sum_struct *)malloc(sizeof(*s)); - if (!s) out_of_memory("generate_sums"); - - s->count = count; - s->remainder = remainder; - s->n = n; - s->flength = len; + extern int whole_file; + extern int local_server; + extern int write_batch; + + if (whole_file > 0) + return True; + if (whole_file == 0 || write_batch) + return False; + return local_server; +} - if (count==0) { - s->sums = NULL; - return s; - } - if (verbose > 3) - rprintf(FINFO,"count=%d rem=%d n=%d flength=%d\n", - s->count,s->remainder,s->n,(int)s->flength); +/* + * Generate and send a stream of signatures/checksums that describe a buffer + * + * Generate approximately one checksum every block_len bytes. 
+ */ +static void generate_and_send_sums(struct map_struct *buf, size_t len, int f_out) +{ + size_t i; + struct sum_struct sum; + OFF_T offset = 0; - s->sums = (struct sum_buf *)malloc(sizeof(s->sums[0])*s->count); - if (!s->sums) out_of_memory("generate_sums"); - - for (i=0;isums[i].sum1 = get_checksum1(map,n1); - get_checksum2(map,n1,s->sums[i].sum2); + write_sum_head(f_out, &sum); - s->sums[i].offset = offset; - s->sums[i].len = n1; - s->sums[i].i = i; + for (i = 0; i < sum.count; i++) { + unsigned int n1 = MIN(len, sum.blength); + char *map = map_ptr(buf, offset, n1); + uint32 sum1 = get_checksum1(map, n1); + char sum2[SUM_LENGTH]; - if (verbose > 3) - rprintf(FINFO,"chunk[%d] offset=%d len=%d sum1=%08x\n", - i,(int)s->sums[i].offset,s->sums[i].len,s->sums[i].sum1); + get_checksum2(map, n1, sum2); + if (verbose > 3) { + rprintf(FINFO, + "chunk[%.0f] offset=%.0f len=%u sum1=%08lx\n", + (double)i, (double)offset, n1, + (unsigned long)sum1); + } + write_int(f_out, sum1); + write_buf(f_out, sum2, sum.s2length); len -= n1; offset += n1; } - - return s; } -void recv_generator(char *fname,struct file_list *flist,int i,int f_out) -{ + +/** + * Acts on file number @p i from @p flist, whose name is @p fname. + * + * First fixes up permissions, then generates checksums for the file. + * + * @note This comment was added later by mbp who was trying to work it + * out. It might be wrong. 
+ **/ +void recv_generator(char *fname, struct file_struct *file, int i, int f_out) +{ int fd; STRUCT_STAT st; - struct map_struct *buf; - struct sum_struct *s; + struct map_struct *mapbuf; int statret; - struct file_struct *file = flist->files[i]; char *fnamecmp; char fnamecmpbuf[MAXPATHLEN]; extern char *compare_dest; + extern int list_only; + extern int only_existing; + extern int orig_umask; + + if (list_only) + return; if (verbose > 2) rprintf(FINFO,"recv_generator(%s,%d)\n",fname,i); statret = link_stat(fname,&st); + if (only_existing && statret == -1 && errno == ENOENT) { + /* we only want to update existing files */ + if (verbose > 1) rprintf(FINFO, "not creating new file \"%s\"\n",fname); + return; + } + + if (statret == 0 && + !preserve_perms && + (S_ISDIR(st.st_mode) == S_ISDIR(file->mode))) { + /* if the file exists already and we aren't perserving + * permissions then act as though the remote end sent + * us the file permissions we already have */ + file->mode = (file->mode & ~CHMOD_BITS) + | (st.st_mode & CHMOD_BITS); + } + if (S_ISDIR(file->mode)) { - if (dry_run) return; + /* The file to be received is a directory, so we need + * to prepare appropriately. If there is already a + * file of that name and it is *not* a directory, then + * we need to delete it. If it doesn't exist, then + * recursively create it. */ + + if (dry_run) return; /* XXXX -- might cause inaccuracies?? 
-- mbp */ if (statret == 0 && !S_ISDIR(st.st_mode)) { - if (do_unlink(fname) != 0) { - rprintf(FERROR,"unlink %s : %s\n",fname,strerror(errno)); + if (robust_unlink(fname) != 0) { + rprintf(FERROR, + "recv_generator: unlink %s to make room for directory: %s\n", + full_fname(fname), strerror(errno)); return; } statret = -1; } if (statret != 0 && do_mkdir(fname,file->mode) != 0 && errno != EEXIST) { - if (!(relative_paths && errno==ENOENT && - create_directory_path(fname)==0 && + if (!(relative_paths && errno==ENOENT && + create_directory_path(fname, orig_umask)==0 && do_mkdir(fname,file->mode)==0)) { - rprintf(FERROR,"mkdir %s : %s (2)\n", - fname,strerror(errno)); + rprintf(FERROR, "recv_generator: mkdir %s failed: %s\n", + full_fname(fname), strerror(errno)); } } - if (set_perms(fname,file,NULL,0) && verbose) + /* f_out is set to -1 when doing final directory + permission and modification time repair */ + if (set_perms(fname,file,NULL,0) && verbose && (f_out != -1)) rprintf(FINFO,"%s/\n",fname); return; } @@ -199,10 +337,10 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) int l; extern int safe_symlinks; - if (safe_symlinks && unsafe_symlink(file->link, fname)) { + if (safe_symlinks && unsafe_symlink(file->u.link, fname)) { if (verbose) { - rprintf(FINFO,"ignoring unsafe symlink %s -> %s\n", - fname,file->link); + rprintf(FINFO, "ignoring unsafe symlink %s -> \"%s\"\n", + full_fname(fname), file->u.link); } return; } @@ -210,21 +348,26 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) l = readlink(fname,lnk,MAXPATHLEN-1); if (l > 0) { lnk[l] = 0; - if (strcmp(lnk,file->link) == 0) { + /* A link already pointing to the + * right place -- no further action + * required. */ + if (strcmp(lnk,file->u.link) == 0) { set_perms(fname,file,&st,1); return; } } + /* Not a symlink, so delete whatever's + * already there and put a new symlink + * in place. 
*/ + delete_file(fname); } - delete_file(fname); - if (do_symlink(file->link,fname) != 0) { - rprintf(FERROR,"link %s -> %s : %s\n", - fname,file->link,strerror(errno)); + if (do_symlink(file->u.link,fname) != 0) { + rprintf(FERROR, "symlink %s -> \"%s\" failed: %s\n", + full_fname(fname), file->u.link, strerror(errno)); } else { set_perms(fname,file,NULL,0); if (verbose) { - rprintf(FINFO,"%s -> %s\n", - fname,file->link); + rprintf(FINFO,"%s -> %s\n", fname,file->u.link); } } #endif @@ -233,15 +376,16 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) #ifdef HAVE_MKNOD if (am_root && preserve_devices && IS_DEVICE(file->mode)) { - if (statret != 0 || + if (statret != 0 || st.st_mode != file->mode || - st.st_rdev != file->rdev) { + st.st_rdev != file->u.rdev) { delete_file(fname); if (verbose > 2) rprintf(FINFO,"mknod(%s,0%o,0x%x)\n", - fname,(int)file->mode,(int)file->rdev); - if (do_mknod(fname,file->mode,file->rdev) != 0) { - rprintf(FERROR,"mknod %s : %s\n",fname,strerror(errno)); + fname,(int)file->mode,(int)file->u.rdev); + if (do_mknod(fname,file->mode,file->u.rdev) != 0) { + rprintf(FERROR, "mknod %s failed: %s\n", + full_fname(fname), strerror(errno)); } else { set_perms(fname,file,NULL,0); if (verbose) @@ -254,39 +398,51 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) } #endif - if (preserve_hard_links && check_hard_link(file)) { - if (verbose > 1) - rprintf(FINFO,"%s is a hard link\n",f_name(file)); + if (preserve_hard_links && hard_link_check(file, HL_CHECK_MASTER)) return; - } if (!S_ISREG(file->mode)) { - rprintf(FINFO,"skipping non-regular file %s\n",fname); + rprintf(FINFO, "skipping non-regular file \"%s\"\n",fname); return; } fnamecmp = fname; - if ((statret == -1) && (compare_dest != NULL)) { + if (statret == -1 && compare_dest != NULL) { /* try the file at compare_dest instead */ int saveerrno = errno; - slprintf(fnamecmpbuf,MAXPATHLEN-1,"%s/%s",compare_dest,fname); + pathjoin(fnamecmpbuf, 
sizeof fnamecmpbuf, compare_dest, fname); statret = link_stat(fnamecmpbuf,&st); if (!S_ISREG(st.st_mode)) statret = -1; if (statret == -1) errno = saveerrno; +#if HAVE_LINK + else if (link_dest && !dry_run) { + if (do_link(fnamecmpbuf, fname) != 0) { + if (verbose > 0) { + rprintf(FINFO,"link %s => %s : %s\n", + fnamecmpbuf, fname, + strerror(errno)); + } + } + fnamecmp = fnamecmpbuf; + } +#endif else fnamecmp = fnamecmpbuf; } if (statret == -1) { + if (preserve_hard_links && hard_link_check(file, HL_SKIP)) + return; if (errno == ENOENT) { write_int(f_out,i); - if (!dry_run) send_sums(NULL,f_out); - } else { - if (verbose > 1) - rprintf(FERROR,"recv_generator failed to open %s\n",fname); + if (!dry_run) write_sum_head(f_out, NULL); + } else if (verbose > 1) { + rprintf(FERROR, + "recv_generator: failed to open %s: %s\n", + full_fname(fname), strerror(errno)); } return; } @@ -297,19 +453,28 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) } /* now pretend the file didn't exist */ + if (preserve_hard_links && hard_link_check(file, HL_SKIP)) + return; write_int(f_out,i); - if (!dry_run) send_sums(NULL,f_out); + if (!dry_run) write_sum_head(f_out, NULL); + return; + } + + if (opt_ignore_existing && fnamecmp == fname) { + if (verbose > 1) + rprintf(FINFO,"%s exists\n",fname); return; } - if (update_only && st.st_mtime > file->modtime && fnamecmp == fname) { + if (update_only && cmp_modtime(st.st_mtime,file->modtime)>0 && fnamecmp == fname) { if (verbose > 1) rprintf(FINFO,"%s is newer\n",fname); return; } if (skip_file(fname, file, &st)) { - set_perms(fname,file,&st,1); + if (fnamecmp == fname) + set_perms(fname,file,&st,1); return; } @@ -318,71 +483,89 @@ void recv_generator(char *fname,struct file_list *flist,int i,int f_out) return; } - if (whole_file) { + if (disable_deltas_p()) { write_int(f_out,i); - send_sums(NULL,f_out); + write_sum_head(f_out, NULL); return; } - /* open the file */ - fd = open(fnamecmp,O_RDONLY); + /* open the file */ 
+ fd = do_open(fnamecmp, O_RDONLY, 0); if (fd == -1) { - rprintf(FERROR,"failed to open %s : %s\n",fnamecmp,strerror(errno)); - rprintf(FERROR,"skipping %s\n",fname); + rprintf(FERROR, "failed to open %s, continuing: %s\n", + full_fname(fnamecmp), strerror(errno)); + /* pretend the file didn't exist */ + if (preserve_hard_links && hard_link_check(file, HL_SKIP)) + return; + write_int(f_out,i); + write_sum_head(f_out, NULL); return; } - if (st.st_size > 0) { - buf = map_file(fd,st.st_size); - } else { - buf = NULL; - } - - if (verbose > 3) - rprintf(FINFO,"gen mapped %s of size %d\n",fnamecmp,(int)st.st_size); + if (st.st_size > 0) + mapbuf = map_file(fd,st.st_size); + else + mapbuf = NULL; - s = generate_sums(buf,st.st_size,adapt_block_size(file, block_size)); + if (verbose > 3) { + rprintf(FINFO,"gen mapped %s of size %.0f\n", fnamecmp, + (double)st.st_size); + } if (verbose > 2) - rprintf(FINFO,"sending sums for %d\n",i); + rprintf(FINFO, "generating and sending sums for %d\n", i); write_int(f_out,i); - send_sums(s,f_out); + generate_and_send_sums(mapbuf, st.st_size, f_out); close(fd); - if (buf) unmap_file(buf); - - free_sums(s); + if (mapbuf) unmap_file(mapbuf); } - -void generate_files(int f,struct file_list *flist,char *local_name,int f_recv) +void generate_files(int f, struct file_list *flist, char *local_name) { int i; int phase=0; + char fbuf[MAXPATHLEN]; - if (verbose > 2) - rprintf(FINFO,"generator starting pid=%d count=%d\n", - (int)getpid(),flist->count); + if (verbose > 2) { + rprintf(FINFO, "generator starting pid=%ld count=%d\n", + (long)getpid(), flist->count); + } + + if (verbose >= 2) { + rprintf(FINFO, + disable_deltas_p() + ? "delta-transmission disabled for local transfer or --whole-file\n" + : "delta transmission enabled\n"); + } + + /* we expect to just sit around now, so don't exit on a + timeout. 
If we really get a timeout then the other process should + exit */ + io_timeout = 0; for (i = 0; i < flist->count; i++) { struct file_struct *file = flist->files[i]; - mode_t saved_mode = file->mode; - if (!file->basename) continue; + struct file_struct copy; + if (!file->basename) + continue; /* we need to ensure that any directories we create have writeable permissions initially so that we can create the files within them. This is then fixed after the files are transferred */ - if (!am_root && S_ISDIR(file->mode)) { - file->mode |= S_IWUSR; /* user write */ + if (!am_root && S_ISDIR(file->mode) && !(file->mode & S_IWUSR)) { + copy = *file; + /* XXX: Could this be causing a problem on SCO? Perhaps their + * handling of permissions is strange? */ + copy.mode |= S_IWUSR; /* user write */ + file = © } - recv_generator(local_name?local_name:f_name(file), - flist,i,f); - - file->mode = saved_mode; + recv_generator(local_name ? local_name : f_name_to(file, fbuf), + file, i, f); } phase++; @@ -394,24 +577,32 @@ void generate_files(int f,struct file_list *flist,char *local_name,int f_recv) write_int(f,-1); - /* we expect to just sit around now, so don't exit on a - timeout. If we really get a timeout then the other process should - exit */ - io_timeout = 0; + /* files can cycle through the system more than once + * to catch initial checksum errors */ + while ((i = get_redo_num()) != -1) { + struct file_struct *file = flist->files[i]; + recv_generator(local_name ? 
local_name : f_name_to(file, fbuf), + file, i, f); + } - if (remote_version >= 13) { - /* in newer versions of the protocol the files can cycle through - the system more than once to catch initial checksum errors */ - for (i=read_int(f_recv); i != -1; i=read_int(f_recv)) { - struct file_struct *file = flist->files[i]; - recv_generator(local_name?local_name:f_name(file), - flist,i,f); - } + phase++; + if (verbose > 2) + rprintf(FINFO,"generate_files phase=%d\n",phase); - phase++; - if (verbose > 2) - rprintf(FINFO,"generate_files phase=%d\n",phase); + write_int(f,-1); + + if (preserve_hard_links) + do_hard_links(); - write_int(f,-1); + /* now we need to fix any directory permissions that were + * modified during the transfer */ + for (i = 0; i < flist->count; i++) { + struct file_struct *file = flist->files[i]; + if (!file->basename || !S_ISDIR(file->mode)) continue; + recv_generator(local_name ? local_name : f_name(file), + file, i, -1); } + + if (verbose > 2) + rprintf(FINFO,"generate_files finished\n"); }