Make some RERR_* choices better, and another noop_io_until_death() tweak.
[rsync/rsync.git] / io.c
diff --git a/io.c b/io.c
index e23c69a..4a6b95f 100644 (file)
--- a/io.c
+++ b/io.c
@@ -4,11 +4,11 @@
  * Copyright (C) 1996-2001 Andrew Tridgell
  * Copyright (C) 1996 Paul Mackerras
  * Copyright (C) 2001, 2002 Martin Pool <mbp@samba.org>
- * Copyright (C) 2003, 2004, 2005, 2006 Wayne Davison
+ * Copyright (C) 2003-2009 Wayne Davison
  *
  * This program is free software; you can redistribute it and/or modify
  * it under the terms of the GNU General Public License as published by
- * the Free Software Foundation; either version 2 of the License, or
+ * the Free Software Foundation; either version 3 of the License, or
  * (at your option) any later version.
  *
  * This program is distributed in the hope that it will be useful,
@@ -17,8 +17,7 @@
  * GNU General Public License for more details.
  *
  * You should have received a copy of the GNU General Public License along
- * with this program; if not, write to the Free Software Foundation, Inc.,
- * 51 Franklin Street - Fifth Floor, Boston, MA 02110-1301, USA.
+ * with this program; if not, visit the http://fsf.org website.
  */
 
 /* Rsync provides its own multiplexing system, which is used to send
@@ -29,6 +28,8 @@
  * io_start_multiplex_out() and io_start_multiplex_in(). */
 
 #include "rsync.h"
+#include "ifuncs.h"
+#include "inums.h"
 
 /** If no timeout is specified then use a 60 second select timeout */
 #define SELECT_TIMEOUT 60
 extern int bwlimit;
 extern size_t bwlimit_writemax;
 extern int io_timeout;
-extern int allowed_lull;
 extern int am_server;
 extern int am_daemon;
 extern int am_sender;
 extern int am_generator;
-extern int incremental;
+extern int msgs2stderr;
+extern int inc_recurse;
 extern int io_error;
 extern int eol_nulls;
 extern int flist_eof;
+extern int file_total;
+extern int file_old_total;
+extern int list_only;
 extern int read_batch;
-extern int csum_length;
+extern int protect_args;
 extern int checksum_seed;
 extern int protocol_version;
 extern int remove_source_files;
 extern int preserve_hard_links;
-extern char *filesfrom_host;
+extern BOOL extra_flist_sending_enabled;
 extern struct stats stats;
-extern struct file_list *cur_flist, *first_flist;
+extern struct file_list *cur_flist;
+#ifdef ICONV_OPTION
+extern int filesfrom_convert;
+extern iconv_t ic_send, ic_recv;
+#endif
 
-const char phase_unknown[] = "unknown";
+int csum_length = SHORT_SUM_LENGTH; /* initial value */
+int allowed_lull = 0;
 int ignore_timeout = 0;
 int batch_fd = -1;
-int done_cnt = 0;
+int msgdone_cnt = 0;
+int forward_flist_data = 0;
 
 /* Ignore an EOF error if non-zero. See whine_about_eof(). */
 int kluge_around_eof = 0;
 
-int msg_fd_in = -1;
-int msg_fd_out = -1;
 int sock_f_in = -1;
 int sock_f_out = -1;
 
-static int iobuf_f_in = -1;
-static char *iobuf_in;
-static size_t iobuf_in_siz;
-static size_t iobuf_in_ndx;
-static size_t iobuf_in_remaining;
-
-static int iobuf_f_out = -1;
-static char *iobuf_out;
-static int iobuf_out_cnt;
+int64 total_data_read = 0;
+int64 total_data_written = 0;
 
-int flist_forward_from = -1;
+static struct {
+       xbuf in, out, msg;
+       int in_fd;
+       int out_fd; /* Both "out" and "msg" go to this fd. */
+       BOOL in_multiplexed;
+       unsigned out_empty_len;
+       size_t raw_data_header_pos;      /* in the out xbuf */
+       size_t raw_flushing_ends_before; /* in the out xbuf */
+       size_t raw_input_ends_before;    /* in the in xbuf */
+} iobuf = { .in_fd = -1, .out_fd = -1 };
 
-static int io_multiplexing_out;
-static int io_multiplexing_in;
 static time_t last_io_in;
 static time_t last_io_out;
-static int no_flush;
 
 static int write_batch_monitor_in = -1;
 static int write_batch_monitor_out = -1;
 
-static int io_filesfrom_f_in = -1;
-static int io_filesfrom_f_out = -1;
-static char io_filesfrom_buf[2048];
-static char *io_filesfrom_bp;
-static char io_filesfrom_lastchar;
-static int io_filesfrom_buflen;
-static int defer_forwarding_messages = 0;
+static int ff_forward_fd = -1;
+static int ff_reenable_multiplex = -1;
+static char ff_lastchar = '\0';
+static xbuf ff_xb = EMPTY_XBUF;
+#ifdef ICONV_OPTION
+static xbuf iconv_buf = EMPTY_XBUF;
+#endif
 static int select_timeout = SELECT_TIMEOUT;
 static int active_filecnt = 0;
 static OFF_T active_bytecnt = 0;
+static int first_message = 1;
 
-static char int_byte_cnt[64] = {
-       3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, /* (00 - 3F)/4 */
-       3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, /* (40 - 7F)/4 */
-       4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, /* (80 - BF)/4 */
-       5, 5, 5, 5, 5, 5, 5, 5, 6, 6, 6, 6, 7, 7, 8, 9, /* (C0 - FF)/4 */
-};
-
-static void readfd(int fd, char *buffer, size_t N);
-static void writefd(int fd, const char *buf, size_t len);
-static void writefd_unbuffered(int fd, const char *buf, size_t len);
-static void decrement_active_files(int ndx);
-static void decrement_flist_in_progress(int ndx, int redo);
-
-struct flist_ndx_item {
-       struct flist_ndx_item *next;
-       int ndx;
-};
-
-struct flist_ndx_list {
-       struct flist_ndx_item *head, *tail;
+static char int_byte_extra[64] = {
+       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* (00 - 3F)/4 */
+       0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, /* (40 - 7F)/4 */
+       1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, /* (80 - BF)/4 */
+       2, 2, 2, 2, 2, 2, 2, 2, 3, 3, 3, 3, 4, 4, 5, 6, /* (C0 - FF)/4 */
 };
 
-static struct flist_ndx_list redo_list, hlink_list;
+#define IN_MULTIPLEXED (iobuf.in_multiplexed)
+#define OUT_MULTIPLEXED (iobuf.out_empty_len != 0)
 
-struct msg_list_item {
-       struct msg_list_item *next;
-       int len;
-       char buf[1];
-};
+#define PIO_NEED_INPUT (1<<0) /* The *_NEED_* flags are mutually exclusive. */
+#define PIO_NEED_OUTROOM (1<<1)
+#define PIO_NEED_MSGROOM (1<<2)
 
-struct msg_list {
-       struct msg_list_item *head, *tail;
-};
+#define PIO_CONSUME_INPUT (1<<4) /* Must be combined with PIO_NEED_INPUT. */
 
-static struct msg_list msg2genr, msg2sndr;
+#define PIO_INPUT_AND_CONSUME (PIO_NEED_INPUT | PIO_CONSUME_INPUT)
+#define PIO_NEED_FLAGS (PIO_NEED_INPUT | PIO_NEED_OUTROOM | PIO_NEED_MSGROOM)
 
-static void flist_ndx_push(struct flist_ndx_list *lp, int ndx)
-{
-       struct flist_ndx_item *item;
-
-       if (!(item = new(struct flist_ndx_item)))
-               out_of_memory("flist_ndx_push");
-       item->next = NULL;
-       item->ndx = ndx;
-       if (lp->tail)
-               lp->tail->next = item;
-       else
-               lp->head = item;
-       lp->tail = item;
-}
+#define REMOTE_OPTION_ERROR "rsync: on remote machine: -"
+#define REMOTE_OPTION_ERROR2 ": unknown option"
 
-static int flist_ndx_pop(struct flist_ndx_list *lp)
-{
-       struct flist_ndx_item *next;
-       int ndx;
+#define FILESFROM_BUFLEN 2048
 
-       if (!lp->head)
-               return -1;
+enum festatus { FES_SUCCESS, FES_REDO, FES_NO_SEND };
 
-       ndx = lp->head->ndx;
-       next = lp->head->next;
-       free(lp->head);
-       lp->head = next;
-       if (!next)
-               lp->tail = NULL;
+static flist_ndx_list redo_list, hlink_list;
 
-       return ndx;
-}
+static void drain_multiplex_messages(void);
+static void sleep_for_bwlimit(int bytes_written);
 
 static void check_timeout(void)
 {
@@ -192,307 +162,6 @@ static void check_timeout(void)
        }
 }
 
-/* Note the fds used for the main socket (which might really be a pipe
- * for a local transfer, but we can ignore that). */
-void io_set_sock_fds(int f_in, int f_out)
-{
-       sock_f_in = f_in;
-       sock_f_out = f_out;
-}
-
-void set_io_timeout(int secs)
-{
-       io_timeout = secs;
-
-       if (!io_timeout || io_timeout > SELECT_TIMEOUT)
-               select_timeout = SELECT_TIMEOUT;
-       else
-               select_timeout = io_timeout;
-
-       allowed_lull = read_batch ? 0 : (io_timeout + 1) / 2;
-}
-
-/* Setup the fd used to receive MSG_* messages.  Only needed during the
- * early stages of being a local sender (up through the sending of the
- * file list) or when we're the generator (to fetch the messages from
- * the receiver). */
-void set_msg_fd_in(int fd)
-{
-       msg_fd_in = fd;
-}
-
-/* Setup the fd used to send our MSG_* messages.  Only needed when
- * we're the receiver (to send our messages to the generator). */
-void set_msg_fd_out(int fd)
-{
-       msg_fd_out = fd;
-       set_nonblocking(msg_fd_out);
-}
-
-/* Add a message to the pending MSG_* list. */
-static void msg_list_add(struct msg_list *lst, int code, const char *buf, int len)
-{
-       struct msg_list_item *m;
-       int sz = len + 4 + sizeof m[0] - 1;
-
-       if (!(m = (struct msg_list_item *)new_array(char, sz)))
-               out_of_memory("msg_list_add");
-       m->next = NULL;
-       m->len = len + 4;
-       SIVAL(m->buf, 0, ((code+MPLEX_BASE)<<24) | len);
-       memcpy(m->buf + 4, buf, len);
-       if (lst->tail)
-               lst->tail->next = m;
-       else
-               lst->head = m;
-       lst->tail = m;
-}
-
-/* Read a message from the MSG_* fd and handle it.  This is called either
- * during the early stages of being a local sender (up through the sending
- * of the file list) or when we're the generator (to fetch the messages
- * from the receiver). */
-static void read_msg_fd(void)
-{
-       char buf[2048];
-       size_t n;
-       struct file_list *flist;
-       int fd = msg_fd_in;
-       int tag, len;
-
-       /* Temporarily disable msg_fd_in.  This is needed to avoid looping back
-        * to this routine from writefd_unbuffered(). */
-       msg_fd_in = -1;
-
-       readfd(fd, buf, 4);
-       tag = IVAL(buf, 0);
-
-       len = tag & 0xFFFFFF;
-       tag = (tag >> 24) - MPLEX_BASE;
-
-       switch (tag) {
-       case MSG_DONE:
-               if (len != 0 || !am_generator) {
-                 invalid_msg:
-                       rprintf(FERROR, "invalid message %d:%d [%s%s]\n",
-                               tag, len, who_am_i(),
-                               incremental ? "/incremental" : "");
-                       exit_cleanup(RERR_STREAMIO);
-               }
-               done_cnt++;
-               break;
-       case MSG_REDO:
-               if (len != 4 || !am_generator)
-                       goto invalid_msg;
-               readfd(fd, buf, 4);
-               if (remove_source_files)
-                       decrement_active_files(IVAL(buf,0));
-               flist_ndx_push(&redo_list, IVAL(buf,0));
-               if (incremental)
-                       decrement_flist_in_progress(IVAL(buf,0), 1);
-               break;
-       case MSG_FLIST:
-               if (len != 4 || !am_generator || !incremental)
-                       goto invalid_msg;
-               readfd(fd, buf, 4);
-               /* Read extra file list from receiver. */
-               assert(iobuf_in != NULL);
-               assert(iobuf_f_in == fd);
-               flist = recv_file_list(fd);
-               flist->parent_ndx = IVAL(buf,0);
-               break;
-       case MSG_FLIST_EOF:
-               if (len != 0 || !am_generator || !incremental)
-                       goto invalid_msg;
-               flist_eof = 1;
-               break;
-       case MSG_DELETED:
-               if (len >= (int)sizeof buf || !am_generator)
-                       goto invalid_msg;
-               readfd(fd, buf, len);
-               send_msg(MSG_DELETED, buf, len);
-               break;
-       case MSG_SUCCESS:
-               if (len != 4 || !am_generator)
-                       goto invalid_msg;
-               readfd(fd, buf, len);
-               if (remove_source_files) {
-                       decrement_active_files(IVAL(buf,0));
-                       send_msg(MSG_SUCCESS, buf, len);
-               }
-               if (preserve_hard_links)
-                       flist_ndx_push(&hlink_list, IVAL(buf,0));
-               if (incremental)
-                       decrement_flist_in_progress(IVAL(buf,0), 0);
-               break;
-       case MSG_NO_SEND:
-               if (len != 4 || !am_generator)
-                       goto invalid_msg;
-               readfd(fd, buf, len);
-               if (incremental)
-                       decrement_flist_in_progress(IVAL(buf,0), 0);
-               break;
-       case MSG_SOCKERR:
-       case MSG_CLIENT:
-               if (!am_generator)
-                       goto invalid_msg;
-               if (tag == MSG_SOCKERR)
-                       io_end_multiplex_out();
-               /* FALL THROUGH */
-       case MSG_INFO:
-       case MSG_ERROR:
-       case MSG_LOG:
-               while (len) {
-                       n = len;
-                       if (n >= sizeof buf)
-                               n = sizeof buf - 1;
-                       readfd(fd, buf, n);
-                       rwrite((enum logcode)tag, buf, n);
-                       len -= n;
-               }
-               break;
-       default:
-               rprintf(FERROR, "unknown message %d:%d [%s]\n",
-                       tag, len, who_am_i());
-               exit_cleanup(RERR_STREAMIO);
-       }
-
-       msg_fd_in = fd;
-}
-
-/* This is used by the generator to limit how many file transfers can
- * be active at once when --remove-source-files is specified.  Without
- * this, sender-side deletions were mostly happening at the end. */
-void increment_active_files(int ndx, int itemizing, enum logcode code)
-{
-       /* TODO: tune these limits? */
-       while (active_filecnt >= (active_bytecnt >= 128*1024 ? 10 : 50)) {
-#ifdef SUPPORT_HARD_LINKS
-               if (hlink_list.head)
-                       check_for_finished_hlinks(itemizing, code);
-#endif
-               read_msg_fd();
-       }
-
-       active_filecnt++;
-       active_bytecnt += F_LENGTH(cur_flist->files[ndx]);
-}
-
-static void decrement_active_files(int ndx)
-{
-       struct file_list *flist = flist_for_ndx(ndx);
-       assert(flist != NULL);
-       active_filecnt--;
-       active_bytecnt -= F_LENGTH(flist->files[ndx - flist->ndx_start]);
-}
-
-static void decrement_flist_in_progress(int ndx, int redo)
-{
-       struct file_list *flist = cur_flist ? cur_flist : first_flist;
-
-       while (ndx < flist->ndx_start) {
-               if (flist == first_flist) {
-                 invalid_ndx:
-                       rprintf(FERROR,
-                               "Invalid file index: %d (%d - %d) [%s]\n",
-                               ndx, first_flist->ndx_start,
-                               first_flist->prev->ndx_start + first_flist->prev->count - 1,
-                               who_am_i());
-                       exit_cleanup(RERR_PROTOCOL);
-               }
-               flist = flist->prev;
-       }
-       while (ndx >= flist->ndx_start + flist->count) {
-               if (!(flist = flist->next))
-                       goto invalid_ndx;
-       }
-
-       flist->in_progress--;
-       if (redo)
-               flist->to_redo++;
-}
-
-/* Try to push messages off the list onto the wire.  If we leave with more
- * to do, return 0.  On error, return -1.  If everything flushed, return 1.
- * This is only active in the receiver. */
-static int msg2genr_flush(void)
-{
-       if (msg_fd_out < 0 || no_flush || flist_forward_from >= 0)
-               return -1;
-
-       no_flush++;
-       while (msg2genr.head) {
-               struct msg_list_item *m = msg2genr.head;
-               writefd(msg_fd_out, m->buf, m->len);
-               msg2genr.head = m->next;
-               if (!msg2genr.head)
-                       msg2genr.tail = NULL;
-               free(m);
-       }
-       if (iobuf_out_cnt) {
-               writefd_unbuffered(iobuf_f_out, iobuf_out, iobuf_out_cnt);
-               iobuf_out_cnt = 0;
-       }
-       no_flush--;
-       return 1;
-}
-
-int send_msg(enum msgcode code, const char *buf, int len)
-{
-       if (msg_fd_out < 0) {
-               if (!defer_forwarding_messages)
-                       return io_multiplex_write(code, buf, len);
-               if (!io_multiplexing_out)
-                       return 0;
-               msg_list_add(&msg2sndr, code, buf, len);
-               return 1;
-       }
-       msg_list_add(&msg2genr, code, buf, len);
-       msg2genr_flush();
-       return 1;
-}
-
-void send_msg_int(enum msgcode code, int num)
-{
-       char numbuf[4];
-       SIVAL(numbuf, 0, num);
-       send_msg(code, numbuf, 4);
-}
-
-void wait_for_receiver(void)
-{
-       read_msg_fd();
-}
-
-int get_redo_num(void)
-{
-       return flist_ndx_pop(&redo_list);
-}
-
-int get_hlink_num(void)
-{
-       return flist_ndx_pop(&hlink_list);
-}
-
-/**
- * When we're the receiver and we have a local --files-from list of names
- * that needs to be sent over the socket to the sender, we have to do two
- * things at the same time: send the sender a list of what files we're
- * processing and read the incoming file+info list from the sender.  We do
- * this by augmenting the read_timeout() function to copy this data.  It
- * uses the io_filesfrom_buf to read a block of data from f_in (when it is
- * ready, since it might be a pipe) and then blast it out f_out (when it
- * is ready to receive more data).
- */
-void io_set_filesfrom_fds(int f_in, int f_out)
-{
-       io_filesfrom_f_in = f_in;
-       io_filesfrom_f_out = f_out;
-       io_filesfrom_bp = io_filesfrom_buf;
-       io_filesfrom_lastchar = '\0';
-       io_filesfrom_buflen = 0;
-}
-
 /* It's almost always an error to get an EOF when we're trying to read from the
  * network, because the protocol is (for the most part) self-terminating.
  *
@@ -505,9 +174,9 @@ void io_set_filesfrom_fds(int f_in, int f_out)
  * There is another case for older protocol versions (< 24) where the module
  * listing was not terminated, so we must ignore an EOF error in that case and
  * exit.  In this situation, kluge_around_eof will be > 0. */
-static void whine_about_eof(int fd)
+static NORETURN void whine_about_eof(BOOL allow_kluge)
 {
-       if (kluge_around_eof && fd == sock_f_in) {
+       if (kluge_around_eof && allow_kluge) {
                int i;
                if (kluge_around_eof > 0)
                        exit_cleanup(0);
@@ -517,464 +186,1362 @@ static void whine_about_eof(int fd)
        }
 
        rprintf(FERROR, RSYNC_NAME ": connection unexpectedly closed "
-               "(%.0f bytes received so far) [%s]\n",
-               (double)stats.total_read, who_am_i());
+               "(%s bytes received so far) [%s]\n",
+               big_num(stats.total_read), who_am_i());
 
        exit_cleanup(RERR_STREAMIO);
 }
 
-/**
- * Read from a socket with I/O timeout. return the number of bytes
- * read. If no bytes can be read then exit, never return a number <= 0.
- *
- * TODO: If the remote shell connection fails, then current versions
- * actually report an "unexpected EOF" error here.  Since it's a
- * fairly common mistake to try to use rsh when ssh is required, we
- * should trap that: if we fail to read any data at all, we should
- * give a better explanation.  We can tell whether the connection has
- * started by looking e.g. at whether the remote version is known yet.
- */
-static int read_timeout(int fd, char *buf, size_t len)
+/* Do a safe read, handling any needed looping and error handling.
+ * Returns the count of the bytes read, which will only be different
+ * from "len" if we encountered an EOF.  This routine is not used on
+ * the socket except very early in the transfer. */
+static size_t safe_read(int fd, char *buf, size_t len)
 {
-       int n, cnt = 0;
+       size_t got;
+       int n;
 
-       io_flush(FULL_FLUSH);
+       assert(fd != iobuf.in_fd);
+
+       n = read(fd, buf, len);
+       if ((size_t)n == len || n == 0) {
+               if (DEBUG_GTE(IO, 2))
+                       rprintf(FINFO, "[%s] safe_read(%d)=%ld\n", who_am_i(), fd, (long)n);
+               return n;
+       }
+       if (n < 0) {
+               if (errno != EINTR && errno != EWOULDBLOCK && errno != EAGAIN) {
+                 read_failed:
+                       rsyserr(FERROR, errno, "safe_read failed to read %ld bytes [%s]",
+                               (long)len, who_am_i());
+                       exit_cleanup(RERR_STREAMIO);
+               }
+               got = 0;
+       } else
+               got = n;
 
-       while (cnt == 0) {
-               /* until we manage to read *something* */
-               fd_set r_fds, w_fds;
+       while (1) {
                struct timeval tv;
-               int maxfd = fd;
-               int count;
+               fd_set r_fds, e_fds;
+               int cnt;
 
                FD_ZERO(&r_fds);
-               FD_ZERO(&w_fds);
                FD_SET(fd, &r_fds);
-               if (msg2genr.head) {
-                       FD_SET(msg_fd_out, &w_fds);
-                       if (msg_fd_out > maxfd)
-                               maxfd = msg_fd_out;
-               }
-               if (io_filesfrom_f_out >= 0) {
-                       int new_fd;
-                       if (io_filesfrom_buflen == 0) {
-                               if (io_filesfrom_f_in >= 0) {
-                                       FD_SET(io_filesfrom_f_in, &r_fds);
-                                       new_fd = io_filesfrom_f_in;
-                               } else {
-                                       io_filesfrom_f_out = -1;
-                                       new_fd = -1;
-                               }
-                       } else {
-                               FD_SET(io_filesfrom_f_out, &w_fds);
-                               new_fd = io_filesfrom_f_out;
-                       }
-                       if (new_fd > maxfd)
-                               maxfd = new_fd;
-               }
-
+               FD_ZERO(&e_fds);
+               FD_SET(fd, &e_fds);
                tv.tv_sec = select_timeout;
                tv.tv_usec = 0;
 
-               errno = 0;
-
-               count = select(maxfd + 1, &r_fds, &w_fds, NULL, &tv);
-
-               if (count <= 0) {
-                       if (errno == EBADF)
-                               exit_cleanup(RERR_SOCKETIO);
+               cnt = select(fd+1, &r_fds, NULL, &e_fds, &tv);
+               if (cnt <= 0) {
+                       if (cnt < 0 && errno == EBADF) {
+                               rsyserr(FERROR, errno, "safe_read select failed [%s]",
+                                       who_am_i());
+                               exit_cleanup(RERR_FILEIO);
+                       }
                        check_timeout();
                        continue;
                }
 
-               if (msg2genr.head && FD_ISSET(msg_fd_out, &w_fds))
-                       msg2genr_flush();
-
-               if (io_filesfrom_f_out >= 0) {
-                       if (io_filesfrom_buflen) {
-                               if (FD_ISSET(io_filesfrom_f_out, &w_fds)) {
-                                       int l = write(io_filesfrom_f_out,
-                                                     io_filesfrom_bp,
-                                                     io_filesfrom_buflen);
-                                       if (l > 0) {
-                                               if (!(io_filesfrom_buflen -= l))
-                                                       io_filesfrom_bp = io_filesfrom_buf;
-                                               else
-                                                       io_filesfrom_bp += l;
-                                       } else {
-                                               /* XXX should we complain? */
-                                               io_filesfrom_f_out = -1;
-                                       }
-                               }
-                       } else if (io_filesfrom_f_in >= 0) {
-                               if (FD_ISSET(io_filesfrom_f_in, &r_fds)) {
-                                       int l = read(io_filesfrom_f_in,
-                                                    io_filesfrom_buf,
-                                                    sizeof io_filesfrom_buf);
-                                       if (l <= 0) {
-                                               /* Send end-of-file marker */
-                                               io_filesfrom_buf[0] = '\0';
-                                               io_filesfrom_buf[1] = '\0';
-                                               io_filesfrom_buflen = io_filesfrom_lastchar? 2 : 1;
-                                               io_filesfrom_f_in = -1;
-                                       } else {
-                                               if (!eol_nulls) {
-                                                       char *s = io_filesfrom_buf + l;
-                                                       /* Transform CR and/or LF into '\0' */
-                                                       while (s-- > io_filesfrom_buf) {
-                                                               if (*s == '\n' || *s == '\r')
-                                                                       *s = '\0';
-                                                       }
-                                               }
-                                               if (!io_filesfrom_lastchar) {
-                                                       /* Last buf ended with a '\0', so don't
-                                                        * let this buf start with one. */
-                                                       while (l && !*io_filesfrom_bp)
-                                                               io_filesfrom_bp++, l--;
-                                               }
-                                               if (!l)
-                                                       io_filesfrom_bp = io_filesfrom_buf;
-                                               else {
-                                                       char *f = io_filesfrom_bp;
-                                                       char *t = f;
-                                                       char *eob = f + l;
-                                                       /* Eliminate any multi-'\0' runs. */
-                                                       while (f != eob) {
-                                                               if (!(*t++ = *f++)) {
-                                                                       while (f != eob && !*f)
-                                                                               f++, l--;
-                                                               }
-                                                       }
-                                                       io_filesfrom_lastchar = f[-1];
-                                               }
-                                               io_filesfrom_buflen = l;
-                                       }
-                               }
+               /*if (FD_ISSET(fd, &e_fds))
+                       rprintf(FINFO, "select exception on fd %d\n", fd); */
+
+               if (FD_ISSET(fd, &r_fds)) {
+                       n = read(fd, buf + got, len - got);
+                       if (DEBUG_GTE(IO, 2))
+                               rprintf(FINFO, "[%s] safe_read(%d)=%ld\n", who_am_i(), fd, (long)n);
+                       if (n == 0)
+                               break;
+                       if (n < 0) {
+                               if (errno == EINTR)
+                                       continue;
+                               goto read_failed;
                        }
+                       if ((got += (size_t)n) == len)
+                               break;
                }
+       }
 
-               if (!FD_ISSET(fd, &r_fds))
-                       continue;
+       return got;
+}
 
-               n = read(fd, buf, len);
+static const char *what_fd_is(int fd)
+{
+       static char buf[20];
 
-               if (n <= 0) {
-                       if (n == 0)
-                               whine_about_eof(fd); /* Doesn't return. */
-                       if (errno == EINTR || errno == EWOULDBLOCK
-                           || errno == EAGAIN)
-                               continue;
+       if (fd == sock_f_out)
+               return "socket";
+       else if (fd == iobuf.out_fd)
+               return "message fd";
+       else if (fd == batch_fd)
+               return "batch file";
+       else {
+               snprintf(buf, sizeof buf, "fd %d", fd);
+               return buf;
+       }
+}
 
-                       /* Don't write errors on a dead socket. */
-                       if (fd == sock_f_in) {
-                               io_end_multiplex_out();
-                               rsyserr(FSOCKERR, errno, "read error");
-                       } else
-                               rsyserr(FERROR, errno, "read error");
+/* Do a safe write, handling any needed looping and error handling.
+ * Returns only if everything was successfully written.  This routine
+ * is not used on the socket except very early in the transfer. */
+static void safe_write(int fd, const char *buf, size_t len)
+{
+       int n;
+
+       assert(fd != iobuf.out_fd);
+
+       n = write(fd, buf, len);
+       if ((size_t)n == len)
+               return;
+       if (n < 0) {
+               if (errno != EINTR && errno != EWOULDBLOCK && errno != EAGAIN) {
+                 write_failed:
+                       rsyserr(FERROR, errno,
+                               "safe_write failed to write %ld bytes to %s [%s]",
+                               (long)len, what_fd_is(fd), who_am_i());
                        exit_cleanup(RERR_STREAMIO);
                }
-
+       } else {
                buf += n;
                len -= n;
-               cnt += n;
-
-               if (fd == sock_f_in && io_timeout)
-                       last_io_in = time(NULL);
        }
 
-       return cnt;
-}
+       while (len) {
+               struct timeval tv;
+               fd_set w_fds;
+               int cnt;
 
-/**
- * Read a line into the "fname" buffer (which must be at least MAXPATHLEN
- * characters long).
- */
-int read_filesfrom_line(int fd, char *fname)
-{
-       char ch, *s, *eob = fname + MAXPATHLEN - 1;
-       int cnt;
-       int reading_remotely = filesfrom_host != NULL;
-       int nulls = eol_nulls || reading_remotely;
+               FD_ZERO(&w_fds);
+               FD_SET(fd, &w_fds);
+               tv.tv_sec = select_timeout;
+               tv.tv_usec = 0;
 
-  start:
-       s = fname;
-       while (1) {
-               cnt = read(fd, &ch, 1);
-               if (cnt < 0 && (errno == EWOULDBLOCK
-                 || errno == EINTR || errno == EAGAIN)) {
-                       struct timeval tv;
-                       fd_set r_fds, e_fds;
-                       FD_ZERO(&r_fds);
-                       FD_SET(fd, &r_fds);
-                       FD_ZERO(&e_fds);
-                       FD_SET(fd, &e_fds);
-                       tv.tv_sec = select_timeout;
-                       tv.tv_usec = 0;
-                       if (!select(fd+1, &r_fds, NULL, &e_fds, &tv))
-                               check_timeout();
-                       if (FD_ISSET(fd, &e_fds)) {
-                               rsyserr(FINFO, errno,
-                                       "select exception on fd %d", fd);
+               cnt = select(fd + 1, NULL, &w_fds, NULL, &tv);
+               if (cnt <= 0) {
+                       if (cnt < 0 && errno == EBADF) {
+                               rsyserr(FERROR, errno, "safe_write select failed on %s [%s]",
+                                       what_fd_is(fd), who_am_i());
+                               exit_cleanup(RERR_FILEIO);
                        }
+                       check_timeout();
                        continue;
                }
-               if (cnt != 1)
-                       break;
-               if (nulls? !ch : (ch == '\r' || ch == '\n')) {
-                       /* Skip empty lines if reading locally. */
-                       if (!reading_remotely && s == fname)
-                               continue;
-                       break;
+
+               if (FD_ISSET(fd, &w_fds)) {
+                       n = write(fd, buf, len);
+                       if (n < 0) {
+                               if (errno == EINTR)
+                                       continue;
+                               goto write_failed;
+                       }
+                       buf += n;
+                       len -= n;
                }
-               if (s < eob)
-                       *s++ = ch;
        }
-       *s = '\0';
-
-       /* Dump comments. */
-       if (*fname == '#' || *fname == ';')
-               goto start;
-
-       return s - fname;
 }
 
-int io_start_buffering_out(int f_out)
+/* This is only called when files-from data is known to be available.  We read
+ * a chunk of data and put it into the output buffer.
+ *
+ * The chunk is read from ff_forward_fd into ff_xb.  Unless eol_nulls is set,
+ * CR and LF bytes are turned into '\0'.  Runs of '\0' are then collapsed so
+ * that empty strings are not forwarded, and the result is handed to
+ * write_buf() (after an iconv conversion when filesfrom_convert is set).
+ * On EOF, or on a read error other than EINTR, the forwarding is shut down
+ * and an end-of-file marker is sent instead. */
+static void forward_filesfrom_data(void)
 {
-       if (iobuf_out) {
-               assert(f_out == iobuf_f_out);
-               return 0;
-       }
-       if (!(iobuf_out = new_array(char, IO_BUFFER_SIZE)))
-               out_of_memory("io_start_buffering_out");
-       iobuf_out_cnt = 0;
-       iobuf_f_out = f_out;
-       return 1;
-}
+       int len;
 
-int io_start_buffering_in(int f_in)
-{
-       if (iobuf_in) {
-               assert(f_in == iobuf_f_in);
-               return 0;
+       /* Append after the ff_xb.len bytes that are already held in the buffer. */
+       len = read(ff_forward_fd, ff_xb.buf + ff_xb.len, ff_xb.size - ff_xb.len);
+       if (len <= 0) {
+               /* An EINTR failure simply returns without changing any state. */
+               if (len == 0 || errno != EINTR) {
+                       /* Send end-of-file marker */
+                       ff_forward_fd = -1;
+                       /* Two '\0' bytes are written when ff_lastchar is non-zero,
+                        * and just one when it is already '\0'. */
+                       write_buf(iobuf.out_fd, "\0\0", ff_lastchar ? 2 : 1);
+                       free_xbuf(&ff_xb);
+                       /* A non-negative value here is passed back to
+                        * io_start_multiplex_out() to turn multiplexing on again. */
+                       if (ff_reenable_multiplex >= 0)
+                               io_start_multiplex_out(ff_reenable_multiplex);
+               }
+               return;
        }
-       iobuf_in_siz = 2 * IO_BUFFER_SIZE;
-       if (!(iobuf_in = new_array(char, iobuf_in_siz)))
-               out_of_memory("io_start_buffering_in");
-       iobuf_f_in = f_in;
-       return 1;
-}
 
-void io_end_buffering_in(void)
-{
-       if (!iobuf_in)
-               return;
-       free(iobuf_in);
-       iobuf_in = NULL;
-       iobuf_in_ndx = 0;
-       iobuf_in_remaining = 0;
-       iobuf_f_in = -1;
+       if (DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] files-from read=%ld\n", who_am_i(), (long)len);
+
+#ifdef ICONV_OPTION
+       /* Also count the bytes that were in the buffer before this read (the
+        * partial-string handling below can leave ff_xb.len bytes at the start). */
+       len += ff_xb.len;
+#endif
+
+       if (!eol_nulls) {
+               char *s = ff_xb.buf + len;
+               /* Transform CR and/or LF into '\0' */
+               while (s-- > ff_xb.buf) {
+                       if (*s == '\n' || *s == '\r')
+                               *s = '\0';
+               }
+       }
+
+       if (ff_lastchar)
+               ff_xb.pos = 0;
+       else {
+               char *s = ff_xb.buf;
+               /* Last buf ended with a '\0', so don't let this buf start with one. */
+               while (len && *s == '\0')
+                       s++, len--;
+               ff_xb.pos = s - ff_xb.buf;
+       }
+
+#ifdef ICONV_OPTION
+       if (filesfrom_convert && len) {
+               /* sob marks the start of the string being scanned, s is the scan
+                * position, and eob is one past the last byte of data. */
+               char *sob = ff_xb.buf + ff_xb.pos, *s = sob;
+               char *eob = sob + len;
+               int flags = ICB_INCLUDE_BAD | ICB_INCLUDE_INCOMPLETE | ICB_CIRCULAR_OUT;
+               if (ff_lastchar == '\0')
+                       flags |= ICB_INIT;
+               /* Convert/send each null-terminated string separately, skipping empties. */
+               while (s != eob) {
+                       if (*s++ == '\0') {
+                               /* Length of the string without its terminating '\0'. */
+                               ff_xb.len = s - sob - 1;
+                               if (iconvbufs(ic_send, &ff_xb, &iobuf.out, flags) < 0)
+                                       exit_cleanup(RERR_PROTOCOL); /* impossible? */
+                               write_buf(iobuf.out_fd, s-1, 1); /* Send the '\0'. */
+                               while (s != eob && *s == '\0')
+                                       s++;
+                               sob = s;
+                               ff_xb.pos = sob - ff_xb.buf;
+                               flags |= ICB_INIT;
+                       }
+               }
+
+               /* Whatever lies between sob and s now is an unterminated string. */
+               if ((ff_xb.len = s - sob) == 0)
+                       ff_lastchar = '\0';
+               else {
+                       /* Handle a partial string specially, saving any incomplete chars. */
+                       flags &= ~ICB_INCLUDE_INCOMPLETE;
+                       if (iconvbufs(ic_send, &ff_xb, &iobuf.out, flags) < 0) {
+                               if (errno == E2BIG)
+                                       exit_cleanup(RERR_PROTOCOL); /* impossible? */
+                               /* Shift the unconverted bytes to the start of the
+                                * buffer, where the next read() will append to them. */
+                               if (ff_xb.pos)
+                                       memmove(ff_xb.buf, ff_xb.buf + ff_xb.pos, ff_xb.len);
+                       }
+                       ff_lastchar = 'x'; /* Anything non-zero. */
+               }
+       } else
+#endif
+
+       if (len) {
+               /* f reads from the data, t writes the compacted copy at the
+                * start of the buffer. */
+               char *f = ff_xb.buf + ff_xb.pos;
+               char *t = ff_xb.buf;
+               char *eob = f + len;
+               /* Eliminate any multi-'\0' runs. */
+               while (f != eob) {
+                       if (!(*t++ = *f++)) {
+                               while (f != eob && *f == '\0')
+                                       f++;
+                       }
+               }
+               /* Remember the final byte of this chunk for the next call. */
+               ff_lastchar = f[-1];
+               if ((len = t - ff_xb.buf) != 0) {
+                       /* This will not circle back to perform_io() because we only get
+                        * called when there is plenty of room in the output buffer. */
+                       write_buf(iobuf.out_fd, ff_xb.buf, len);
+               }
+       }
+}
+
+/* Perform buffered input and output until specified conditions are met.  When
+ * given a "needed" read requirement, we'll return without doing any I/O if the
+ * iobuf.in bytes are already available.  When reading, we'll read as many
+ * bytes as we can into the buffer, and return as soon as we meet the minimum
+ * read requirement.  When given a "needed" write requirement, we'll return
+ * without doing any I/O if that many bytes will fit in the output buffer (we
+ * check either iobuf.out or iobuf.msg, depending on the flags).  When writing,
+ * we write out as much as we can, and return as soon as the given free-space
+ * requirement is available.
+ *
+ * The iobuf.out and iobuf.msg buffers are circular, so some writes into them
+ * will need to be split when the data needs to wrap around to the start.  In
+ * order to help make this easier for some operations (such as the use of
+ * SIVAL() into the buffer) the buffers MUST have 4 bytes of overflow space at
+ * the end that is not counted in the "size".  The iobuf.in buffer is not
+ * (currently) circular.  To facilitate the handling of MSG_DATA bytes as they
+ * are read-from/written-into the buffers, see the three raw_* iobuf vars.
+ *
+ * When writing, we flush data in the following priority order:
+ *
+ * 1. Finish writing any in-progress MSG_DATA sequence from iobuf.out.
+ *
+ * 2. Write out all the messages from the message buf (if iobuf.msg is active).
+ *    Yes, this means that a PIO_NEED_OUTROOM call will completely flush any
+ *    messages before getting to the iobuf.out flushing (except for rule 1).
+ *
+ * 3. Write out the raw data from iobuf.out, possibly filling in the multiplexed
+ *    MSG_DATA header that was pre-allocated (when output is multiplexed).
+ *
+ * TODO:  items for possible future work:
+ *
+ *    - Make this routine able to read the generator-to-receiver batch flow?
+ *
+ *    - Make the input buffer circular?
+ *
+ * Unlike the old routines that this replaces, it is OK to read ahead as far as
+ * we can because the read_a_msg() routine now reads its bytes out of the input
+ * buffer.  In the old days, only raw data was in the input buffer, and any
+ * unused raw data in the buf would prevent the reading of socket data. */
+static char *perform_io(size_t needed, int flags)
+{
+       fd_set r_fds, e_fds, w_fds;
+       struct timeval tv;
+       int cnt, max_fd;
+       size_t empty_buf_len = 0;
+       xbuf *out;
+       char *data;
+
+       /* The input buffer is empty, so rewind it to offset 0 and shift the
+        * raw_input_ends_before marker (when set) by the same amount. */
+       if (iobuf.in.len == 0 && iobuf.in.pos != 0) {
+               if (iobuf.raw_input_ends_before)
+                       iobuf.raw_input_ends_before -= iobuf.in.pos;
+               iobuf.in.pos = 0;
+       }
+
+       /* One-time setup and sanity checks for the requested kind of need. */
+       switch (flags & PIO_NEED_FLAGS) {
+       case PIO_NEED_INPUT:
+               if (DEBUG_GTE(IO, 3)) {
+                       rprintf(FINFO, "[%s] perform_io(%ld, %sinput)\n",
+                               who_am_i(), (long)needed, flags & PIO_CONSUME_INPUT ? "consume&" : "");
+               }
+
+               /* Make sure the input buffer is big enough to hold "needed" bytes.
+                * Also make sure it will fit in the free space at the end, or
+                * else we need to shift some bytes. */
+               if (needed && iobuf.in.size < needed) {
+                       if (!(iobuf.in.buf = realloc_array(iobuf.in.buf, char, needed)))
+                               out_of_memory("perform_io");
+                       if (DEBUG_GTE(IO, 4)) {
+                               rprintf(FINFO, "[%s] resized input buffer from %ld to %ld bytes.\n",
+                                       who_am_i(), (long)iobuf.in.size, (long)needed);
+                       }
+                       iobuf.in.size = needed;
+               }
+               /* Shift the pending bytes to the front when "needed" bytes cannot
+                * fit after pos, or when both the pending data and the free tail
+                * space are under 1024 bytes. */
+               if (iobuf.in.size - iobuf.in.pos < needed
+                || (iobuf.in.len < needed && iobuf.in.len < 1024
+                 && iobuf.in.size - (iobuf.in.pos + iobuf.in.len) < 1024)) {
+                       memmove(iobuf.in.buf, iobuf.in.buf + iobuf.in.pos, iobuf.in.len);
+                       if (DEBUG_GTE(IO, 4)) {
+                               rprintf(FINFO,
+                                       "[%s] moved %ld bytes from %ld to 0 in the input buffer (size=%ld, needed=%ld).\n",
+                                       who_am_i(), (long)iobuf.in.len, (long)iobuf.in.pos, (long)iobuf.in.size, (long)needed);
+                       }
+                       if (iobuf.raw_input_ends_before)
+                               iobuf.raw_input_ends_before -= iobuf.in.pos;
+                       iobuf.in.pos = 0;
+               }
+               break;
+
+       case PIO_NEED_OUTROOM:
+               /* We never resize the circular output buffer. */
+               if (iobuf.out.size - iobuf.out_empty_len < needed) {
+                       fprintf(stderr, "need to write %ld bytes, iobuf.out.buf is only %ld bytes.\n",
+                               (long)needed, (long)(iobuf.out.size - iobuf.out_empty_len));
+                       exit_cleanup(RERR_PROTOCOL);
+               }
+
+               if (DEBUG_GTE(IO, 3)) {
+                       rprintf(FINFO, "[%s] perform_io(%ld, outroom) needs to flush %ld\n",
+                               who_am_i(), (long)needed,
+                               iobuf.out.len + needed > iobuf.out.size
+                               ? (long)(iobuf.out.len + needed - iobuf.out.size) : 0L);
+               }
+               break;
+
+       case PIO_NEED_MSGROOM:
+               /* We never resize the circular message buffer. */
+               if (iobuf.msg.size < needed) {
+                       fprintf(stderr, "need to write %ld bytes, iobuf.msg.buf is only %ld bytes.\n",
+                               (long)needed, (long)iobuf.msg.size);
+                       exit_cleanup(RERR_PROTOCOL);
+               }
+
+               if (DEBUG_GTE(IO, 3)) {
+                       rprintf(FINFO, "[%s] perform_io(%ld, msgroom) needs to flush %ld\n",
+                               who_am_i(), (long)needed,
+                               iobuf.msg.len + needed > iobuf.msg.size
+                               ? (long)(iobuf.msg.len + needed - iobuf.msg.size) : 0L);
+               }
+               break;
+
+       case 0:
+               if (DEBUG_GTE(IO, 3))
+                       rprintf(FINFO, "[%s] perform_io(%ld, %d)\n", who_am_i(), (long)needed, flags);
+               break;
+
+       default:
+               exit_cleanup(RERR_UNSUPPORTED);
+       }
+
+       /* Main loop: each pass first checks whether the stated need is already
+        * met, then selects on the active fds and does at most one read, one
+        * write, and one files-from forwarding step. */
+       while (1) {
+               switch (flags & PIO_NEED_FLAGS) {
+               case PIO_NEED_INPUT:
+                       if (iobuf.in.len >= needed)
+                               goto double_break;
+                       break;
+               case PIO_NEED_OUTROOM:
+                       /* Note that iobuf.out_empty_len doesn't factor into this check
+                        * because iobuf.out.len already holds any needed header len. */
+                       if (iobuf.out.len + needed <= iobuf.out.size)
+                               goto double_break;
+                       break;
+               case PIO_NEED_MSGROOM:
+                       if (iobuf.msg.len + needed <= iobuf.msg.size)
+                               goto double_break;
+                       break;
+               }
+
+               max_fd = -1;
+
+               FD_ZERO(&r_fds);
+               FD_ZERO(&e_fds);
+               /* Only watch the input fd while there is free space after the
+                * pending input.  Note that max_fd is raised even when the
+                * read_batch test keeps the fd out of the sets. */
+               if (iobuf.in_fd >= 0 && iobuf.in.size - (iobuf.in.pos + iobuf.in.len)) {
+                       if (!read_batch || batch_fd >= 0) {
+                               FD_SET(iobuf.in_fd, &r_fds);
+                               FD_SET(iobuf.in_fd, &e_fds);
+                       }
+                       if (iobuf.in_fd > max_fd)
+                               max_fd = iobuf.in_fd;
+               }
+
+               /* Only do more filesfrom processing if there is enough room in the out buffer. */
+               if (ff_forward_fd >= 0 && iobuf.out.size - iobuf.out.len > FILESFROM_BUFLEN*2) {
+                       FD_SET(ff_forward_fd, &r_fds);
+                       if (ff_forward_fd > max_fd)
+                               max_fd = ff_forward_fd;
+               }
+
+               /* Choose which buffer (if any) to flush on this pass: iobuf.out
+                * when a raw-data flush is in progress, or when there are no
+                * pending messages, there is output data beyond the reserved
+                * header space, and the caller is not asking for message room;
+                * otherwise iobuf.msg when it holds anything. */
+               FD_ZERO(&w_fds);
+               if (iobuf.out_fd >= 0) {
+                       if (iobuf.raw_flushing_ends_before
+                        || (!iobuf.msg.len && iobuf.out.len > iobuf.out_empty_len && !(flags & PIO_NEED_MSGROOM))) {
+                               if (OUT_MULTIPLEXED && !iobuf.raw_flushing_ends_before) {
+                                       /* The iobuf.raw_flushing_ends_before value can point off the end
+                                        * of the iobuf.out buffer for a while, for easier subtracting. */
+                                       iobuf.raw_flushing_ends_before = iobuf.out.pos + iobuf.out.len;
+
+                                       /* Fill in the MSG_DATA header that was reserved ahead of the
+                                        * data; the 4 header bytes are not part of the payload length. */
+                                       SIVAL(iobuf.out.buf + iobuf.raw_data_header_pos, 0,
+                                             ((MPLEX_BASE + (int)MSG_DATA)<<24) + iobuf.out.len - 4);
+                                       if (iobuf.raw_data_header_pos + 4 > iobuf.out.size) {
+                                               int siz = (int)(iobuf.raw_data_header_pos + 4 - iobuf.out.size);
+                                               /* We used some of the overflow bytes, so move them. */
+                                               if (DEBUG_GTE(IO, 4)) {
+                                                       rprintf(FINFO, "[%s] wrap-bytes moved: %d (perform_io)\n",
+                                                               who_am_i(), siz);
+                                               }
+                                               memcpy(iobuf.out.buf, iobuf.out.buf + iobuf.out.size, siz);
+                                       }
+
+                                       if (DEBUG_GTE(IO, 1)) {
+                                               rprintf(FINFO, "[%s] send_msg(%d, %ld)\n",
+                                                       who_am_i(), (int)MSG_DATA, (long)iobuf.out.len - 4);
+                                       }
+
+                                       /* reserve room for the next MSG_DATA header */
+                                       iobuf.raw_data_header_pos = iobuf.raw_flushing_ends_before;
+                                       if (iobuf.raw_data_header_pos >= iobuf.out.size)
+                                               iobuf.raw_data_header_pos -= iobuf.out.size;
+                                       /* Yes, it is possible for this to make len > size for a while. */
+                                       iobuf.out.len += 4;
+                               }
+
+                               empty_buf_len = iobuf.out_empty_len;
+                               out = &iobuf.out;
+                       } else if (iobuf.msg.len) {
+                               empty_buf_len = 0;
+                               out = &iobuf.msg;
+                       } else
+                               out = NULL;
+                       if (out) {
+                               FD_SET(iobuf.out_fd, &w_fds);
+                               if (iobuf.out_fd > max_fd)
+                                       max_fd = iobuf.out_fd;
+                       }
+               } else
+                       out = NULL;
+
+               /* No fd is left to service: this is fatal when the caller stated a
+                * need, and otherwise just ends the loop. */
+               if (max_fd < 0) {
+                       switch (flags & PIO_NEED_FLAGS) {
+                       case PIO_NEED_INPUT:
+                               iobuf.in.len = 0;
+                               if (kluge_around_eof == 2)
+                                       exit_cleanup(0);
+                               if (iobuf.in_fd == -2)
+                                       whine_about_eof(True);
+                               rprintf(FERROR, "error in perform_io: no fd for input.\n");
+                               exit_cleanup(RERR_PROTOCOL);
+                       case PIO_NEED_OUTROOM:
+                       case PIO_NEED_MSGROOM:
+                               msgs2stderr = 1;
+                               drain_multiplex_messages();
+                               if (iobuf.out_fd == -2)
+                                       whine_about_eof(True);
+                               rprintf(FERROR, "error in perform_io: no fd for output.\n");
+                               exit_cleanup(RERR_PROTOCOL);
+                       default:
+                               /* No stated needs, so I guess this is OK. */
+                               break;
+                       }
+                       break;
+               }
+
+               /* While extra file-list sending is enabled and the lookahead limit
+                * has not been reached, use a zero timeout so that select() only
+                * polls; otherwise wait for up to select_timeout seconds. */
+               if (extra_flist_sending_enabled) {
+                       if (file_total - file_old_total < MAX_FILECNT_LOOKAHEAD)
+                               tv.tv_sec = 0;
+                       else {
+                               extra_flist_sending_enabled = False;
+                               tv.tv_sec = select_timeout;
+                       }
+               } else
+                       tv.tv_sec = select_timeout;
+               tv.tv_usec = 0;
+
+               cnt = select(max_fd + 1, &r_fds, &w_fds, &e_fds, &tv);
+
+               /* Nothing is ready (timeout) or select() failed. */
+               if (cnt <= 0) {
+                       if (cnt < 0 && errno == EBADF) {
+                               msgs2stderr = 1;
+                               exit_cleanup(RERR_SOCKETIO);
+                       }
+                       if (extra_flist_sending_enabled) {
+                               /* The flag is cleared around the call and re-enabled
+                                * afterward only if the file list is not yet complete. */
+                               extra_flist_sending_enabled = False;
+                               send_extra_file_list(sock_f_out, -1);
+                               extra_flist_sending_enabled = !flist_eof;
+                       } else
+                               check_timeout();
+                       FD_ZERO(&r_fds); /* Just in case... */
+                       FD_ZERO(&w_fds);
+               }
+
+               if (iobuf.in_fd >= 0 && FD_ISSET(iobuf.in_fd, &r_fds)) {
+                       /* Read into all of the free space that follows the pending input. */
+                       size_t pos = iobuf.in.pos + iobuf.in.len;
+                       size_t len = iobuf.in.size - pos;
+                       int n;
+                       if ((n = read(iobuf.in_fd, iobuf.in.buf + pos, len)) <= 0) {
+                               if (n == 0) {
+                                       /* Signal that input has become invalid. */
+                                       if (!read_batch || batch_fd < 0 || am_generator)
+                                               iobuf.in_fd = -2;
+                                       batch_fd = -1;
+                                       continue;
+                               }
+                               /* These errors are treated as a read of 0 bytes. */
+                               if (errno == EINTR || errno == EWOULDBLOCK || errno == EAGAIN)
+                                       n = 0;
+                               else {
+                                       /* Don't write errors on a dead socket. */
+                                       if (iobuf.in_fd == sock_f_in) {
+                                               if (am_sender)
+                                                       msgs2stderr = 1;
+                                               rsyserr(FERROR_SOCKET, errno, "read error");
+                                       } else
+                                               rsyserr(FERROR, errno, "read error");
+                                       exit_cleanup(RERR_SOCKETIO);
+                               }
+                       }
+                       if (msgs2stderr && DEBUG_GTE(IO, 2))
+                               rprintf(FINFO, "[%s] recv=%ld\n", who_am_i(), (long)n);
+
+                       if (io_timeout)
+                               last_io_in = time(NULL);
+                       stats.total_read += n;
+
+                       iobuf.in.len += n;
+               }
+
+               if (iobuf.out_fd >= 0 && FD_ISSET(iobuf.out_fd, &w_fds)) {
+                       /* During a raw-data flush only the bytes up to the flush end
+                        * marker are written; otherwise the whole buffer is eligible. */
+                       size_t len = iobuf.raw_flushing_ends_before ? iobuf.raw_flushing_ends_before - out->pos : out->len;
+                       int n;
+
+                       if (bwlimit_writemax && len > bwlimit_writemax)
+                               len = bwlimit_writemax;
+
+                       /* Never write past the end of the circular buffer in one call. */
+                       if (out->pos + len > out->size)
+                               len = out->size - out->pos;
+                       /* NOTE(review): errno is also consulted when write() returns 0,
+                        * in which case it may hold a stale value -- confirm whether
+                        * that case can occur here. */
+                       if ((n = write(iobuf.out_fd, out->buf + out->pos, len)) <= 0) {
+                               if (errno == EINTR || errno == EWOULDBLOCK || errno == EAGAIN)
+                                       n = 0;
+                               else {
+                                       /* Don't write errors on a dead socket. */
+                                       msgs2stderr = 1;
+                                       iobuf.out_fd = -2;
+                                       iobuf.out.len = iobuf.msg.len = iobuf.raw_flushing_ends_before = 0;
+                                       rsyserr(FERROR_SOCKET, errno, "[%s] write error", who_am_i());
+                                       drain_multiplex_messages();
+                                       exit_cleanup(RERR_SOCKETIO);
+                               }
+                       }
+                       if (msgs2stderr && DEBUG_GTE(IO, 2)) {
+                               rprintf(FINFO, "[%s] %s sent=%ld\n",
+                                       who_am_i(), out == &iobuf.out ? "out" : "msg", (long)n);
+                       }
+
+                       if (io_timeout)
+                               last_io_out = time(NULL);
+                       stats.total_written += n;
+
+                       if (bwlimit_writemax)
+                               sleep_for_bwlimit(n);
+
+                       /* Advance past the written bytes, wrapping pos (and the flush
+                        * end marker) at the end of the buffer, and clear the marker
+                        * once pos reaches it. */
+                       if ((out->pos += n) == out->size) {
+                               if (iobuf.raw_flushing_ends_before)
+                                       iobuf.raw_flushing_ends_before -= out->size;
+                               out->pos = 0;
+                       } else if (out->pos == iobuf.raw_flushing_ends_before)
+                               iobuf.raw_flushing_ends_before = 0;
+                       /* When only the reserved header space (if any) remains, reset
+                        * the buffer so that it starts at offset 0 again. */
+                       if ((out->len -= n) == empty_buf_len) {
+                               out->pos = 0;
+                               if (empty_buf_len)
+                                       iobuf.raw_data_header_pos = 0;
+                       }
+               }
+
+               if (ff_forward_fd >= 0 && FD_ISSET(ff_forward_fd, &r_fds)) {
+                       /* This can potentially flush all output and enable
+                        * multiplexed output, so keep this last in the loop
+                        * and be sure to not cache anything that would break
+                        * such a change. */
+                       forward_filesfrom_data();
+               }
+       }
+  double_break:
+
+       /* The return value always points at the current start of the pending
+        * input, as it was before any consuming done below. */
+       data = iobuf.in.buf + iobuf.in.pos;
+
+       if (flags & PIO_CONSUME_INPUT) {
+               iobuf.in.len -= needed;
+               iobuf.in.pos += needed;
+       }
+
+       return data;
+}
+
+/* Keep reading (and discarding) input forever.  This function has no return
+ * path of its own: it sets kluge_around_eof to 2 and then loops on read_buf().
+ * perform_io() calls exit_cleanup(0) when it needs input, has no fd to select
+ * on, and kluge_around_eof is 2; presumably that (or a timeout) is how the
+ * loop ends -- confirm against read_buf(). */
+void noop_io_until_death(void)
+{
+       char buf[1024]; /* Scratch space; the data read is never examined. */
+
+       kluge_around_eof = 2;
+       /* Setting an I/O timeout ensures that if something inexplicably weird
+        * happens, we won't hang around forever. */
+       if (!io_timeout)
+               set_io_timeout(60);
+
+       while (1)
+               read_buf(iobuf.in_fd, buf, sizeof buf);
+}
+
+/* Buffer a message for the multiplexed output stream.  Is never used for MSG_DATA.
+ *
+ * The message is a 4-byte header (the code plus the payload length) followed
+ * by "len" bytes from "buf", all appended to the circular iobuf.msg buffer.
+ * If there is not enough room, perform_io() is called first to make some.
+ *
+ * A "convert" value > 0 asks for the payload to be passed through iconv
+ * (only when ICONV_OPTION is defined and ic_send is valid); a value < 0
+ * suppresses the debug output of this function.
+ *
+ * Returns 0 without doing anything if output is not multiplexed, else 1. */
+int send_msg(enum msgcode code, const char *buf, size_t len, int convert)
+{
+       char *hdr;
+       size_t pos;
+       BOOL want_debug = DEBUG_GTE(IO, 1) && convert >= 0 && (msgs2stderr || code != MSG_INFO);
+
+       if (!OUT_MULTIPLEXED)
+               return 0;
+
+       if (want_debug)
+               rprintf(FINFO, "[%s] send_msg(%d, %ld)\n", who_am_i(), (int)code, (long)len);
+
+#ifdef ICONV_OPTION
+       /* No conversion is possible without a valid iconv handle. */
+       if (convert > 0 && ic_send == (iconv_t)-1)
+               convert = 0;
+       if (convert > 0) {
+               /* Ensuring double-size room leaves space for maximal conversion expansion. */
+               if (iobuf.msg.len + len*2 + 4 > iobuf.msg.size)
+                       perform_io(len*2 + 4, PIO_NEED_MSGROOM);
+       } else
+#endif
+       if (iobuf.msg.len + len + 4 > iobuf.msg.size)
+               perform_io(len + 4, PIO_NEED_MSGROOM);
+
+       pos = iobuf.msg.pos + iobuf.msg.len; /* Must be set after any flushing. */
+       if (pos >= iobuf.msg.size)
+               pos -= iobuf.msg.size;
+       /* The header is filled in last, once the final payload length is known. */
+       hdr = iobuf.msg.buf + pos;
+
+       iobuf.msg.len += 4; /* Allocate room for the coming header bytes. */
+
+#ifdef ICONV_OPTION
+       if (convert > 0) {
+               xbuf inbuf;
+
+               INIT_XBUF(inbuf, (char*)buf, len, (size_t)-1);
+
+               /* Remember the starting length so that the converted size can be
+                * computed from the growth of iobuf.msg.len. */
+               len = iobuf.msg.len;
+               iconvbufs(ic_send, &inbuf, &iobuf.msg,
+                         ICB_INCLUDE_BAD | ICB_INCLUDE_INCOMPLETE | ICB_CIRCULAR_OUT | ICB_INIT);
+               if (inbuf.len > 0) {
+                       /* NOTE(review): unlike the other rprintf() calls in this
+                        * function, this message has no trailing newline -- confirm
+                        * whether that is intended. */
+                       rprintf(FERROR, "overflowed iobuf.msg buffer in send_msg");
+                       exit_cleanup(RERR_UNSUPPORTED);
+               }
+               len = iobuf.msg.len - len;
+       } else
+#endif
+       {
+               size_t siz;
+
+               /* Step past the header to where the payload starts. */
+               if ((pos += 4) >= iobuf.msg.size)
+                       pos -= iobuf.msg.size;
+
+               /* Handle a split copy if we wrap around the end of the circular buffer. */
+               if (pos >= iobuf.msg.pos && (siz = iobuf.msg.size - pos) < len) {
+                       memcpy(iobuf.msg.buf + pos, buf, siz);
+                       memcpy(iobuf.msg.buf, buf + siz, len - siz);
+               } else
+                       memcpy(iobuf.msg.buf + pos, buf, len);
+
+               iobuf.msg.len += len;
+       }
+
+       SIVAL(hdr, 0, ((MPLEX_BASE + (int)code)<<24) + len);
+       /* If the header used any overflow bytes, move them to the start. */
+       if ((pos = hdr+4 - iobuf.msg.buf) > iobuf.msg.size) {
+               int siz = (int)(pos - iobuf.msg.size);
+               if (DEBUG_GTE(IO, 4))
+                       rprintf(FINFO, "[%s] wrap-bytes moved: %d (send_msg)\n", who_am_i(), siz);
+               memcpy(iobuf.msg.buf, iobuf.msg.buf + iobuf.msg.size, siz);
+       }
+
+       if (want_debug && convert > 0)
+               rprintf(FINFO, "[%s] converted msg len=%ld\n", who_am_i(), (long)len);
+
+       return 1;
+}
+
+/* Send a message whose payload is the single integer "num", stored into a
+ * 4-byte buffer with SIVAL().  The result of send_msg() is ignored. */
+void send_msg_int(enum msgcode code, int num)
+{
+       char numbuf[4];
+
+       if (DEBUG_GTE(IO, 1))
+               rprintf(FINFO, "[%s] send_msg_int(%d, %d)\n", who_am_i(), (int)code, num);
+
+       SIVAL(numbuf, 0, num);
+       /* A convert value of -1 means no conversion, and it also silences the
+        * debug line in send_msg() (this function has already logged the call). */
+       send_msg(code, numbuf, 4, -1);
+}
+
+/* Record the reported status of the file-list entry with index "ndx".
+ *
+ * The active-transfer counters are reduced when remove_source_files is set,
+ * and the owning list's in_progress count is reduced when inc_recurse is set.
+ * Then, depending on "status", the index may be reported with MSG_SUCCESS,
+ * pushed onto hlink_list, or pushed onto redo_list. */
+static void got_flist_entry_status(enum festatus status, int ndx)
+{
+       struct file_list *flist = flist_for_ndx(ndx, "got_flist_entry_status");
+
+       /* This undoes the accounting done by increment_active_files(). */
+       if (remove_source_files) {
+               active_filecnt--;
+               active_bytecnt -= F_LENGTH(flist->files[ndx - flist->ndx_start]);
+       }
+
+       if (inc_recurse)
+               flist->in_progress--;
+
+       switch (status) {
+       case FES_SUCCESS:
+               if (remove_source_files)
+                       send_msg_int(MSG_SUCCESS, ndx);
+               if (preserve_hard_links) {
+                       struct file_struct *file = flist->files[ndx - flist->ndx_start];
+                       /* A hard-linked file is queued on hlink_list and counted as
+                        * in progress again. */
+                       if (F_IS_HLINKED(file)) {
+                               flist_ndx_push(&hlink_list, ndx);
+                               flist->in_progress++;
+                       }
+               }
+               break;
+       case FES_REDO:
+               /* When reading a batch nothing is queued for redo; only the
+                * in_progress decrement from above is undone. */
+               if (read_batch) {
+                       if (inc_recurse)
+                               flist->in_progress++;
+                       break;
+               }
+               if (inc_recurse)
+                       flist->to_redo++;
+               flist_ndx_push(&redo_list, ndx);
+               break;
+       case FES_NO_SEND:
+               break;
+       }
+}
+
+/* Note the fds used for the main socket (which might really be a pipe
+ * for a local transfer, but we can ignore that).  The values are simply
+ * stored in sock_f_in and sock_f_out for later comparisons. */
+void io_set_sock_fds(int f_in, int f_out)
+{
+       sock_f_in = f_in;
+       sock_f_out = f_out;
+}
+
+/* Set the I/O timeout to "secs" seconds and derive the related values:
+ * select_timeout is the timeout capped at SELECT_TIMEOUT (SELECT_TIMEOUT is
+ * also used when the timeout is 0), and allowed_lull is half the timeout,
+ * rounded up, or 0 when reading a batch. */
+void set_io_timeout(int secs)
+{
+       io_timeout = secs;
+
+       if (!io_timeout || io_timeout > SELECT_TIMEOUT)
+               select_timeout = SELECT_TIMEOUT;
+       else
+               select_timeout = io_timeout;
+
+       allowed_lull = read_batch ? 0 : (io_timeout + 1) / 2;
 }
 
-void io_end_buffering_out(void)
+/* Examine the text "msg" and, if it looks like an option error that involves
+ * a 'd' among a group of option letters, print a hint about "--old-d".
+ *
+ * The text must start with REMOTE_OPTION_ERROR, continue with something other
+ * than '-', and contain a ':' that begins REMOTE_OPTION_ERROR2.  The letters
+ * before that ':' are scanned: any letter other than 'd' or 'e' that is not
+ * in rsync263_opts means no hint is given, and an 'e' ends the scan. */
+static void check_for_d_option_error(const char *msg)
 {
-       if (!iobuf_out)
+       static char rsync263_opts[] = "BCDHIKLPRSTWabceghlnopqrtuvxz";
+       char *colon;
+       int saw_d = 0;
+
+       /* Presumably the first-character test is a cheap rejection before the
+        * full prefix comparison -- this assumes REMOTE_OPTION_ERROR starts
+        * with 'r'; confirm against its definition. */
+       if (*msg != 'r'
+        || strncmp(msg, REMOTE_OPTION_ERROR, sizeof REMOTE_OPTION_ERROR - 1) != 0)
+               return;
+
+       msg += sizeof REMOTE_OPTION_ERROR - 1;
+       if (*msg == '-' || (colon = strchr(msg, ':')) == NULL
+        || strncmp(colon, REMOTE_OPTION_ERROR2, sizeof REMOTE_OPTION_ERROR2 - 1) != 0)
                return;
+
+       /* The ':' found above guarantees that this scan terminates. */
+       for ( ; *msg != ':'; msg++) {
+               if (*msg == 'd')
+                       saw_d = 1;
+               else if (*msg == 'e')
+                       break;
+               else if (strchr(rsync263_opts, *msg) == NULL)
+                       return;
+       }
+
+       if (saw_d) {
+               rprintf(FWARNING,
+                   "*** Try using \"--old-d\" if remote rsync is <= 2.6.3 ***\n");
+       }
+}
+
+/* This is used by the generator to limit how many file transfers can
+ * be active at once when --remove-source-files is specified.  Without
+ * this, sender-side deletions were mostly happening at the end.
+ *
+ * The call does not continue until active_filecnt is below the current
+ * limit; it then counts the file at index "ndx" of cur_flist as active and
+ * adds its length to active_bytecnt.  The "itemizing" and "code" arguments
+ * are only passed through to check_for_finished_files(). */
+void increment_active_files(int ndx, int itemizing, enum logcode code)
+{
+       while (1) {
+               /* TODO: tune these limits? */
+               /* The file limit drops from 50 to 10 once 128 KiB or more of
+                * file data is counted as active. */
+               int limit = active_bytecnt >= 128*1024 ? 10 : 50;
+               if (active_filecnt < limit)
+                       break;
+               /* Try handling finished files first, and only wait for the
+                * receiver if that did not bring the count under the limit. */
+               check_for_finished_files(itemizing, code, 0);
+               if (active_filecnt < limit)
+                       break;
+               wait_for_receiver();
+       }
+
+       active_filecnt++;
+       active_bytecnt += F_LENGTH(cur_flist->files[ndx - cur_flist->ndx_start]);
+}
+
+int get_redo_num(void) /* Pop the next entry off redo_list and return it. */
+{
+       return flist_ndx_pop(&redo_list); /* the result for an empty list is whatever flist_ndx_pop() yields */
+}
+
+int get_hlink_num(void) /* Pop the next entry off hlink_list and return it. */
+{
+       return flist_ndx_pop(&hlink_list); /* the result for an empty list is whatever flist_ndx_pop() yields */
+}
+
+/* When we're the receiver and we have a local --files-from list of names
+ * that needs to be sent over the socket to the sender, we have to do two
+ * things at the same time: send the sender a list of what files we're
+ * processing and read the incoming file+info list from the sender.  We do
+ * this by making recv_file_list() call forward_filesfrom_data(), which
+ * will ensure that we forward data to the sender until we get some data
+ * for recv_file_list() to use. */
+void start_filesfrom_forwarding(int fd)
+{
+       if (protocol_version < 31 && OUT_MULTIPLEXED) {
+               /* Older protocols send the files-from data w/o packaging
+                * it in multiplexed I/O packets, so temporarily switch
+                * to buffered I/O to match this behavior. */
+               iobuf.msg.pos = iobuf.msg.len = 0; /* Be extra sure no messages go out. */
+               ff_reenable_multiplex = io_end_multiplex_out(MPLX_TO_BUFFERED); /* NOTE(review): saved result presumably tells later code to turn multiplexing back on -- confirm */
+       }
+       ff_forward_fd = fd; /* the files-from fd to forward data from */
+
+       alloc_xbuf(&ff_xb, FILESFROM_BUFLEN); /* set up ff_xb with FILESFROM_BUFLEN bytes */
+}
+
+/* Read a line from fd into the "buf" buffer (at most bufsiz-1 chars are kept) and return the stored length. */
+int read_line(int fd, char *buf, size_t bufsiz, int flags)
+{
+       char ch, *s, *eob;
+
+#ifdef ICONV_OPTION
+       if (flags & RL_CONVERT && iconv_buf.size < bufsiz) /* make sure the staging buffer can hold a full line */
+               realloc_xbuf(&iconv_buf, bufsiz + 1024);
+#endif
+
+  start:
+#ifdef ICONV_OPTION
+       s = flags & RL_CONVERT ? iconv_buf.buf : buf; /* when converting, collect raw bytes in iconv_buf first */
+#else
+       s = buf;
+#endif
+       eob = s + bufsiz - 1; /* leave room for the terminating '\0' */
+       while (1) {
+               /* We avoid read_byte() for files because files can return an EOF. */
+               if (fd == iobuf.in_fd)
+                       ch = read_byte(fd);
+               else if (safe_read(fd, &ch, 1) == 0) /* a zero-byte read ends the line */
+                       break;
+               if (flags & RL_EOL_NULLS ? ch == '\0' : (ch == '\r' || ch == '\n')) { /* terminator is '\0', or CR/LF, depending on flags */
+                       /* Skip empty lines if dumping comments. */
+                       if (flags & RL_DUMP_COMMENTS && s == buf)
+                               continue;
+                       break;
+               }
+               if (s < eob) /* chars beyond the buffer are read but dropped */
+                       *s++ = ch;
+       }
+       *s = '\0';
+
+       if (flags & RL_DUMP_COMMENTS && (*buf == '#' || *buf == ';')) /* comment line: discard it and read another */
+               goto start;
+
+#ifdef ICONV_OPTION
+       if (flags & RL_CONVERT) {
+               xbuf outbuf;
+               INIT_XBUF(outbuf, buf, 0, bufsiz);
+               iconv_buf.pos = 0;
+               iconv_buf.len = s - iconv_buf.buf; /* number of raw bytes collected */
+               iconvbufs(ic_recv, &iconv_buf, &outbuf,
+                         ICB_INCLUDE_BAD | ICB_INCLUDE_INCOMPLETE | ICB_INIT);
+               outbuf.buf[outbuf.len] = '\0';
+               return outbuf.len; /* length after conversion */
+       }
+#endif
+
+       return s - buf;
+}
+
+void read_args(int f_in, char *mod_name, char *buf, size_t bufsiz, int rl_nulls,
+              char ***argv_p, int *argc_p, char **request_p) /* Build an argv from lines read off f_in; results go to *argv_p and *argc_p. */
+{
+       int maxargs = MAX_ARGS;
+       int dot_pos = 0; /* non-zero once the lone "." arg has been seen */
+       int argc = 0;
+       char **argv, *p;
+       int rl_flags = (rl_nulls ? RL_EOL_NULLS : 0);
+
+#ifdef ICONV_OPTION
+       rl_flags |= (protect_args && ic_recv != (iconv_t)-1 ? RL_CONVERT : 0);
+#endif
+
+       if (!(argv = new_array(char *, maxargs)))
+               out_of_memory("read_args");
+       if (mod_name && !protect_args)
+               argv[argc++] = "rsyncd"; /* a string literal, unlike the strdup'ed entries below */
+
+       while (1) {
+               if (read_line(f_in, buf, bufsiz, rl_flags) == 0) /* a zero-length line ends the list */
+                       break;
+
+               if (argc == maxargs-1) { /* grow while one slot is still free for the final NULL */
+                       maxargs += MAX_ARGS;
+                       if (!(argv = realloc_array(argv, char *, maxargs)))
+                               out_of_memory("read_args");
+               }
+
+               if (dot_pos) { /* args after the "." are glob-expanded */
+                       if (request_p) {
+                               *request_p = strdup(buf); /* only the first post-"." arg is saved; NOTE(review): result is not checked for NULL */
+                               request_p = NULL;
+                       }
+                       if (mod_name)
+                               glob_expand_module(mod_name, buf, &argv, &argc, &maxargs);
+                       else
+                               glob_expand(buf, &argv, &argc, &maxargs);
+               } else {
+                       if (!(p = strdup(buf)))
+                               out_of_memory("read_args");
+                       argv[argc++] = p;
+                       if (*p == '.' && p[1] == '\0')
+                               dot_pos = argc;
+               }
+       }
+       argv[argc] = NULL;
+
+       glob_expand(NULL, NULL, NULL, NULL); /* NOTE(review): all-NULL call presumably releases glob_expand()'s internal state -- confirm */
+
+       *argc_p = argc;
+       *argv_p = argv;
+}
+
+BOOL io_start_buffering_out(int f_out) /* Returns True if the output buffer was allocated here, False if it already existed. */
+{
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_start_buffering_out(%d)\n", who_am_i(), f_out);
+
+       if (OUT_MULTIPLEXED && !iobuf.msg.buf) { /* the message buffer is only created when output is multiplexed */
+               iobuf.msg.size = IO_BUFFER_SIZE - 4;
+               if (!(iobuf.msg.buf = new_array(char, iobuf.msg.size + 4))) /* allocation is 4 bytes larger than .size */
+                       out_of_memory("io_start_buffering_out");
+               iobuf.msg.pos = iobuf.msg.len = 0;
+       }
+
+       if (iobuf.out.buf) { /* buffer already present: just (re)attach the fd */
+               if (iobuf.out_fd == -1)
+                       iobuf.out_fd = f_out;
+               else
+                       assert(f_out == iobuf.out_fd); /* an attached buffer must be for the same fd */
+               return False;
+       }
+
+       iobuf.out.size = IO_BUFFER_SIZE * 2 - 4;
+       /* The 4 overflow bytes makes some circular-buffer wrapping operations easier. */
+       if (!(iobuf.out.buf = new_array(char, iobuf.out.size + 4)))
+               out_of_memory("io_start_buffering_out");
+       iobuf.out.pos = iobuf.out.len = 0;
+       iobuf.out_fd = f_out;
+
+       return True;
+}
+
+BOOL io_start_buffering_in(int f_in) /* Returns True if the input buffer was allocated here, False if it already existed. */
+{
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_start_buffering_in(%d)\n", who_am_i(), f_in);
+
+       if (iobuf.in.buf) { /* buffer already present: just (re)attach the fd */
+               if (iobuf.in_fd == -1)
+                       iobuf.in_fd = f_in;
+               else
+                       assert(f_in == iobuf.in_fd); /* an attached buffer must be for the same fd */
+               return False;
+       }
+
+       iobuf.in.size = IO_BUFFER_SIZE;
+       if (!(iobuf.in.buf = new_array(char, iobuf.in.size)))
+               out_of_memory("io_start_buffering_in");
+
+       iobuf.in.pos = iobuf.in.len = 0; /* start with an empty buffer */
+
+       iobuf.in_fd = f_in;
+
+       return True;
+}
+
+void io_end_buffering_in(BOOL free_buffers) /* Detach the input fd; free the input buffer or just empty it. */
+{
+       if (msgs2stderr && DEBUG_GTE(IO, 2)) {
+               rprintf(FINFO, "[%s] io_end_buffering_in(IOBUF_%s_BUFS)\n",
+                       who_am_i(), free_buffers ? "FREE" : "KEEP");
+       }
+
+       if (free_buffers)
+               free_xbuf(&iobuf.in);
+       else
+               iobuf.in.pos = iobuf.in.len = 0; /* keep the allocation but discard any buffered input */
+
+       iobuf.in_fd = -1; /* -1 marks "no fd attached" (see io_start_buffering_in) */
+}
+
+void io_end_buffering_out(BOOL free_buffers) /* Flush all output, optionally free the out/msg buffers, and detach the output fd. */
+{
+       if (msgs2stderr && DEBUG_GTE(IO, 2)) {
+               rprintf(FINFO, "[%s] io_end_buffering_out(IOBUF_%s_BUFS)\n",
+                       who_am_i(), free_buffers ? "FREE" : "KEEP");
+       }
+
        io_flush(FULL_FLUSH);
-       free(iobuf_out);
-       iobuf_out = NULL;
-       iobuf_f_out = -1;
+
+       if (free_buffers) { /* otherwise both buffers are kept for reuse */
+               free_xbuf(&iobuf.out);
+               free_xbuf(&iobuf.msg);
+       }
+
+       iobuf.out_fd = -1; /* -1 marks "no fd attached" (see io_start_buffering_out) */
 }
 
-void maybe_flush_socket(void)
+void maybe_flush_socket(int important) /* Flush buffered output once flist_eof is set, if "important" or nothing was written for 5 seconds. */
 {
-       if (iobuf_out && iobuf_out_cnt && time(NULL) - last_io_out >= 5)
+       if (flist_eof && iobuf.out.buf && iobuf.out.len > iobuf.out_empty_len /* NOTE(review): out_empty_len appears to be the length of a buffer holding no payload -- confirm */
+        && (important || time(NULL) - last_io_out >= 5))
                io_flush(NORMAL_FLUSH);
 }
 
 void maybe_send_keepalive(void)
 {
        if (time(NULL) - last_io_out >= allowed_lull) {
-               if (!iobuf_out || !iobuf_out_cnt) {
+               if (!iobuf.msg.len && iobuf.out.len == iobuf.out_empty_len) { /* nothing queued in either buffer, so create something to send */
                        if (protocol_version < 29)
                                return; /* there's nothing we can do */
                        if (protocol_version >= 30)
-                               send_msg(MSG_NOOP, "", 0);
+                               send_msg(MSG_NOOP, "", 0, 0); /* zero-length MSG_NOOP message */
                        else {
-                               write_int(sock_f_out, cur_flist->count);
-                               write_shortint(sock_f_out, ITEM_IS_NEW);
+                               write_int(iobuf.out_fd, cur_flist->used); /* protocol 29: an int followed by a shortint of ITEM_IS_NEW */
+                               write_shortint(iobuf.out_fd, ITEM_IS_NEW);
                        }
                }
-               if (iobuf_out)
+               if (iobuf.msg.len) /* queued messages take priority over the plain output flush */
+                       perform_io(iobuf.msg.size - iobuf.msg.len + 1, PIO_NEED_MSGROOM); /* NOTE(review): asks for one byte more than is free, presumably to force message data out -- confirm */
+               else if (iobuf.out.len > iobuf.out_empty_len)
                        io_flush(NORMAL_FLUSH);
        }
 }
 
-void start_flist_forward(int f_in)
-{
-       assert(iobuf_out != NULL);
-       assert(iobuf_f_out == msg_fd_out);
-       flist_forward_from = f_in;
-}
-
-void stop_flist_forward()
-{
-       flist_forward_from = -1;
-       io_flush(FULL_FLUSH);
-}
-
-/**
- * Continue trying to read len bytes - don't return until len has been
- * read.
- **/
-static void read_loop(int fd, char *buf, size_t len)
+void start_flist_forward(int ndx) /* Write ndx to the output fd and turn on forwarding of data read by read_buf(). */
+{
+       write_int(iobuf.out_fd, ndx);
+       forward_flist_data = 1; /* while set, read_buf() echoes buffered-input reads to iobuf.out_fd */
+}
+
+void stop_flist_forward(void) /* Turn off the forwarding enabled by start_flist_forward(). */
+{
+       forward_flist_data = 0; /* read_buf() stops echoing its reads to iobuf.out_fd */
+}
+
+/* Read one message header from a multiplexed source and act on its tag. */
+static void read_a_msg(void)
+{
+       char *data, line[BIGPATHBUFLEN];
+       int tag, val;
+       size_t msg_bytes;
+
+       data = perform_io(4, PIO_INPUT_AND_CONSUME); /* the 4-byte message header */
+       tag = IVAL(data, 0);
+
+       msg_bytes = tag & 0xFFFFFF; /* low 24 bits: payload length */
+       tag = (tag >> 24) - MPLEX_BASE; /* top byte, less MPLEX_BASE: message type */
+
+       if (DEBUG_GTE(IO, 1) && (msgs2stderr || tag != MSG_INFO))
+               rprintf(FINFO, "[%s] got msg=%d, len=%ld\n", who_am_i(), (int)tag, (long)msg_bytes);
+
+       switch (tag) {
+       case MSG_DATA:
+               assert(iobuf.raw_input_ends_before == 0); /* a new data msg must not arrive while one is pending */
+               /* Though this does not yet read the data, we do mark where in
+                * the buffer the msg data will end once it is read.  It is
+                * possible that this points off the end of the buffer, in
+                * which case the gradual reading of the input stream will
+                * cause this value to decrease and eventually become real. */
+               iobuf.raw_input_ends_before = iobuf.in.pos + msg_bytes;
+               break;
+       case MSG_STATS:
+               if (msg_bytes != sizeof stats.total_read || !am_generator) /* accepted only by the generator, with an exact-size payload */
+                       goto invalid_msg;
+               data = perform_io(sizeof stats.total_read, PIO_INPUT_AND_CONSUME);
+               memcpy((char*)&stats.total_read, data, sizeof stats.total_read); /* payload is copied verbatim, with no byte-order conversion */
+               break;
+       case MSG_REDO:
+               if (msg_bytes != 4 || !am_generator) /* accepted only by the generator */
+                       goto invalid_msg;
+               data = perform_io(4, PIO_INPUT_AND_CONSUME);
+               got_flist_entry_status(FES_REDO, IVAL(data, 0));
+               break;
+       case MSG_IO_ERROR:
+               if (msg_bytes != 4 || am_sender) /* the sender never accepts this */
+                       goto invalid_msg;
+               data = perform_io(4, PIO_INPUT_AND_CONSUME);
+               val = IVAL(data, 0);
+               io_error |= val; /* merge the reported bits into our own io_error */
+               if (!am_generator)
+                       send_msg_int(MSG_IO_ERROR, val); /* pass the value along */
+               break;
+       case MSG_IO_TIMEOUT:
+               if (msg_bytes != 4 || am_server || am_generator)
+                       goto invalid_msg;
+               data = perform_io(4, PIO_INPUT_AND_CONSUME);
+               val = IVAL(data, 0);
+               if (!io_timeout || io_timeout > val) { /* adopt val when we have no timeout or a longer one */
+                       if (INFO_GTE(MISC, 2))
+                               rprintf(FINFO, "Setting --timeout=%d to match server\n", val);
+                       set_io_timeout(val);
+               }
+               break;
+       case MSG_NOOP:
+               if (am_sender)
+                       maybe_send_keepalive();
+               break;
+       case MSG_DELETED:
+               if (msg_bytes >= sizeof line) /* payload plus a '\0' must fit in line[] */
+                       goto overflow;
+               if (am_generator) { /* the generator just re-sends the name unchanged */
+                       memcpy(line, perform_io(msg_bytes, PIO_INPUT_AND_CONSUME), msg_bytes);
+                       send_msg(MSG_DELETED, line, msg_bytes, 1);
+                       break;
+               }
+#ifdef ICONV_OPTION
+               if (ic_recv != (iconv_t)-1) { /* NOTE(review): guard tests ic_recv but the conversion below uses ic_send -- confirm intended */
+                       xbuf outbuf, inbuf;
+                       char ibuf[512];
+                       int add_null = 0;
+                       int flags = ICB_INCLUDE_BAD | ICB_INIT;
+
+                       INIT_CONST_XBUF(outbuf, line);
+                       INIT_XBUF(inbuf, ibuf, 0, (size_t)-1);
+
+                       while (msg_bytes) { /* convert the name in chunks of at most sizeof ibuf bytes */
+                               size_t len = msg_bytes > sizeof ibuf - inbuf.len ? sizeof ibuf - inbuf.len : msg_bytes;
+                               memcpy(ibuf + inbuf.len, perform_io(len, PIO_INPUT_AND_CONSUME), len); /* append after any bytes carried over */
+                               inbuf.pos = 0;
+                               inbuf.len += len;
+                               if (!(msg_bytes -= len) && !ibuf[inbuf.len-1]) /* last chunk ends in '\0': strip it now, re-add after conversion */
+                                       inbuf.len--, add_null = 1;
+                               if (iconvbufs(ic_send, &inbuf, &outbuf, flags) < 0) {
+                                       if (errno == E2BIG) /* converted text does not fit in line[] */
+                                               goto overflow;
+                                       /* Buffer ended with an incomplete char, so move the
+                                        * bytes to the start of the buffer and continue. */
+                                       memmove(ibuf, ibuf + inbuf.pos, inbuf.len);
+                               }
+                               flags &= ~ICB_INIT; /* ICB_INIT applies to the first chunk only */
+                       }
+                       if (add_null) {
+                               if (outbuf.len == outbuf.size)
+                                       goto overflow;
+                               outbuf.buf[outbuf.len++] = '\0';
+                       }
+                       msg_bytes = outbuf.len; /* from here on msg_bytes is the converted length */
+               } else
+#endif
+                       memcpy(line, perform_io(msg_bytes, PIO_INPUT_AND_CONSUME), msg_bytes);
+               /* A directory name was sent with the trailing null */
+               if (msg_bytes > 0 && !line[msg_bytes-1])
+                       log_delete(line, S_IFDIR);
+               else {
+                       line[msg_bytes] = '\0';
+                       log_delete(line, S_IFREG);
+               }
+               break;
+       case MSG_SUCCESS:
+               if (msg_bytes != 4) {
+                 invalid_msg: /* shared error exit, also reached by goto from the other cases */
+                       rprintf(FERROR, "invalid multi-message %d:%lu [%s%s]\n",
+                               tag, (unsigned long)msg_bytes, who_am_i(),
+                               inc_recurse ? "/inc" : "");
+                       exit_cleanup(RERR_STREAMIO);
+               }
+               data = perform_io(4, PIO_INPUT_AND_CONSUME);
+               val = IVAL(data, 0);
+               if (am_generator)
+                       got_flist_entry_status(FES_SUCCESS, val);
+               else
+                       successful_send(val);
+               break;
+       case MSG_NO_SEND:
+               if (msg_bytes != 4)
+                       goto invalid_msg;
+               data = perform_io(4, PIO_INPUT_AND_CONSUME);
+               val = IVAL(data, 0);
+               if (am_generator)
+                       got_flist_entry_status(FES_NO_SEND, val);
+               else
+                       send_msg_int(MSG_NO_SEND, val); /* non-generator passes the value along */
+               break;
+       case MSG_ERROR_SOCKET:
+       case MSG_ERROR_UTF8:
+       case MSG_CLIENT:
+       case MSG_LOG:
+               if (!am_generator) /* these four tags are accepted only by the generator */
+                       goto invalid_msg;
+               if (tag == MSG_ERROR_SOCKET)
+                       msgs2stderr = 1;
+               /* FALL THROUGH */
+       case MSG_INFO:
+       case MSG_ERROR:
+       case MSG_ERROR_XFER:
+       case MSG_WARNING:
+               if (msg_bytes >= sizeof line) {
+                   overflow: /* shared error exit, also reached by goto from MSG_DELETED */
+                       rprintf(FERROR,
+                               "multiplexing overflow %d:%lu [%s%s]\n",
+                               tag, (unsigned long)msg_bytes, who_am_i(),
+                               inc_recurse ? "/inc" : "");
+                       exit_cleanup(RERR_STREAMIO);
+               }
+               memcpy(line, perform_io(msg_bytes, PIO_INPUT_AND_CONSUME), msg_bytes);
+               rwrite((enum logcode)tag, line, msg_bytes, !am_generator); /* the tag value doubles as the logcode */
+               if (first_message) { /* only the very first text message gets the --old-d check */
+                       if (list_only && !am_sender && tag == 1 && msg_bytes < sizeof line) {
+                               line[msg_bytes] = '\0';
+                               check_for_d_option_error(line);
+                       }
+                       first_message = 0;
+               }
+               break;
+       case MSG_ERROR_EXIT:
+               if (msg_bytes == 0) { /* empty form: exit with value 0 */
+                       if (!am_sender && !am_generator) {
+                               send_msg(MSG_ERROR_EXIT, "", 0, 0);
+                               io_flush(FULL_FLUSH);
+                       }
+                       val = 0;
+               } else if (msg_bytes == 4) { /* 4-byte form carries the exit value */
+                       data = perform_io(4, PIO_INPUT_AND_CONSUME);
+                       val = IVAL(data, 0);
+                       if (protocol_version >= 31) {
+                               if (am_generator)
+                                       send_msg_int(MSG_ERROR_EXIT, val);
+                               else
+                                       send_msg(MSG_ERROR_EXIT, "", 0, 0);
+                       }
+               } else
+                       goto invalid_msg;
+               /* Send a negative linenum so that we don't end up
+                * with a duplicate exit message. */
+               _exit_cleanup(val, __FILE__, 0 - __LINE__); /* NOTE(review): no break follows, so this presumably never returns -- confirm */
+       default:
+               rprintf(FERROR, "unexpected tag %d [%s%s]\n",
+                       tag, who_am_i(), inc_recurse ? "/inc" : "");
+               exit_cleanup(RERR_STREAMIO);
+       }
+}
+
+static void drain_multiplex_messages(void) /* Process the messages already sitting in the input buffer, discarding raw data between them. */
 {
-       while (len) {
-               int n = read_timeout(fd, buf, len);
-
-               buf += n;
-               len -= n;
+       while (IN_MULTIPLEXED && iobuf.in.len) {
+               if (iobuf.raw_input_ends_before) { /* pending raw data: skip over it */
+                       size_t raw_len = iobuf.raw_input_ends_before - iobuf.in.pos;
+                       iobuf.raw_input_ends_before = 0;
+                       if (raw_len >= iobuf.in.len) { /* raw data covers everything buffered: empty the buffer and stop */
+                               iobuf.in.len = 0;
+                               break;
+                       }
+                       iobuf.in.pos += raw_len; /* NOTE(review): no wrap handling here, unlike the circular output buffer -- confirm in.pos cannot pass the end */
+                       iobuf.in.len -= raw_len;
+               }
+               read_a_msg();
        }
 }
 
-/**
- * Read from the file descriptor handling multiplexing - return number
- * of bytes read.
- *
- * Never returns <= 0.
- */
-static int readfd_unbuffered(int fd, char *buf, size_t len)
+void wait_for_receiver(void) /* Handle one incoming message and, if raw data is then pending, one ndx value (and any file list it announces). */
 {
-       size_t msg_bytes;
-       int tag, cnt = 0;
-       char line[BIGPATHBUFLEN];
-
-       if (!iobuf_in || fd != iobuf_f_in)
-               return read_timeout(fd, buf, len);
-
-       if (!io_multiplexing_in && iobuf_in_remaining == 0) {
-               iobuf_in_remaining = read_timeout(fd, iobuf_in, iobuf_in_siz);
-               iobuf_in_ndx = 0;
-       }
-
-       while (cnt == 0) {
-               if (iobuf_in_remaining) {
-                       len = MIN(len, iobuf_in_remaining);
-                       memcpy(buf, iobuf_in + iobuf_in_ndx, len);
-                       iobuf_in_ndx += len;
-                       iobuf_in_remaining -= len;
-                       cnt = len;
-                       break;
-               }
-
-               read_loop(fd, line, 4);
-               tag = IVAL(line, 0);
-
-               msg_bytes = tag & 0xFFFFFF;
-               tag = (tag >> 24) - MPLEX_BASE;
-
-               switch (tag) {
-               case MSG_DATA:
-                       if (msg_bytes > iobuf_in_siz) {
-                               if (!(iobuf_in = realloc_array(iobuf_in, char,
-                                                              msg_bytes)))
-                                       out_of_memory("readfd_unbuffered");
-                               iobuf_in_siz = msg_bytes;
-                       }
-                       read_loop(fd, iobuf_in, msg_bytes);
-                       iobuf_in_remaining = msg_bytes;
-                       iobuf_in_ndx = 0;
-                       break;
-               case MSG_NOOP:
-                       if (am_sender)
-                               maybe_send_keepalive();
-                       break;
-               case MSG_IO_ERROR:
-                       if (msg_bytes != 4)
-                               goto invalid_msg;
-                       read_loop(fd, line, msg_bytes);
-                       io_error |= IVAL(line, 0);
-                       break;
-               case MSG_DELETED:
-                       if (msg_bytes >= sizeof line)
-                               goto overflow;
-                       read_loop(fd, line, msg_bytes);
-                       /* A directory name was sent with the trailing null */
-                       if (msg_bytes > 0 && !line[msg_bytes-1])
-                               log_delete(line, S_IFDIR);
-                       else {
-                               line[msg_bytes] = '\0';
-                               log_delete(line, S_IFREG);
-                       }
-                       break;
-               case MSG_SUCCESS:
-                       if (msg_bytes != 4) {
-                         invalid_msg:
-                               rprintf(FERROR, "invalid multi-message %d:%ld [%s]\n",
-                                       tag, (long)msg_bytes, who_am_i());
+       if (!iobuf.raw_input_ends_before) /* no raw data pending: process one message */
+               read_a_msg();
+
+       if (iobuf.raw_input_ends_before) { /* raw data is pending (possibly just announced by that message) */
+               int ndx = read_int(iobuf.in_fd);
+               if (ndx < 0) { /* negative values are control codes, not directory indexes */
+                       switch (ndx) {
+                       case NDX_FLIST_EOF:
+                               flist_eof = 1;
+                               if (DEBUG_GTE(FLIST, 3))
+                                       rprintf(FINFO, "[%s] flist_eof=1\n", who_am_i());
+                               break;
+                       case NDX_DONE:
+                               msgdone_cnt++;
+                               break;
+                       default: /* any other negative value is a stream error */
                                exit_cleanup(RERR_STREAMIO);
                        }
-                       read_loop(fd, line, msg_bytes);
-                       successful_send(IVAL(line, 0));
-                       break;
-               case MSG_NO_SEND:
-                       if (msg_bytes != 4)
-                               goto invalid_msg;
-                       read_loop(fd, line, msg_bytes);
-                       send_msg_int(MSG_NO_SEND, IVAL(line, 0));
-                       break;
-               case MSG_INFO:
-               case MSG_ERROR:
-                       if (msg_bytes >= sizeof line) {
-                           overflow:
-                               rprintf(FERROR,
-                                       "multiplexing overflow %d:%ld [%s]\n",
-                                       tag, (long)msg_bytes, who_am_i());
-                               exit_cleanup(RERR_STREAMIO);
+               } else { /* ndx >= 0: a file list for directory ndx follows */
+                       struct file_list *flist;
+                       if (DEBUG_GTE(FLIST, 2)) {
+                               rprintf(FINFO, "[%s] receiving flist for dir %d\n",
+                                       who_am_i(), ndx);
                        }
-                       read_loop(fd, line, msg_bytes);
-                       rwrite((enum logcode)tag, line, msg_bytes);
-                       break;
-               default:
-                       rprintf(FERROR, "unexpected tag %d [%s]\n",
-                               tag, who_am_i());
-                       exit_cleanup(RERR_STREAMIO);
+                       flist = recv_file_list(iobuf.in_fd);
+                       flist->parent_ndx = ndx; /* record which directory this list belongs to */
+#ifdef SUPPORT_HARD_LINKS
+                       if (preserve_hard_links)
+                               match_hard_links(flist);
+#endif
                }
        }
-
-       if (iobuf_in_remaining == 0)
-               io_flush(NORMAL_FLUSH);
-
-       return cnt;
-}
-
-/* Do a buffered read from fd.  Don't return until all N bytes have
- * been read.  If all N can't be read then exit with an error. */
-static void readfd(int fd, char *buffer, size_t N)
-{
-       int  cnt;
-       size_t total = 0;
-
-       while (total < N) {
-               cnt = readfd_unbuffered(fd, buffer + total, N-total);
-               total += cnt;
-       }
-
-       if (fd == write_batch_monitor_in) {
-               if ((size_t)write(batch_fd, buffer, total) != total)
-                       exit_cleanup(RERR_FILEIO);
-       }
-
-       if (fd == flist_forward_from)
-               writefd(iobuf_f_out, buffer, total);
-
-       if (fd == sock_f_in)
-               stats.total_read += total;
 }
 
 unsigned short read_shortint(int f)
 {
        char b[2];
-       readfd(f, b, 2);
+       read_buf(f, b, 2); /* two bytes; b[0] is the low byte, b[1] the high byte */
        return (UVAL(b, 1) << 8) + UVAL(b, 0);
 }
 
@@ -983,7 +1550,7 @@ int32 read_int(int f)
        char b[4];
        int32 num;
 
-       readfd(f, b, 4);
+       read_buf(f, b, 4);
        num = IVAL(b, 0);
 #if SIZEOF_INT32 > 4
        if (num & (int32)0x80000000)
@@ -992,83 +1559,156 @@ int32 read_int(int f)
        return num;
 }
 
-int64 read_longint(int f)
+int32 read_varint(int f) /* Read a variable-length int32: one lead byte plus the extra bytes its top bits call for. */
 {
-       int64 num;
-       char b[9];
+       union {
+               char b[5];
+               int32 x;
+       } u;
+       uchar ch;
+       int extra;
 
-       if (protocol_version < 30) {
-               num = read_int(f);
+       u.x = 0;
+       ch = read_byte(f);
+       extra = int_byte_extra[ch / 4]; /* table lookup on the top 6 bits gives the count of following bytes */
+       if (extra) {
+               uchar bit = ((uchar)1<<(8-extra)); /* bit-1 masks off the lead byte's top "extra" bits */
+               if (extra >= (int)sizeof u.b) { /* would not fit in the 5-byte scratch area */
+                       rprintf(FERROR, "Overflow in read_varint()\n");
+                       exit_cleanup(RERR_STREAMIO);
+               }
+               read_buf(f, u.b, extra);
+               u.b[extra] = ch & (bit-1); /* remaining lead-byte bits are stored after the extra bytes */
+       } else
+               u.b[0] = ch; /* single-byte value */
+#if CAREFUL_ALIGNMENT
+       u.x = IVAL(u.b,0);
+#endif
+#if SIZEOF_INT32 > 4
+       if (u.x & (int32)0x80000000) /* sign-extend when int32 is wider than 32 bits */
+               u.x |= ~(int32)0xffffffff;
+#endif
+       return u.x; /* NOTE(review): without CAREFUL_ALIGNMENT this reads u.b through the union, which looks like it assumes little-endian layout -- confirm */
+}
 
-               if ((int32)num != (int32)0xffffffff)
-                       return num;
+int64 read_varlong(int f, uchar min_bytes) /* Read a variable-length int64 that always occupies at least min_bytes bytes. */
+{
+       union {
+               char b[9];
+               int64 x;
+       } u;
+       char b2[8]; /* NOTE(review): read_buf() below writes min_bytes bytes here, so this assumes min_bytes <= 8 -- confirm callers */
+       int extra;
 
 #if SIZEOF_INT64 < 8
-               rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
-               exit_cleanup(RERR_UNSUPPORTED);
+       memset(u.b, 0, 8);
 #else
-               readfd(f, b, 8);
-               num = IVAL(b,0) | (((int64)IVAL(b,4))<<32);
+       u.x = 0;
 #endif
-       } else {
-               int cnt;
-               readfd(f, b, 3);
-               cnt = int_byte_cnt[CVAL(b, 0) / 4];
+       read_buf(f, b2, min_bytes); /* lead byte plus the min_bytes-1 bytes that are always present */
+       memcpy(u.b, b2+1, min_bytes-1); /* the bytes after the lead byte go to the start of the value */
+       extra = int_byte_extra[CVAL(b2, 0) / 4]; /* table lookup on the lead byte's top 6 bits */
+       if (extra) {
+               uchar bit = ((uchar)1<<(8-extra)); /* bit-1 masks off the lead byte's top "extra" bits */
+               if (min_bytes + extra > (int)sizeof u.b) { /* would not fit in the 9-byte scratch area */
+                       rprintf(FERROR, "Overflow in read_varlong()\n");
+                       exit_cleanup(RERR_STREAMIO);
+               }
+               read_buf(f, u.b + min_bytes - 1, extra);
+               u.b[min_bytes + extra - 1] = CVAL(b2, 0) & (bit-1); /* remaining lead-byte bits are stored last */
 #if SIZEOF_INT64 < 8
-               if (cnt > 5 || (cnt == 5 && (CVAL(b,0)&0x3F || CVAL(b,1)&0x80))) {
+               if (min_bytes + extra > 5 || u.b[4] || CVAL(u.b,3) & 0x80) { /* value needs more than 31 bits */
                        rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
                        exit_cleanup(RERR_UNSUPPORTED);
                }
 #endif
-               if (cnt > 3)
-                       readfd(f, b + 3, cnt - 3);
-               switch (cnt) {
-               case 3:
-                       num = NVAL3(b, 0);
-                       break;
-               case 4:
-                       num = NVAL4(b, 0x80);
-                       break;
-               case 5:
-                       num = NVAL5(b, 0xC0);
-                       break;
+       } else
+               u.b[min_bytes + extra - 1] = CVAL(b2, 0); /* extra is 0 here: the whole lead byte is stored last */
+#if SIZEOF_INT64 < 8
+       u.x = IVAL(u.b,0);
+#elif CAREFUL_ALIGNMENT
+       u.x = IVAL(u.b,0) | (((int64)IVAL(u.b,4))<<32);
+#endif
+       return u.x;
+}
+
+int64 read_longint(int f) /* Read a 4-byte int; the value 0xffffffff means an 8-byte value follows. */
+{
 #if SIZEOF_INT64 >= 8
-               case 6:
-                       num = NVAL6(b, 0xE0);
-                       break;
-               case 7:
-                       num = NVAL7(b, 0xF0);
-                       break;
-               case 8:
-                       num = NVAL8(b, 0xF8);
-                       break;
-               case 9:
-                       num = NVAL8(b+1, 0);
-                       break;
+       char b[9];
 #endif
-               default:
-                       exit_cleanup(RERR_PROTOCOL); /* impossible... */
-               }
-       }
+       int32 num = read_int(f);
 
-       return num;
+       if (num != (int32)0xffffffff) /* ordinary case: the 32-bit value is the result */
+               return num;
+
+#if SIZEOF_INT64 < 8
+       rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
+       exit_cleanup(RERR_UNSUPPORTED);
+#else
+       read_buf(f, b, 8); /* only 8 of b's 9 bytes are used */
+       return IVAL(b,0) | (((int64)IVAL(b,4))<<32); /* low 32 bits first, then the high 32 bits */
+#endif
 }
 
 void read_buf(int f, char *buf, size_t len)
 {
-       readfd(f,buf,len);
+       if (f != iobuf.in_fd) { /* not the buffered input fd: read it directly */
+               if (safe_read(f, buf, len) != len)
+                       whine_about_eof(False); /* Doesn't return. */
+               goto batch_copy;
+       }
+
+       if (!IN_MULTIPLEXED) { /* buffered but not multiplexed: take len bytes in one step */
+               memcpy(buf, perform_io(len, PIO_INPUT_AND_CONSUME), len);
+               total_data_read += len;
+               if (forward_flist_data)
+                       write_buf(iobuf.out_fd, buf, len);
+         batch_copy:
+               if (f == write_batch_monitor_in)
+                       safe_write(batch_fd, buf, len); /* NOTE(review): result is not checked here -- confirm safe_write() handles failures itself */
+               return;
+       }
+
+       while (1) { /* multiplexed: gather len bytes across as many MSG_DATA messages as needed */
+               char *data;
+               size_t siz;
+
+               while (!iobuf.raw_input_ends_before) /* handle messages until raw data is pending */
+                       read_a_msg();
+
+               siz = MIN(len, iobuf.raw_input_ends_before - iobuf.in.pos); /* never read past the end of the current data message */
+               data = perform_io(siz, PIO_INPUT_AND_CONSUME);
+               if (iobuf.in.pos == iobuf.raw_input_ends_before) /* this data message is now fully consumed */
+                       iobuf.raw_input_ends_before = 0;
+
+               /* The bytes at the "data" pointer will survive long
+                * enough to make a copy, but not past future I/O. */
+               memcpy(buf, data, siz);
+               total_data_read += siz;
+
+               if (forward_flist_data)
+                       write_buf(iobuf.out_fd, buf, siz);
+
+               if (f == write_batch_monitor_in)
+                       safe_write(batch_fd, buf, siz); /* NOTE(review): result is not checked here either */
+
+               if ((len -= siz) == 0)
+                       break;
+               buf += siz;
+       }
 }
 
 void read_sbuf(int f, char *buf, size_t len)
 {
-       readfd(f, buf, len);
+       read_buf(f, buf, len); /* buf needs room for len+1 bytes: a '\0' is stored at buf[len] next */
        buf[len] = '\0';
 }
 
 uchar read_byte(int f)
 {
        uchar c;
-       readfd(f, (char *)&c, 1);
+       read_buf(f, (char*)&c, 1); /* exactly one byte, via read_buf() */
        return c;
 }
 
@@ -1086,7 +1726,7 @@ int read_vstring(int f, char *buf, int bufsize)
        }
 
        if (len)
-               readfd(f, buf, len);
+               read_buf(f, buf, len);
        buf[len] = '\0';
        return len;
 }
@@ -1095,6 +1735,7 @@ int read_vstring(int f, char *buf, int bufsize)
  * called by both the sender and the receiver. */
 void read_sum_head(int f, struct sum_struct *sum)
 {
+       int32 max_blength = protocol_version < 30 ? OLD_MAX_BLOCK_SIZE : MAX_BLOCK_SIZE;
        sum->count = read_int(f);
        if (sum->count < 0) {
                rprintf(FERROR, "Invalid checksum count %ld [%s]\n",
@@ -1102,13 +1743,13 @@ void read_sum_head(int f, struct sum_struct *sum)
                exit_cleanup(RERR_PROTOCOL);
        }
        sum->blength = read_int(f);
-       if (sum->blength < 0 || sum->blength > MAX_BLOCK_SIZE) {
+       if (sum->blength < 0 || sum->blength > max_blength) {
                rprintf(FERROR, "Invalid block length %ld [%s]\n",
                        (long)sum->blength, who_am_i());
                exit_cleanup(RERR_PROTOCOL);
        }
        sum->s2length = protocol_version < 27 ? csum_length : (int)read_int(f);
-       if (sum->s2length < 0 || sum->s2length > MD4_SUM_LENGTH) {
+       if (sum->s2length < 0 || sum->s2length > MAX_DIGEST_LEN) {
                rprintf(FERROR, "Invalid checksum length %d [%s]\n",
                        sum->s2length, who_am_i());
                exit_cleanup(RERR_PROTOCOL);
@@ -1138,8 +1779,7 @@ void write_sum_head(int f, struct sum_struct *sum)
        write_int(f, sum->remainder);
 }
 
-/**
- * Sleep after writing to limit I/O bandwidth usage.
+/* Sleep after writing to limit I/O bandwidth usage.
  *
  * @todo Rather than sleeping after each write, it might be better to
  * use some kind of averaging.  The current algorithm seems to always
@@ -1152,8 +1792,7 @@ void write_sum_head(int f, struct sum_struct *sum)
  * round small waits up to guarantee that we actually wait at least the
  * requested number of microseconds, this can become grossly inaccurate.
  * We therefore keep track of the bytes we've written over time and only
- * sleep when the accumulated delay is at least 1 tenth of a second.
- **/
+ * sleep when the accumulated delay is at least 1 tenth of a second. */
 static void sleep_for_bwlimit(int bytes_written)
 {
        static struct timeval prior_tv;
@@ -1163,9 +1802,6 @@ static void sleep_for_bwlimit(int bytes_written)
 
 #define ONE_SEC        1000000L /* # of microseconds in a second */
 
-       if (!bwlimit_writemax)
-               return;
-
        total_written += bytes_written;
 
        gettimeofday(&start_tv, NULL);
@@ -1193,214 +1829,85 @@ static void sleep_for_bwlimit(int bytes_written)
        total_written = (sleep_usec - elapsed_usec) * bwlimit / (ONE_SEC/1024);
 }
 
-/* Write len bytes to the file descriptor fd, looping as necessary to get
- * the job done and also (in certain circumstances) reading any data on
- * msg_fd_in to avoid deadlock.
- *
- * This function underlies the multiplexing system.  The body of the
- * application never calls this function directly. */
-static void writefd_unbuffered(int fd, const char *buf, size_t len)
+void io_flush(int flush_it_all)
 {
-       size_t n, total = 0;
-       fd_set w_fds, r_fds, e_fds;
-       int maxfd, count, cnt, using_r_fds;
-       int defer_save = defer_forwarding_messages;
-       struct timeval tv;
-
-       no_flush++;
-
-       while (total < len) {
-               FD_ZERO(&w_fds);
-               FD_SET(fd, &w_fds);
-               FD_ZERO(&e_fds);
-               FD_SET(fd, &e_fds);
-               maxfd = fd;
-
-               if (msg_fd_in >= 0) {
-                       FD_ZERO(&r_fds);
-                       FD_SET(msg_fd_in, &r_fds);
-                       if (msg_fd_in > maxfd)
-                               maxfd = msg_fd_in;
-                       using_r_fds = 1;
-               } else
-                       using_r_fds = 0;
-
-               tv.tv_sec = select_timeout;
-               tv.tv_usec = 0;
-
-               errno = 0;
-               count = select(maxfd + 1, using_r_fds ? &r_fds : NULL,
-                              &w_fds, &e_fds, &tv);
-
-               if (count <= 0) {
-                       if (count < 0 && errno == EBADF)
-                               exit_cleanup(RERR_SOCKETIO);
-                       check_timeout();
-                       continue;
-               }
-
-               if (FD_ISSET(fd, &e_fds)) {
-                       rsyserr(FINFO, errno,
-                               "select exception on fd %d", fd);
-               }
-
-               if (using_r_fds && FD_ISSET(msg_fd_in, &r_fds))
-                       read_msg_fd();
-
-               if (!FD_ISSET(fd, &w_fds))
-                       continue;
-
-               n = len - total;
-               if (bwlimit_writemax && n > bwlimit_writemax)
-                       n = bwlimit_writemax;
-               cnt = write(fd, buf + total, n);
-
-               if (cnt <= 0) {
-                       if (cnt < 0) {
-                               if (errno == EINTR)
-                                       continue;
-                               if (errno == EWOULDBLOCK || errno == EAGAIN) {
-                                       msleep(1);
-                                       continue;
-                               }
-                       }
-
-                       /* Don't try to write errors back across the stream. */
-                       if (fd == sock_f_out)
-                               io_end_multiplex_out();
-                       rsyserr(FERROR, errno,
-                               "writefd_unbuffered failed to write %ld bytes [%s]",
-                               (long)len, who_am_i());
-                       /* If the other side is sending us error messages, try
-                        * to grab any messages they sent before they died. */
-                       while (fd == sock_f_out && io_multiplexing_in) {
-                               set_io_timeout(30);
-                               ignore_timeout = 0;
-                               readfd_unbuffered(sock_f_in, io_filesfrom_buf,
-                                                 sizeof io_filesfrom_buf);
-                       }
-                       exit_cleanup(RERR_STREAMIO);
-               }
-
-               total += cnt;
-               defer_forwarding_messages = 1;
-
-               if (fd == sock_f_out) {
-                       if (io_timeout || am_generator)
-                               last_io_out = time(NULL);
-                       sleep_for_bwlimit(cnt);
-               }
+       if (iobuf.out.len > iobuf.out_empty_len) {
+               if (flush_it_all) /* FULL_FLUSH: flush everything in the output buffers */
+                       perform_io(iobuf.out.size - iobuf.out_empty_len, PIO_NEED_OUTROOM);
+               else /* NORMAL_FLUSH: flush at least 1 byte */
+                       perform_io(iobuf.out.size - iobuf.out.len + 1, PIO_NEED_OUTROOM);
        }
-
-       defer_forwarding_messages = defer_save;
-       no_flush--;
+       if (iobuf.msg.len)
+               perform_io(iobuf.msg.size, PIO_NEED_MSGROOM);
 }
 
-static void msg2sndr_flush(void)
+void write_shortint(int f, unsigned short x)
 {
-       if (defer_forwarding_messages)
-               return;
-
-       while (msg2sndr.head && io_multiplexing_out) {
-               struct msg_list_item *m = msg2sndr.head;
-               if (!(msg2sndr.head = m->next))
-                       msg2sndr.tail = NULL;
-               stats.total_written += m->len;
-               defer_forwarding_messages = 1;
-               writefd_unbuffered(sock_f_out, m->buf, m->len);
-               defer_forwarding_messages = 0;
-               free(m);
-       }
+       char b[2];
+       b[0] = (char)x;
+       b[1] = (char)(x >> 8);
+       write_buf(f, b, 2);
 }
 
-/**
- * Write an message to a multiplexed stream. If this fails then rsync
- * exits.
- **/
-static void mplex_write(enum msgcode code, const char *buf, size_t len)
+void write_int(int f, int32 x)
 {
-       char buffer[1024];
-       size_t n = len;
-
-       SIVAL(buffer, 0, ((MPLEX_BASE + (int)code)<<24) + len);
-
-       if (n > sizeof buffer - 4)
-               n = 0;
-       else
-               memcpy(buffer + 4, buf, n);
-
-       writefd_unbuffered(sock_f_out, buffer, n+4);
-
-       len -= n;
-       buf += n;
-
-       if (len) {
-               defer_forwarding_messages = 1;
-               writefd_unbuffered(sock_f_out, buf, len);
-               defer_forwarding_messages = 0;
-               msg2sndr_flush();
-       }
+       char b[4];
+       SIVAL(b, 0, x);
+       write_buf(f, b, 4);
 }
 
-void io_flush(int flush_it_all)
+void write_varint(int f, int32 x)
 {
-       if (flush_it_all) {
-               msg2genr_flush();
-               msg2sndr_flush();
-       }
+       char b[5];
+       uchar bit;
+       int cnt = 4;
 
-       if (!iobuf_out_cnt || no_flush)
-               return;
+       SIVAL(b, 1, x);
 
-       if (io_multiplexing_out)
-               mplex_write(MSG_DATA, iobuf_out, iobuf_out_cnt);
+       while (cnt > 1 && b[cnt] == 0)
+               cnt--;
+       bit = ((uchar)1<<(7-cnt+1));
+       if (CVAL(b, cnt) >= bit) {
+               cnt++;
+               *b = ~(bit-1);
+       } else if (cnt > 1)
+               *b = b[cnt] | ~(bit*2-1);
        else
-               writefd_unbuffered(iobuf_f_out, iobuf_out, iobuf_out_cnt);
-       iobuf_out_cnt = 0;
+               *b = b[cnt];
+
+       write_buf(f, b, cnt);
 }
 
-static void writefd(int fd, const char *buf, size_t len)
+void write_varlong(int f, int64 x, uchar min_bytes)
 {
-       if (fd == sock_f_out)
-               stats.total_written += len;
-
-       if (fd == write_batch_monitor_out) {
-               if ((size_t)write(batch_fd, buf, len) != len)
-                       exit_cleanup(RERR_FILEIO);
-       }
-
-       if (!iobuf_out || fd != iobuf_f_out) {
-               writefd_unbuffered(fd, buf, len);
-               return;
-       }
-
-       while (len) {
-               int n = MIN((int)len, IO_BUFFER_SIZE - iobuf_out_cnt);
-               if (n > 0) {
-                       memcpy(iobuf_out+iobuf_out_cnt, buf, n);
-                       buf += n;
-                       len -= n;
-                       iobuf_out_cnt += n;
-               }
+       char b[9];
+       uchar bit;
+       int cnt = 8;
 
-               if (iobuf_out_cnt == IO_BUFFER_SIZE)
-                       io_flush(NORMAL_FLUSH);
+       SIVAL(b, 1, x);
+#if SIZEOF_INT64 >= 8
+       SIVAL(b, 5, x >> 32);
+#else
+       if (x <= 0x7FFFFFFF && x >= 0)
+               memset(b + 5, 0, 4);
+       else {
+               rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
+               exit_cleanup(RERR_UNSUPPORTED);
        }
-}
+#endif
 
-void write_shortint(int f, unsigned short x)
-{
-       char b[2];
-       b[0] = (char)x;
-       b[1] = (char)(x >> 8);
-       writefd(f, b, 2);
-}
+       while (cnt > min_bytes && b[cnt] == 0)
+               cnt--;
+       bit = ((uchar)1<<(7-cnt+min_bytes));
+       if (CVAL(b, cnt) >= bit) {
+               cnt++;
+               *b = ~(bit-1);
+       } else if (cnt > min_bytes)
+               *b = b[cnt] | ~(bit*2-1);
+       else
+               *b = b[cnt];
 
-void write_int(int f, int32 x)
-{
-       char b[4];
-       SIVAL(b, 0, x);
-       writefd(f, b, 4);
+       write_buf(f, b, cnt);
 }
 
 /*
@@ -1409,117 +1916,64 @@ void write_int(int f, int32 x)
  */
 void write_longint(int f, int64 x)
 {
-       char b[12];
+       char b[12], * const s = b+4;
 
-#if SIZEOF_INT64 < 8
-       if (x < 0 || x > 0x7FFFFFFF) {
-               rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
-               exit_cleanup(RERR_UNSUPPORTED);
+       SIVAL(s, 0, x);
+       if (x <= 0x7FFFFFFF && x >= 0) {
+               write_buf(f, s, 4);
+               return;
        }
-#endif
-
-       if (protocol_version < 30) {
-               char * const s = b+4;
-               SIVAL(s, 0, x);
-#if SIZEOF_INT64 < 8
-               writefd(f, s, 4);
-#else
-               if (x <= 0x7FFFFFFF && x >= 0) {
-                       writefd(f, s, 4);
-                       return;
-               }
 
-               memset(b, 0xFF, 4);
-               SIVAL(s, 4, x >> 32);
-               writefd(f, b, 12);
-       } else if (x < 0) {
-               goto all_bits;
-#endif
-       } else if (x < ((int32)1<<(3*8-1))) {
-               b[0] = (char)(x >> 16);
-               b[1] = (char)(x >> 8);
-               b[2] = (char)x;
-               writefd(f, b, 3);
-       } else if (x < ((int64)1<<(4*8-2))) {
-               b[0] = (char)((x >> 24) | 0x80);
-               b[1] = (char)(x >> 16);
-               b[2] = (char)(x >> 8);
-               b[3] = (char)x;
-               writefd(f, b, 4);
 #if SIZEOF_INT64 < 8
-       } else {
-               b[0] = 0xC0;
-               b[1] = (char)(x >> 24);
-               b[2] = (char)(x >> 16);
-               b[3] = (char)(x >> 8);
-               b[4] = (char)x;
-               writefd(f, b, 5);
-       }
+       rprintf(FERROR, "Integer overflow: attempted 64-bit offset\n");
+       exit_cleanup(RERR_UNSUPPORTED);
 #else
-       } else if (x < ((int64)1<<(5*8-3))) {
-               b[0] = (char)((x >> 32) | 0xC0);
-               b[1] = (char)(x >> 24);
-               b[2] = (char)(x >> 16);
-               b[3] = (char)(x >> 8);
-               b[4] = (char)x;
-               writefd(f, b, 5);
-       } else if (x < ((int64)1<<(6*8-4))) {
-               b[0] = (char)((x >> 40) | 0xE0);
-               b[1] = (char)(x >> 32);
-               b[2] = (char)(x >> 24);
-               b[3] = (char)(x >> 16);
-               b[4] = (char)(x >> 8);
-               b[5] = (char)x;
-               writefd(f, b, 6);
-       } else if (x < ((int64)1<<(7*8-5))) {
-               b[0] = (char)((x >> 48) | 0xF0);
-               b[1] = (char)(x >> 40);
-               b[2] = (char)(x >> 32);
-               b[3] = (char)(x >> 24);
-               b[4] = (char)(x >> 16);
-               b[5] = (char)(x >> 8);
-               b[6] = (char)x;
-               writefd(f, b, 7);
-       } else if (x < ((int64)1<<(8*8-6))) {
-               b[0] = (char)((x >> 56) | 0xF8);
-               b[1] = (char)(x >> 48);
-               b[2] = (char)(x >> 40);
-               b[3] = (char)(x >> 32);
-               b[4] = (char)(x >> 24);
-               b[5] = (char)(x >> 16);
-               b[6] = (char)(x >> 8);
-               b[7] = (char)x;
-               writefd(f, b, 8);
-       } else {
-         all_bits:
-               b[0] = (char)0xFC;
-               b[1] = (char)(x >> 56);
-               b[2] = (char)(x >> 48);
-               b[3] = (char)(x >> 40);
-               b[4] = (char)(x >> 32);
-               b[5] = (char)(x >> 24);
-               b[6] = (char)(x >> 16);
-               b[7] = (char)(x >> 8);
-               b[8] = (char)x;
-               writefd(f, b, 9);
-       }
+       memset(b, 0xFF, 4);
+       SIVAL(s, 4, x >> 32);
+       write_buf(f, b, 12);
 #endif
 }
 
 void write_buf(int f, const char *buf, size_t len)
 {
-       writefd(f,buf,len);
+       size_t pos, siz;
+
+       if (f != iobuf.out_fd) {
+               safe_write(f, buf, len);
+               goto batch_copy;
+       }
+
+       if (iobuf.out.len + len > iobuf.out.size)
+               perform_io(len, PIO_NEED_OUTROOM);
+
+       pos = iobuf.out.pos + iobuf.out.len; /* Must be set after any flushing. */
+       if (pos >= iobuf.out.size)
+               pos -= iobuf.out.size;
+
+       /* Handle a split copy if we wrap around the end of the circular buffer. */
+       if (pos >= iobuf.out.pos && (siz = iobuf.out.size - pos) < len) {
+               memcpy(iobuf.out.buf + pos, buf, siz);
+               memcpy(iobuf.out.buf, buf + siz, len - siz);
+       } else
+               memcpy(iobuf.out.buf + pos, buf, len);
+
+       iobuf.out.len += len;
+       total_data_written += len;
+
+  batch_copy:
+       if (f == write_batch_monitor_out)
+               safe_write(batch_fd, buf, len);
 }
 
-/** Write a string to the connection */
+/* Write a string to the connection */
 void write_sbuf(int f, const char *buf)
 {
-       writefd(f, buf, strlen(buf));
+       write_buf(f, buf, strlen(buf));
 }
 
 void write_byte(int f, uchar c)
 {
-       writefd(f, (char *)&c, 1);
+       write_buf(f, (char *)&c, 1);
 }
 
 void write_vstring(int f, const char *str, int len)
@@ -1537,9 +1991,9 @@ void write_vstring(int f, const char *str, int len)
        }
        *lb = len;
 
-       writefd(f, (char*)lenbuf, lb - lenbuf + 1);
+       write_buf(f, (char*)lenbuf, lb - lenbuf + 1);
        if (len)
-               writefd(f, str, len);
+               write_buf(f, str, len);
 }
 
 /* Send a file-list index using a byte-reduction method. */
@@ -1561,7 +2015,7 @@ void write_ndx(int f, int32 ndx)
                prev_positive = ndx;
        } else if (ndx == NDX_DONE) {
                *b = 0;
-               writefd(f, b, 1);
+               write_buf(f, b, 1);
                return;
        } else {
                b[cnt++] = (char)0xFF;
@@ -1578,15 +2032,15 @@ void write_ndx(int f, int32 ndx)
        else if (diff < 0 || diff > 0x7FFF) {
                b[cnt++] = (char)0xFE;
                b[cnt++] = (char)((ndx >> 24) | 0x80);
-               b[cnt++] = (char)(ndx >> 16);
-               b[cnt++] = (char)(ndx >> 8);
                b[cnt++] = (char)ndx;
+               b[cnt++] = (char)(ndx >> 8);
+               b[cnt++] = (char)(ndx >> 16);
        } else {
                b[cnt++] = (char)0xFE;
                b[cnt++] = (char)(diff >> 8);
                b[cnt++] = (char)diff;
        }
-       writefd(f, b, cnt);
+       write_buf(f, b, cnt);
 }
 
 /* Receive a file-list index using a byte-reduction method. */
@@ -1599,52 +2053,52 @@ int32 read_ndx(int f)
        if (protocol_version < 30)
                return read_int(f);
 
-       readfd(f, b, 1);
+       read_buf(f, b, 1);
        if (CVAL(b, 0) == 0xFF) {
-               readfd(f, b, 1);
+               read_buf(f, b, 1);
                prev_ptr = &prev_negative;
        } else if (CVAL(b, 0) == 0)
                return NDX_DONE;
        else
                prev_ptr = &prev_positive;
        if (CVAL(b, 0) == 0xFE) {
-               readfd(f, b, 2);
+               read_buf(f, b, 2);
                if (CVAL(b, 0) & 0x80) {
-                       readfd(f, b+2, 2);
-                       num = NVAL4(b, 0x80);
+                       b[3] = CVAL(b, 0) & ~0x80;
+                       b[0] = b[1];
+                       read_buf(f, b+1, 2);
+                       num = IVAL(b, 0);
                } else
-                       num = NVAL2(b, 0) + *prev_ptr;
+                       num = (UVAL(b,0)<<8) + UVAL(b,1) + *prev_ptr;
        } else
-               num = CVAL(b, 0) + *prev_ptr;
+               num = UVAL(b, 0) + *prev_ptr;
        *prev_ptr = num;
        if (prev_ptr == &prev_negative)
                num = -num;
        return num;
 }
 
-/**
- * Read a line of up to @p maxlen characters into @p buf (not counting
- * the trailing null).  Strips the (required) trailing newline and all
- * carriage returns.
- *
- * @return 1 for success; 0 for I/O error or truncation.
- **/
-int read_line(int f, char *buf, size_t maxlen)
+/* Read a line of up to bufsiz-1 characters into buf.  Strips
+ * the (required) trailing newline and all carriage returns.
+ * Returns 1 for success; 0 for I/O error or truncation. */
+int read_line_old(int fd, char *buf, size_t bufsiz)
 {
-       while (maxlen) {
-               buf[0] = 0;
-               read_buf(f, buf, 1);
-               if (buf[0] == 0)
+       bufsiz--; /* leave room for the null */
+       while (bufsiz > 0) {
+               assert(fd != iobuf.in_fd);
+               if (safe_read(fd, buf, 1) == 0)
                        return 0;
-               if (buf[0] == '\n')
+               if (*buf == '\0')
+                       return 0;
+               if (*buf == '\n')
                        break;
-               if (buf[0] != '\r') {
+               if (*buf != '\r') {
                        buf++;
-                       maxlen--;
+                       bufsiz--;
                }
        }
        *buf = '\0';
-       return maxlen > 0;
+       return bufsiz > 0;
 }
 
 void io_printf(int fd, const char *format, ...)
@@ -1658,54 +2112,75 @@ void io_printf(int fd, const char *format, ...)
        va_end(ap);
 
        if (len < 0)
-               exit_cleanup(RERR_STREAMIO);
+               exit_cleanup(RERR_PROTOCOL);
 
        if (len > (int)sizeof buf) {
                rprintf(FERROR, "io_printf() was too long for the buffer.\n");
-               exit_cleanup(RERR_STREAMIO);
+               exit_cleanup(RERR_PROTOCOL);
        }
 
        write_sbuf(fd, buf);
 }
 
-/** Setup for multiplexing a MSG_* stream with the data stream. */
-void io_start_multiplex_out(void)
+/* Setup for multiplexing a MSG_* stream with the data stream. */
+void io_start_multiplex_out(int fd)
 {
-       io_flush(NORMAL_FLUSH);
-       io_start_buffering_out(sock_f_out);
-       io_multiplexing_out = 1;
-}
+       io_flush(FULL_FLUSH);
 
-/** Setup for multiplexing a MSG_* stream with the data stream. */
-void io_start_multiplex_in(void)
-{
-       io_flush(NORMAL_FLUSH);
-       io_start_buffering_in(sock_f_in);
-       io_multiplexing_in = 1;
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_start_multiplex_out(%d)\n", who_am_i(), fd);
+
+       iobuf.out_empty_len = 4; /* See also OUT_MULTIPLEXED */
+       io_start_buffering_out(fd);
+
+       iobuf.raw_data_header_pos = iobuf.out.pos + iobuf.out.len;
+       iobuf.out.len += 4;
 }
 
-/** Write an message to the multiplexed data stream. */
-int io_multiplex_write(enum msgcode code, const char *buf, size_t len)
+/* Setup for multiplexing a MSG_* stream with the data stream. */
+void io_start_multiplex_in(int fd)
 {
-       if (!io_multiplexing_out)
-               return 0;
-       io_flush(NORMAL_FLUSH);
-       stats.total_written += (len+4);
-       mplex_write(code, buf, len);
-       return 1;
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_start_multiplex_in(%d)\n", who_am_i(), fd);
+
+       iobuf.in_multiplexed = True; /* See also IN_MULTIPLEXED */
+       io_start_buffering_in(fd);
 }
 
-void io_end_multiplex_in(void)
+int io_end_multiplex_in(int mode)
 {
-       io_multiplexing_in = 0;
-       io_end_buffering_in();
+       int ret = iobuf.in_multiplexed ? iobuf.in_fd : -1;
+
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_end_multiplex_in(mode=%d)\n", who_am_i(), mode);
+
+       iobuf.in_multiplexed = False;
+       if (mode == MPLX_SWITCHING)
+               iobuf.raw_input_ends_before = 0;
+       else
+               assert(iobuf.raw_input_ends_before == 0);
+       if (mode != MPLX_TO_BUFFERED)
+               io_end_buffering_in(mode);
+
+       return ret;
 }
 
-/** Stop output multiplexing. */
-void io_end_multiplex_out(void)
+int io_end_multiplex_out(int mode)
 {
-       io_multiplexing_out = 0;
-       io_end_buffering_out();
+       int ret = iobuf.out_empty_len ? iobuf.out_fd : -1;
+
+       if (msgs2stderr && DEBUG_GTE(IO, 2))
+               rprintf(FINFO, "[%s] io_end_multiplex_out(mode=%d)\n", who_am_i(), mode);
+
+       if (mode != MPLX_TO_BUFFERED)
+               io_end_buffering_out(mode);
+       else
+               io_flush(FULL_FLUSH);
+
+       iobuf.out.len = 0;
+       iobuf.out_empty_len = 0;
+
+       return ret;
 }
 
 void start_write_batch(int fd)
@@ -1716,6 +2191,8 @@ void start_write_batch(int fd)
         * actual communication so far depends on whether a daemon
         * is involved. */
        write_int(batch_fd, protocol_version);
+       if (protocol_version >= 30)
+               write_byte(batch_fd, inc_recurse);
        write_int(batch_fd, checksum_seed);
 
        if (am_sender)