libnsl/rpc/xdr_rec.c

	xdr_rec.c revision 7c478bd95313f5f23a4c958a745db2134aa03244
/*
 * CDDL HEADER START
 *
 * The contents of this file are subject to the terms of the
 * Common Development and Distribution License, Version 1.0 only
 * (the "License").  You may not use this file except in compliance
 * with the License.
 *
 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 * or http://www.opensolaris.org/os/licensing.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 *
 * When distributing Covered Code, include this CDDL HEADER in each
 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 * If applicable, add the following below this CDDL HEADER, with the
 * fields enclosed by brackets "[]" replaced with your own identifying
 * information: Portions Copyright [yyyy] [name of copyright owner]
 *
 * CDDL HEADER END
 */
/*
 * Copyright 2004 Sun Microsystems, Inc.  All rights reserved.
 * Use is subject to license terms.
 */
/* Copyright (c) 1983, 1984, 1985, 1986, 1987, 1988, 1989 AT&T */
/* All Rights Reserved */
/*
 * Portions of this source code were derived from Berkeley
 * 4.3 BSD under license from the Regents of the University of
 * California.
 */

#pragma ident   "%Z%%M% %I% %E% SMI"

/*
 * xdr_rec.c, Implements (TCP/IP based) XDR streams with a "record marking"
 * layer above connection oriented transport layer (e.g. tcp) (for rpc's use).
 *
 *
 * These routines interface XDRSTREAMS to a (tcp/ip) connection transport.
 * There is a record marking layer between the xdr stream
 * and the (tcp) cv transport level.  A record is composed of one or more
 * record fragments.  A record fragment is a thirty-two bit header followed
 * by n bytes of data, where n is contained in the header.  The header
 * is represented as a htonl(ulong_t).  The high order bit encodes
 * whether or not the fragment is the last fragment of the record
 * (1 => fragment is last, 0 => more fragments to follow).
 * The other 31 bits encode the byte length of the fragment.
 */

#include "mt.h"
#include "rpc_mt.h"
#include <stdio.h>
#include <rpc/types.h>
#include <rpc/rpc.h>
#include <sys/types.h>
#include <rpc/trace.h>
#include <syslog.h>
#include <memory.h>
#include <stdlib.h>
#include <unistd.h>
#include <inttypes.h>
#include <string.h>

/*
 * Forward declarations (old-style, without parameter lists) for routines
 * that are referenced in this file before their definitions appear.
 */
static uint_t   fix_buf_size();
static struct   xdr_ops *xdrrec_ops();
static bool_t   xdrrec_getbytes();
static bool_t   flush_out();
static bool_t   get_input_bytes();
static bool_t   set_input_fragment();
static bool_t   skip_input_bytes();

/* Declared without "static"; xdrrec_skiprecord() calls it for non-blocking streams. */
bool_t      __xdrrec_getbytes_nonblock();

/*
 * A record is composed of one or more record fragments.
 * A record fragment is a four-byte header followed by zero to
 * 2**31-1 bytes.  The header is treated as a long unsigned and is
 * encode/decoded to the network via htonl/ntohl.  The low order 31 bits
 * are a byte count of the fragment.  The highest order bit is a boolean:
 * 1 => this fragment is the last fragment of the record,
 * 0 => this fragment is followed by more fragment(s).
 *
 * The fragment/record machinery is not general;  it is constructed to
 * meet the needs of xdr and rpc based on tcp.
 */

/* Fragment-header flag (highest-order bit): set when the fragment ends the record. */
#define LAST_FRAG (((uint32_t)1 << 31))

/*
 * Minimum fragment size is size of rpc callmsg over TCP:
 * xid direction vers prog vers proc
 *   cred flavor, cred length, cred
 *   verf flavor, verf length, verf
 *   (with no cred or verf allocated)
 */
/* Ten XDR units: six fixed call fields plus flavor and length for cred and verf. */
#define MIN_FRAG    (10 * BYTES_PER_XDR_UNIT)

/*
 * Private state of a record-marking XDR stream.  xdrrec_create() allocates
 * one of these and stores it in the XDR handle's x_private field.
 */
typedef struct rec_strm {
    caddr_t tcp_handle; /* opaque handle passed as first argument to readit/writeit */
    /*
     * out-going bits
     */
    int (*writeit)();   /* transport write routine; called from flush_out() */
    caddr_t out_base;   /* output buffer (points to frag header) */
    caddr_t out_finger; /* next output position */
    caddr_t out_boundry;    /* end of output buffer; data may not extend past it */
    uint32_t *frag_header;  /* beginning of current fragment */
    bool_t frag_sent;   /* true if buffer sent in middle of record */
    /*
     * in-coming bits
     */
    int (*readit)();    /* transport read routine; called to fill the input buffer */
    caddr_t in_base;    /* input buffer */
    caddr_t in_finger;  /* location of next byte to be had */
    caddr_t in_boundry; /* can read up to this location */
    int fbtbc;      /* fragment bytes to be consumed */
    bool_t last_frag;   /* true if the current input fragment is the record's last */
    uint_t sendsize;    /* size of the output buffer, as adjusted by fix_buf_size() */
    uint_t recvsize;    /* current size of the input buffer */
    /*
     * Is this the first time that the
     * getbytes routine has been called ?
     */
    uint_t firsttime;
    /*
     * Is this non-blocked?
     */
    uint_t in_nonblock; /* non-blocked input */
    uint_t in_needpoll; /* need to poll to get more data ? */
    uint32_t in_maxrecsz;   /* maximum record size */
    caddr_t in_nextrec; /* start of next record */
    uint32_t in_nextrecsz;  /* part of next record in buffer */
} RECSTREAM;

/*
 * Create an xdr handle for xdrrec
 * xdrrec_create fills in xdrs.  Sendsize and recvsize are
 * send and recv buffer sizes (0 => use default).
 * vc_handle is an opaque handle that is passed as the first parameter to
 * the procedures readit and writeit.  Readit and writeit are read and
 * write respectively. They are like the system calls except that they
 * take an opaque handle rather than an fd.
 */

/* Text logged through syslog(LOG_ERR, ...) when a stream or buffer allocation fails. */
static const char mem_err_msg_rec[] = "xdrrec_create: out of memory";

void
xdrrec_create(XDR *xdrs, uint_t sendsize, uint_t recvsize, caddr_t tcp_handle,
    int (*readit)(), int (*writeit)())
{
    RECSTREAM *rstrm =
        (RECSTREAM *)mem_alloc(sizeof (RECSTREAM));

    /*
     * Initialize 'xdrs' as a record-marking stream on top of tcp_handle.
     *
     * sendsize/recvsize are the requested buffer sizes; both are passed
     * through fix_buf_size() before use.  readit/writeit are the transport
     * I/O callbacks and receive tcp_handle as their first argument.
     *
     * On any allocation failure the error is logged, everything allocated
     * so far is released, and the function returns with 'xdrs' untouched.
     *
     * XXX: Should still rework xdrrec_create to return a handle,
     * and in any malloc-failure case return NULL.
     */
    trace3(TR_xdrrec_create, 0, sendsize, recvsize);
    if (rstrm == NULL) {
        /* Always log through a literal format string. */
        (void) syslog(LOG_ERR, "%s", mem_err_msg_rec);
        trace1(TR_xdrrec_create, 1);
        return;
    }
    /*
     * Adjust sizes and allocate buffers; malloc(3C), for which mem_alloc
     * is a wrapper, provides a buffer suitably aligned for any use, so
     * there's no need for us to mess around with alignment.
     *
     * Since non-blocking connections may need to reallocate the input
     * buffer, we use separate mem_alloc()s for input and output.
     */
    rstrm->sendsize = sendsize = fix_buf_size(sendsize);
    rstrm->recvsize = recvsize = fix_buf_size(recvsize);
    rstrm->out_base = (caddr_t)mem_alloc(rstrm->sendsize);
    if (rstrm->out_base == NULL) {
        (void) syslog(LOG_ERR, "%s", mem_err_msg_rec);
        (void) mem_free((char *)rstrm, sizeof (RECSTREAM));
        trace1(TR_xdrrec_create, 1);
        return;
    }
    rstrm->in_base = (caddr_t)mem_alloc(rstrm->recvsize);
    if (rstrm->in_base == NULL) {
        (void) syslog(LOG_ERR, "%s", mem_err_msg_rec);
        (void) mem_free(rstrm->out_base, rstrm->sendsize);
        (void) mem_free((char *)rstrm, sizeof (RECSTREAM));
        trace1(TR_xdrrec_create, 1);
        return;
    }

    /*
     * now the rest ...
     */

    xdrs->x_ops = xdrrec_ops();
    xdrs->x_private = (caddr_t)rstrm;
    rstrm->tcp_handle = tcp_handle;
    rstrm->readit = readit;
    rstrm->writeit = writeit;

    /*
     * Output side: the first fragment header sits at the very start of
     * the buffer, and data begins right after it.
     */
    rstrm->frag_header = (uint32_t *)rstrm->out_base;
    rstrm->out_finger = rstrm->out_base + sizeof (uint32_t);
    rstrm->out_boundry = rstrm->out_base + sendsize;
    rstrm->frag_sent = FALSE;

    /*
     * Input side: finger == boundary, so the buffer starts out empty
     * and the first read has to fetch data from the transport.
     */
    rstrm->in_boundry = rstrm->in_base + recvsize;
    rstrm->in_finger = rstrm->in_boundry;
    rstrm->fbtbc = 0;
    rstrm->last_frag = TRUE;
    rstrm->firsttime = 0;
    rstrm->in_nonblock = 0;
    rstrm->in_needpoll = 1;
    rstrm->in_maxrecsz = 0;
    rstrm->in_nextrec = rstrm->in_base;
    rstrm->in_nextrecsz = 0;

    trace1(TR_xdrrec_create, 1);
}

/*
 * Align input stream.  If all applications behaved correctly, this
 * defensive procedure will not be necessary, since received data will be
 * aligned correctly.
 */
static void
align_instream(RECSTREAM *rstrm)
{
    /* Number of unread bytes currently held in the input buffer. */
    int current = rstrm->in_boundry - rstrm->in_finger;

    /*
     * Slide the unread bytes down to the start of the buffer.  in_finger
     * lies inside the buffer that begins at in_base, so source and
     * destination can overlap; memmove() is required here because
     * memcpy() has undefined behavior on overlapping regions.
     */
    (void) memmove(rstrm->in_base, rstrm->in_finger, current);
    rstrm->in_finger = rstrm->in_base;
    rstrm->in_boundry = rstrm->in_finger + current;
}

/*
 * The routines defined below are the xdr ops which will go into the
 * xdr handle filled in by xdrrec_create.
 */
static bool_t
xdrrec_getint32(XDR *xdrs, int32_t *ip)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    int32_t *src = (int32_t *)(rstrm->in_finger);
    int32_t raw;
    bool_t in_fragment, in_buffer;

    /*
     * Decode one 32-bit integer from the stream into *ip.
     * Returns TRUE on success, FALSE if the bytes could not be obtained.
     */
    trace1(TR_xdrrec_getint32, 0);

    /* Are four bytes available both in the fragment and in the buffer? */
    in_fragment = (rstrm->fbtbc >= (int)sizeof (int32_t));
    in_buffer = ((uint_t)(rstrm->in_boundry - (caddr_t)src) >=
        (uint_t)sizeof (int32_t));

    if (!(in_fragment && in_buffer)) {
        /* Slow path: let the generic byte reader assemble the value. */
        if (!xdrrec_getbytes(xdrs, &raw, sizeof (int32_t))) {
            trace1(TR_xdrrec_getint32_t, 1);
            return (FALSE);
        }
        *ip = (int32_t)ntohl((uint32_t)raw);
        trace1(TR_xdrrec_getint32, 1);
        return (TRUE);
    }

    /* Fast path: read straight out of the buffer, realigning it first if needed. */
    if (((uintptr_t)src) & ((int)sizeof (int32_t) - 1)) {
        align_instream(rstrm);
        src = (int32_t *)(rstrm->in_finger);
    }
    *ip = (int32_t)ntohl((uint32_t)(*src));
    rstrm->fbtbc -= (int)sizeof (int32_t);
    rstrm->in_finger += sizeof (int32_t);

    trace1(TR_xdrrec_getint32, 1);
    return (TRUE);
}

static bool_t
xdrrec_putint32(XDR *xdrs, int32_t *ip)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    int32_t *slot;

    /*
     * Encode *ip as one 32-bit integer in network byte order.
     * Returns FALSE only if the output buffer had to be flushed and
     * the flush failed.
     */
    trace1(TR_xdrrec_putint32, 0);
    if ((rstrm->out_finger + sizeof (int32_t)) > rstrm->out_boundry) {
        /*
         * No room left: ship what we have as a non-final fragment.
         * This should almost never happen.
         */
        rstrm->frag_sent = TRUE;
        if (! flush_out(rstrm, FALSE)) {
            trace1(TR_xdrrec_putint32_t, 1);
            return (FALSE);
        }
    }
    slot = (int32_t *)(rstrm->out_finger);
    rstrm->out_finger += sizeof (int32_t);
    *slot = (int32_t)htonl((uint32_t)(*ip));
    trace1(TR_xdrrec_putint32, 1);
    return (TRUE);
}

static bool_t
xdrrec_getlong(XDR *xdrs, long *lp)
{
    int32_t val32;

    /* A long travels as 32 bits on the wire; widen it after decoding. */
    if (xdrrec_getint32(xdrs, &val32)) {
        *lp = (long)val32;
        return (TRUE);
    }
    return (FALSE);
}

static bool_t
xdrrec_putlong(XDR *xdrs, long *lp)
{
    int32_t narrowed;

#if defined(_LP64)
    /* On 64-bit builds, refuse values that do not fit in 32 bits. */
    if (!((*lp <= INT32_MAX) && (*lp >= INT32_MIN))) {
        return (FALSE);
    }
#endif

    narrowed = (int32_t)*lp;
    return (xdrrec_putint32(xdrs, &narrowed));
}

static bool_t   /* must manage buffers, fragments, and records */
xdrrec_getbytes(XDR *xdrs, caddr_t addr, int len)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    int chunk;

    /*
     * Copy exactly 'len' bytes of record data to 'addr', crossing
     * fragment boundaries as needed.  Fails if the record ends first.
     */
    trace2(TR_xdrrec_getbytes, 0, len);
    while (len > 0) {
        if (rstrm->fbtbc == 0) {
            /*
             * Current fragment is used up.  Give up if it was the
             * last one, otherwise read the next fragment header.
             */
            if (rstrm->last_frag || ! set_input_fragment(rstrm)) {
                trace1(TR_xdrrec_getbytes, 1);
                return (FALSE);
            }
            continue;
        }
        /* Take no more than what remains in this fragment. */
        chunk = (rstrm->fbtbc > len) ? len : rstrm->fbtbc;
        if (! get_input_bytes(rstrm, addr, chunk, FALSE)) {
            trace1(TR_xdrrec_getbytes, 1);
            return (FALSE);
        }
        rstrm->fbtbc -= chunk;
        addr += chunk;
        len -= chunk;
    }
    trace1(TR_xdrrec_getbytes, 1);
    return (TRUE);
}

static bool_t
xdrrec_putbytes(XDR *xdrs, caddr_t addr, int len)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    int room, chunk;

    /*
     * Append 'len' bytes from 'addr' to the output buffer, flushing a
     * non-final fragment each time the buffer becomes full.
     */
    trace2(TR_xdrrec_putbytes, 0, len);
    while (len > 0) {
        /* Space left between the write position and the buffer end. */
        room = (uintptr_t)rstrm->out_boundry -
            (uintptr_t)rstrm->out_finger;
        chunk = (room > len) ? len : room;

        (void) memcpy(rstrm->out_finger, addr, chunk);
        rstrm->out_finger += chunk;
        addr += chunk;
        len -= chunk;

        if (rstrm->out_finger != rstrm->out_boundry)
            continue;

        /* Buffer is full: send it as an intermediate fragment. */
        rstrm->frag_sent = TRUE;
        if (! flush_out(rstrm, FALSE)) {
            trace1(TR_xdrrec_putbytes, 1);
            return (FALSE);
        }
    }
    trace1(TR_xdrrec_putbytes, 1);
    return (TRUE);
}
/*
 * This is just like the ops vector x_getbytes(), except that
 * instead of returning success or failure on getting a certain number
 * of bytes, it behaves much more like the read() system call against a
 * pipe -- it returns up to the number of bytes requested and a return of
 * zero indicates end-of-record.  A -1 means something very bad happened.
 */
uint_t /* must manage buffers, fragments, and records */
xdrrec_readbytes(XDR *xdrs, caddr_t addr, uint_t l)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    int remaining = l;
    int chunk;

    /*
     * Read up to 'l' bytes of the current record into 'addr'.
     * Returns the number of bytes delivered (short if the record
     * ended), or (uint_t)-1 on a transport/fragment error.
     */
    while (remaining > 0) {
        if (rstrm->fbtbc == 0) {
            /* Fragment exhausted: stop at end of record, else advance. */
            if (rstrm->last_frag)
                break;
            if (! set_input_fragment(rstrm))
                return ((uint_t)-1);
            continue;
        }
        chunk = (rstrm->fbtbc > remaining) ? remaining : rstrm->fbtbc;
        if (! get_input_bytes(rstrm, addr, chunk, FALSE))
            return ((uint_t)-1);
        rstrm->fbtbc -= chunk;
        addr += chunk;
        remaining -= chunk;
    }
    return (l - remaining);
}

static uint_t
xdrrec_getpos(XDR *xdrs)
{
    RECSTREAM *rstrm = (RECSTREAM *)xdrs->x_private;
    int32_t pos;

    /*
     * Report the stream position: the lseek() offset of the handle,
     * corrected by the bytes buffered here.  Yields (uint_t)-1 if
     * lseek() fails or the operation is neither encode nor decode.
     */
    trace1(TR_xdrrec_getpos, 0);
    pos = lseek((intptr_t)rstrm->tcp_handle, 0, 1);
    if (pos != -1) {
        if (xdrs->x_op == XDR_ENCODE) {
            /* Bytes buffered but not yet written. */
            pos += rstrm->out_finger - rstrm->out_base;
        } else if (xdrs->x_op == XDR_DECODE) {
            /* Bytes read from the handle but not yet consumed. */
            pos -= rstrm->in_boundry - rstrm->in_finger;
        } else {
            pos = (uint_t)-1;
        }
    }
    trace1(TR_xdrrec_getpos, 1);
    return ((uint_t)pos);
}

static bool_t
xdrrec_setpos(XDR *xdrs, uint_t pos)
{
    RECSTREAM *rstrm = (RECSTREAM *)xdrs->x_private;
    uint_t currpos = xdrrec_getpos(xdrs);
    int delta = currpos - pos;
    caddr_t target;

    /*
     * Move the stream position to 'pos'.  Only succeeds when the new
     * position stays inside the data currently held in the buffer.
     */
    trace2(TR_xdrrec_setpos, 0, pos);
    if ((int)currpos == -1) {
        trace1(TR_xdrrec_setpos, 1);
        return (FALSE);
    }

    if (xdrs->x_op == XDR_ENCODE) {
        /* Must land after the fragment header and before the buffer end. */
        target = rstrm->out_finger - delta;
        if ((target > (caddr_t)(rstrm->frag_header)) &&
            (target < rstrm->out_boundry)) {
            rstrm->out_finger = target;
            trace1(TR_xdrrec_setpos, 1);
            return (TRUE);
        }
    } else if (xdrs->x_op == XDR_DECODE) {
        /* Must stay within the buffered input and the current fragment. */
        target = rstrm->in_finger - delta;
        if ((delta < (int)(rstrm->fbtbc)) &&
            (target <= rstrm->in_boundry) &&
            (target >= rstrm->in_base)) {
            rstrm->in_finger = target;
            rstrm->fbtbc -= delta;
            trace1(TR_xdrrec_setpos, 1);
            return (TRUE);
        }
    }

    trace1(TR_xdrrec_setpos, 1);
    return (FALSE);
}

static rpc_inline_t *
xdrrec_inline(XDR *xdrs, int len)
{
    RECSTREAM *rstrm = (RECSTREAM *)xdrs->x_private;
    rpc_inline_t *region = NULL;

    /*
     * Hand out a pointer to 'len' contiguous bytes inside the stream
     * buffer, or NULL if that many bytes are not available in place.
     */
    trace2(TR_xdrrec_inline, 0, len);
    if (xdrs->x_op == XDR_ENCODE) {
        if ((rstrm->out_finger + len) <= rstrm->out_boundry) {
            region = (rpc_inline_t *)rstrm->out_finger;
            rstrm->out_finger += len;
        }
    } else if (xdrs->x_op == XDR_DECODE) {
        if ((len <= rstrm->fbtbc) &&
            ((rstrm->in_finger + len) <= rstrm->in_boundry)) {
            /* Realign the buffer if the read position is not longword aligned. */
            if (((intptr_t)rstrm->in_finger) &
                (sizeof (int32_t) - 1))
                align_instream(rstrm);
            region = (rpc_inline_t *)rstrm->in_finger;
            rstrm->in_finger += len;
            rstrm->fbtbc -= len;
        }
    }
    trace1(TR_xdrrec_inline, 1);
    return (region);
}

static void
xdrrec_destroy(XDR *xdrs)
{
    RECSTREAM *stream = (RECSTREAM *)xdrs->x_private;

    /* Release both I/O buffers first, then the stream state itself. */
    trace1(TR_xdrrec_destroy, 0);
    mem_free(stream->in_base, stream->recvsize);
    mem_free(stream->out_base, stream->sendsize);
    mem_free((caddr_t)stream, sizeof (RECSTREAM));
    trace1(TR_xdrrec_destroy, 1);
}


/*
 * Exported routines to manage xdr records
 */

/*
 * Before reading (deserializing) from the stream, one should always call
 * this procedure to guarantee proper record alignment.
 */
bool_t
xdrrec_skiprecord(XDR *xdrs)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);

    trace1(TR_xdrrec_skiprecord, 0);
    if (rstrm->in_nonblock) {
        enum xprt_stat pstat;
        bool_t ok;

        /*
         * Read and discard a record from the non-blocking
         * buffer. Return success only if a complete record can
         * be retrieved without blocking, or if the buffer was
         * empty and there was no data to fetch.
         */
        ok = __xdrrec_getbytes_nonblock(xdrs, &pstat);
        if (!ok) {
            ok = (pstat == XPRT_MOREREQS &&
                rstrm->in_finger == rstrm->in_boundry);
        }
        if (ok)
            rstrm->fbtbc = 0;
        trace1(TR_xdrrec_skiprecord, 1);
        return (ok ? TRUE : FALSE);
    }

    /*
     * Blocking case: discard whatever is left of each fragment until
     * the last fragment of the record has been consumed.
     */
    while (!(rstrm->fbtbc <= 0 && rstrm->last_frag)) {
        if (! skip_input_bytes(rstrm, rstrm->fbtbc)) {
            trace1(TR_xdrrec_skiprecord, 1);
            return (FALSE);
        }
        rstrm->fbtbc = 0;
        if (rstrm->last_frag)
            continue;
        if (! set_input_fragment(rstrm)) {
            trace1(TR_xdrrec_skiprecord, 1);
            return (FALSE);
        }
    }
    /* Clear the flag so reading can move on to the following record. */
    rstrm->last_frag = FALSE;
    trace1(TR_xdrrec_skiprecord, 1);
    return (TRUE);
}

/*
 * Look ahead function.
 * Returns TRUE iff there is no more input in the buffer
 * after consuming the rest of the current record.
 */
bool_t
xdrrec_eof(XDR *xdrs)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    bool_t drained;

    trace1(TR_xdrrec_eof, 0);
    if (rstrm->in_nonblock) {
        /*
         * If in_needpoll is true, the non-blocking XDR stream
         * does not have a complete record.
         */
        return (rstrm->in_needpoll);
    }

    /* Consume the rest of the current record; any failure counts as EOF. */
    while (!(rstrm->fbtbc <= 0 && rstrm->last_frag)) {
        if (! skip_input_bytes(rstrm, rstrm->fbtbc)) {
            trace1(TR_xdrrec_eof, 1);
            return (TRUE);
        }
        rstrm->fbtbc = 0;
        if (rstrm->last_frag)
            continue;
        if (! set_input_fragment(rstrm)) {
            trace1(TR_xdrrec_eof, 1);
            return (TRUE);
        }
    }

    /* EOF exactly when nothing is left in the input buffer. */
    drained = (rstrm->in_finger == rstrm->in_boundry) ? TRUE : FALSE;
    trace1(TR_xdrrec_eof, 1);
    return (drained);
}

/*
 * The client must tell the package when an end-of-record has occurred.
 * The second parameter tells whether the record should be flushed to the
 * (output) tcp stream.  (This lets the package support batched or
 * pipelined procedure calls.)  TRUE => immediate flush to tcp connection.
 */
bool_t
xdrrec_endofrecord(XDR *xdrs, bool_t sendnow)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    uint32_t fraglen;
    bool_t result;
    bool_t must_flush;

    trace1(TR_xdrrec_endofrecord, 0);

    /*
     * Flush when the caller asks for it, when part of this record has
     * already gone out, or when there is no room left in the buffer
     * for another fragment header.
     */
    must_flush = sendnow || rstrm->frag_sent ||
        ((uintptr_t)rstrm->out_finger + sizeof (uint32_t) >=
        (uintptr_t)rstrm->out_boundry);

    if (!must_flush) {
        /*
         * Keep the record buffered: close the current fragment as the
         * last one and start a new fragment header right behind it.
         */
        fraglen = (uintptr_t)(rstrm->out_finger) -
            (uintptr_t)(rstrm->frag_header) - sizeof (uint32_t);
        *(rstrm->frag_header) = htonl((uint32_t)fraglen | LAST_FRAG);
        rstrm->frag_header = (uint32_t *)rstrm->out_finger;
        rstrm->out_finger += sizeof (uint32_t);
        trace1(TR_xdrrec_endofrecord, 1);
        return (TRUE);
    }

    rstrm->frag_sent = FALSE;
    result = flush_out(rstrm, TRUE);
    trace1(TR_xdrrec_endofrecord, 1);
    return (result);
}


/*
 * Internal useful routines
 */
static bool_t
flush_out(RECSTREAM *rstrm, bool_t eor)
{
    uint32_t flag = 0;
    uint32_t fraglen, total;
    int nwritten;

    /*
     * Finish the current fragment header (marking it last when eor is
     * TRUE), write the whole output buffer, and reset the buffer.
     */
    trace1(TR_flush_out, 0);
    if (eor == TRUE)
        flag = LAST_FRAG;

    /* Fragment payload length excludes the header itself. */
    fraglen = (uintptr_t)(rstrm->out_finger) -
        (uintptr_t)(rstrm->frag_header) - sizeof (uint32_t);
    *(rstrm->frag_header) = htonl(fraglen | flag);

    total = (uintptr_t)(rstrm->out_finger) - (uintptr_t)(rstrm->out_base);
    nwritten = (*(rstrm->writeit))
        (rstrm->tcp_handle, rstrm->out_base, (int)total);

    /*
     * A return of -2 is the specific 'CANT_STORE' error; in that case
     * the fragment must still be cleared, so it is handled like a
     * complete write.
     */
    if ((nwritten == (int)total) || (nwritten == -2)) {
        rstrm->frag_header = (uint32_t *)rstrm->out_base;
        rstrm->out_finger = (caddr_t)rstrm->out_base + sizeof (uint32_t);
        trace1(TR_flush_out, 1);
        return (TRUE);
    }

    trace1(TR_flush_out, 1);
    return (FALSE);
}

/* knows nothing about records!  Only about input buffers */
static bool_t
fill_input_buf(RECSTREAM *rstrm, bool_t do_align)
{
    caddr_t dest;
    uint_t skew;
    int nread;

    /*
     * Refill the input buffer from the transport.  Unless do_align is
     * set, the data is placed at the same offset modulo
     * BYTES_PER_XDR_UNIT as the old buffer end.
     */
    trace1(TR_fill_input_buf, 0);
    if (rstrm->in_nonblock) {
        /* Should never get here in the non-blocking case */
        trace1(TR_fill_input_buf, 1);
        return (FALSE);
    }

    skew = do_align ? 0 :
        (uint_t)((uintptr_t)rstrm->in_boundry % BYTES_PER_XDR_UNIT);
    dest = rstrm->in_base + skew;
    nread = rstrm->recvsize - skew;

    nread = (*(rstrm->readit))(rstrm->tcp_handle, dest, nread);
    if (nread == -1) {
        trace1(TR_fill_input_buf, 1);
        return (FALSE);
    }

    /* The freshly read bytes are now the unread contents of the buffer. */
    rstrm->in_finger = dest;
    rstrm->in_boundry = dest + nread;
    trace1(TR_fill_input_buf, 1);
    return (TRUE);
}

/* knows nothing about records!  Only about input buffers */
static bool_t
get_input_bytes(RECSTREAM *rstrm, caddr_t addr,
        int len, bool_t do_align)
{
    int avail, chunk;

    /*
     * Copy 'len' bytes from the input buffer to 'addr', refilling the
     * buffer from the transport as needed (blocking streams only).
     */
    trace2(TR_get_input_bytes, 0, len);

    if (rstrm->in_nonblock) {
        /*
         * Data should already be in the rstrm buffer, so we just
         * need to copy it to 'addr'.
         */
        avail = (int)(rstrm->in_boundry - rstrm->in_finger);
        if (avail < len) {
            trace1(TR_get_input_bytes, 1);
            return (FALSE);
        }
        (void) memcpy(addr, rstrm->in_finger, len);
        rstrm->in_finger += len;
        trace1(TR_get_input_bytes, 1);
        return (TRUE);
    }

    while (len > 0) {
        avail = (intptr_t)rstrm->in_boundry -
            (intptr_t)rstrm->in_finger;
        if (avail != 0) {
            chunk = (avail > len) ? len : avail;
            (void) memcpy(addr, rstrm->in_finger, chunk);
            rstrm->in_finger += chunk;
            addr += chunk;
            len -= chunk;
            /* Alignment only applies to the first refill. */
            do_align = FALSE;
            continue;
        }
        /* Buffer is empty: fetch more from the transport. */
        if (! fill_input_buf(rstrm, do_align)) {
            trace1(TR_get_input_bytes, 1);
            return (FALSE);
        }
    }
    trace1(TR_get_input_bytes, 1);
    return (TRUE);
}

/* next four bytes of the input stream are treated as a header */
static bool_t
set_input_fragment(RECSTREAM *rstrm)
{
    uint32_t wire_hdr;
    uint32_t hdr;

    trace1(TR_set_input_fragment, 0);
    if (rstrm->in_nonblock) {
        /*
         * In the non-blocking case, the fragment headers should
         * already have been consumed, so we should never get
         * here. Might as well return failure right away.
         */
        trace1(TR_set_input_fragment, 1);
        return (FALSE);
    }

    /* Pull the four header bytes off the input stream. */
    if (! get_input_bytes(rstrm, (caddr_t)&wire_hdr,
        (int)sizeof (wire_hdr), rstrm->last_frag)) {
        trace1(TR_set_input_fragment, 1);
        return (FALSE);
    }

    /* Top bit: last-fragment flag; remaining 31 bits: fragment length. */
    hdr = (uint32_t)ntohl(wire_hdr);
    rstrm->last_frag = (hdr & LAST_FRAG) ? TRUE : FALSE;
    rstrm->fbtbc = hdr & (~LAST_FRAG);
    trace1(TR_set_input_fragment, 1);
    return (TRUE);
}

/* consumes input bytes; knows nothing about records! */
static bool_t
skip_input_bytes(RECSTREAM *rstrm, int32_t cnt)
{
    int avail, step;

    /* Discard 'cnt' input bytes, refilling the buffer whenever it runs dry. */
    trace2(TR_skip_input_bytes, 0, cnt);
    while (cnt > 0) {
        avail = (intptr_t)rstrm->in_boundry -
            (intptr_t)rstrm->in_finger;
        if (avail != 0) {
            step = (avail > cnt) ? cnt : avail;
            rstrm->in_finger += step;
            cnt -= step;
            continue;
        }
        if (! fill_input_buf(rstrm, FALSE)) {
            trace1(TR_skip_input_bytes, 1);
            return (FALSE);
        }
    }
    trace1(TR_skip_input_bytes, 1);
    return (TRUE);
}


/*
 * Grow the input buffer of a non-blocking stream to 'newsize' bytes.
 *
 * Nothing is done (and TRUE is returned) when newsize does not exceed the
 * current recvsize.  On success the buffer pointers in_base, in_finger,
 * in_boundry and in_nextrec are rebased onto the new buffer and recvsize
 * is updated.  On allocation failure FALSE is returned and the stream is
 * left unchanged, with its old buffer still valid.
 */
static bool_t
__xdrrec_nonblock_realloc(RECSTREAM *rstrm, uint32_t newsize)
{
    ptrdiff_t finger_off, boundry_off, nextrec_off;
    caddr_t newbuf;

    if (newsize <= rstrm->recvsize)
        return (TRUE);

    /*
     * Record the positions relative to the old base BEFORE calling
     * realloc(): once realloc() succeeds the old block may be gone, and
     * doing arithmetic with pointers into it is undefined behavior.
     */
    finger_off = rstrm->in_finger - rstrm->in_base;
    boundry_off = rstrm->in_boundry - rstrm->in_base;
    nextrec_off = rstrm->in_nextrec - rstrm->in_base;

    newbuf = (caddr_t)realloc(rstrm->in_base, newsize);
    if (newbuf == NULL)
        return (FALSE);

    /* Make pointers valid for the new buffer */
    rstrm->in_base = newbuf;
    rstrm->in_finger = newbuf + finger_off;
    rstrm->in_boundry = newbuf + boundry_off;
    rstrm->in_nextrec = newbuf + nextrec_off;
    rstrm->recvsize = newsize;

    return (TRUE);
}

/*
 * adjust sizes and allocate buffer quad byte aligned
 */
bool_t
__xdrrec_set_conn_nonblock(XDR *xdrs, uint32_t tcp_maxrecsz)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    size_t newsize;

    /*
     * Switch the stream to non-blocking input and set its maximum
     * record size.  tcp_maxrecsz == 0 means "use the current receive
     * buffer size".  Returns FALSE only if the input buffer had to be
     * enlarged and the reallocation failed.
     */
    rstrm->in_nonblock = TRUE;
    if (tcp_maxrecsz == 0) {
        /*
         * If maxrecsz has not been set, use the default
         * that was set from xdrrec_create() and
         * fix_buf_size()
         */
        rstrm->in_maxrecsz = rstrm->recvsize;
        return (TRUE);
    }
    rstrm->in_maxrecsz = tcp_maxrecsz;
    if (tcp_maxrecsz <= rstrm->recvsize)
        return (TRUE);

    /*
     * For nonblocked connection, the entire record is read into the
     * buffer before any xdr processing. This implies that the record
     * size must allow for the maximum expected message size of the
     * service. However, it's inconvenient to allocate very large
     * buffers up front, so we limit ourselves to a reasonable
     * default size here, and reallocate (up to the maximum record
     * size allowed for the connection) as necessary.
     */
    if ((newsize = tcp_maxrecsz) > RPC_MAXDATASIZE) {
        newsize = RPC_MAXDATASIZE;
    }
    if (! __xdrrec_nonblock_realloc(rstrm, newsize)) {
        /*
         * The stream is torn down completely on failure.
         * NOTE(review): xdrs->x_private still points at the freed
         * stream afterwards -- confirm that callers do not use or
         * destroy 'xdrs' again after a FALSE return.
         */
        (void) syslog(LOG_ERR, mem_err_msg_rec);
        (void) mem_free(rstrm->out_base, rstrm->sendsize);
        (void) mem_free(rstrm->in_base,  rstrm->recvsize);
        (void) mem_free((char *)rstrm, sizeof (RECSTREAM));
        trace1(TR_xdrrec_create, 1);
        return (FALSE);
    }

    return (TRUE);
}

/*
 * Retrieve input data from the non-blocking connection, increase
 * the size of the read buffer if necessary, and check that the
 * record size stays below the allowed maximum for the connection.
 */
bool_t
__xdrrec_getbytes_nonblock(XDR *xdrs, enum xprt_stat *pstat)
{
    RECSTREAM *rstrm = (RECSTREAM *)(xdrs->x_private);
    uint32_t prevbytes_thisrec, minreqrecsize;
    uint32_t *header;
    uint32_t len_received = 0, unprocessed = 0;

    trace2(TR__xdrrec_getbytes_nonblock, 0, len);

    /*
     * For connection oriented protocols, there's no guarantee that
     * we will receive the data nicely chopped into records, no
     * matter how it was sent. We use the in_nextrec pointer to
     * indicate where in the buffer the next record starts. If
     * in_nextrec != in_base, there's data in the buffer from
     * previous reads, and if in_nextrecsz > 0, we need to copy
     * the portion of the next record already read to the start of
     * the input buffer
     */
    if (rstrm->in_nextrecsz > 0) {
        /* Starting on new record with data already in the buffer */
        (void) memmove(rstrm->in_base, rstrm->in_nextrec,
            rstrm->in_nextrecsz);
        rstrm->in_nextrec = rstrm->in_finger = rstrm->in_base;
        rstrm->in_boundry = rstrm->in_nextrec + rstrm->in_nextrecsz;
        unprocessed = rstrm->in_nextrecsz;
        rstrm->in_nextrecsz = 0;
    } else if (rstrm->in_nextrec == rstrm->in_base) {
        /* Starting on new record with empty buffer */
        rstrm->in_boundry = rstrm->in_finger = rstrm->in_base;
        rstrm->last_frag = FALSE;
        rstrm->in_needpoll = TRUE;
    }

    prevbytes_thisrec = (uint32_t)(rstrm->in_boundry - rstrm->in_base);

    /* Do we need to retrieve data ? */
    if (rstrm->in_needpoll) {
        int len_requested, len_total_received;

        rstrm->in_needpoll = FALSE;
        len_total_received =
            (int)(rstrm->in_boundry - rstrm->in_base);
        len_requested = rstrm->recvsize - len_total_received;
        /*
         * if len_requested is 0, this means that the input
         * buffer is full and need to be increased.
         * The minimum record size we will need is whatever's
         * already in the buffer, plus what's yet to be
         * consumed in the current fragment, plus space for at
         * least one more fragment header, if this is not the
         * last fragment. We use the RNDUP() macro to
         * account for possible realignment of the next
         * fragment header.
         */
        if (len_requested == 0) {
            minreqrecsize = rstrm->recvsize +
                rstrm->fbtbc +
                (rstrm->last_frag ? 0 : sizeof (*header));
            minreqrecsize = RNDUP(minreqrecsize);
            if (minreqrecsize == rstrm->recvsize) {
                /*
                 * no more bytes to be consumed and
                 * last fragment. We should never end up
                 * here. Might as well return failure
                 * right away.
                 */
                *pstat = XPRT_DIED;
                trace1(TR__xdrrec_getbytes_nonblock, 1);
                return (FALSE);
            } else if (minreqrecsize > rstrm->in_maxrecsz) {
                goto recsz_invalid;
            } else {
                goto needpoll;
            }
        }
        if ((len_received = (*(rstrm->readit))(rstrm->tcp_handle,
                rstrm->in_boundry, len_requested)) == -1) {
            *pstat = XPRT_DIED;
            trace1(TR__xdrrec_getbytes_nonblock, 1);
            return (FALSE);
        }
        rstrm->in_boundry += len_received;
        rstrm->in_nextrec = rstrm->in_boundry;
    }

    /* Account for any left over data from previous processing */
    len_received += unprocessed;

    /* Set a lower limit on the buffer space we'll need */
    minreqrecsize = prevbytes_thisrec + rstrm->fbtbc;

    /*
     * Consume bytes for this record until it's either complete,
     * rejected, or we need to poll for more bytes.
     *
     * If fbtbc == 0, in_finger points to the start of the fragment
     * header. Otherwise, it points to the start of the fragment data.
     */
    while (len_received > 0) {
        if (rstrm->fbtbc == 0) {
            uint32_t hdrlen, minfraglen = 0;
            uint32_t len_recvd_thisfrag;
            bool_t last_frag;

            len_recvd_thisfrag = (uint32_t)(rstrm->in_boundry -
                        rstrm->in_finger);
            header = (uint32_t *)rstrm->in_finger;
            hdrlen = (len_recvd_thisfrag < sizeof (*header)) ?
                len_recvd_thisfrag : sizeof (*header);
            memcpy(&minfraglen, header, hdrlen);
            last_frag = (ntohl(minfraglen) & LAST_FRAG) != 0;
            minfraglen = ntohl(minfraglen) & (~LAST_FRAG);
            /*
             * The minimum record size we will need is whatever's
             * already in the buffer, plus the size of this
             * fragment, plus (if this isn't the last fragment)
             * space for at least one more fragment header. We
             * use the RNDUP() macro to account for possible
             * realignment of the next fragment header.
             */
            minreqrecsize += minfraglen +
                    (last_frag?0:sizeof (*header));
            minreqrecsize = RNDUP(minreqrecsize);

            if (hdrlen < sizeof (*header)) {
                /*
                 * We only have a partial fragment header,
                 * but we can still put a lower limit on the
                 * final fragment size, and check against the
                 * maximum allowed.
                 */
                if (len_recvd_thisfrag > 0 &&
                    (minreqrecsize > rstrm->in_maxrecsz)) {
                    goto recsz_invalid;
                }
                /* Need more bytes to obtain fbtbc value */
                goto needpoll;
            }
            /*
             * We've got a complete fragment header, so
             * 'minfraglen' is the actual fragment length, and
             * 'minreqrecsize' the requested record size.
             */
            rstrm->last_frag = last_frag;
            rstrm->fbtbc = minfraglen;
            /*
             * Check that the sum of the total number of bytes read
             * so far (for the record) and the size of the incoming
             * fragment is less than the maximum allowed.
             *
             * If this is the last fragment, also check that the
             * record (message) meets the minimum length
             * requirement.
             *
             * If this isn't the last fragment, check for a zero
             * fragment length. Accepting such fragments would
             * leave us open to an attack where the sender keeps
             * the connection open indefinitely, without any
             * progress, by occasionally sending a zero length
             * fragment.
             */
            if ((minreqrecsize > rstrm->in_maxrecsz) ||
            (rstrm->last_frag && minreqrecsize < MIN_FRAG) ||
            (!rstrm->last_frag && minfraglen == 0)) {
recsz_invalid:
                rstrm->fbtbc = 0;
                rstrm->last_frag = 1;
                *pstat = XPRT_DIED;
                trace1(TR__xdrrec_getbytes_nonblock, 1);
                return (FALSE);
            }
            /*
             * Make this fragment abut the previous one. If it's
             * the first fragment, just advance in_finger past
             * the header. This avoids buffer copying for the
             * usual case where there's one fragment per record.
             */
            if (rstrm->in_finger == rstrm->in_base) {
                rstrm->in_finger += sizeof (*header);
            } else {
                rstrm->in_boundry -= sizeof (*header);
                (void) memmove(rstrm->in_finger,
                    rstrm->in_finger + sizeof (*header),
                    rstrm->in_boundry - rstrm->in_finger);
            }
            /* Consume the fragment header */
            if (len_received > sizeof (*header)) {
                len_received -= sizeof (*header);
            } else {
                len_received = 0;
            }
        }
        /*
         * Consume whatever fragment bytes we have.
         * If we've received all bytes for this fragment, advance
         * in_finger to point to the start of the next fragment
         * header. Otherwise, make fbtbc tell how much is left in
         * this fragment and advance finger to point to end of
         * fragment data.
         */
        if (len_received >= rstrm->fbtbc) {
            len_received -= rstrm->fbtbc;
            rstrm->in_finger += rstrm->fbtbc;
            rstrm->fbtbc = 0;
        } else {
            rstrm->fbtbc -= len_received;
            rstrm->in_finger += len_received;
            len_received = 0;
        }
        /*
         * If there's more data in the buffer, there are two
         * possibilities:
         *
         * (1)  This is the last fragment, so the extra data
         *  presumably belongs to the next record.
         *
         * (2)  Not the last fragment, so we'll start over
         *  from the top of the loop.
         */
        if (len_received > 0 && rstrm->last_frag) {
            rstrm->in_nextrec = rstrm->in_finger;
            rstrm->in_nextrecsz = (uint32_t)(rstrm->in_boundry -
                            rstrm->in_nextrec);
            len_received = 0;
        }
    }

    /* Was this the last fragment, and have we read the entire record ? */
    if (rstrm->last_frag && rstrm->fbtbc == 0) {
        *pstat = XPRT_MOREREQS;
        /*
         * We've been using both in_finger and fbtbc for our own
         * purposes. Now's the time to update them to be what
         * xdrrec_inline() expects. Set in_finger to point to the
         * start of data for this record, and fbtbc to the number
         * of bytes in the record.
         */
        rstrm->fbtbc = (int)(rstrm->in_finger -
                rstrm->in_base - sizeof (*header));
        rstrm->in_finger = rstrm->in_base + sizeof (*header);
        if (rstrm->in_nextrecsz == 0)
            rstrm->in_nextrec = rstrm->in_base;
        trace1(TR__xdrrec_getbytes_nonblock, 1);
        return (TRUE);
    }
needpoll:
    /*
     * Need more bytes, so we set the needpoll flag, and go back to
     * the main RPC request loop. However, first we reallocate the
     * input buffer, if necessary.
     */
    if (minreqrecsize > rstrm->recvsize) {
        if (! __xdrrec_nonblock_realloc(rstrm, minreqrecsize)) {
            rstrm->fbtbc = 0;
            rstrm->last_frag = 1;
            *pstat = XPRT_DIED;
            trace1(TR__xdrrec_getbytes_nonblock, 1);
            return (FALSE);
        }
    }

    rstrm->in_needpoll = TRUE;
    *pstat = XPRT_MOREREQS;
    trace1(TR__xdrrec_getbytes_nonblock, 1);
    return (FALSE);
}

/*
 * Report whether the record stream attached to 'xdrs' currently has
 * its 'firsttime' flag set.
 *
 * Returns 1 if the flag equals TRUE, 0 otherwise.
 */
int
__is_xdrrec_first(XDR *xdrs)
{
    RECSTREAM *rs = (RECSTREAM *)(xdrs->x_private);

    if (rs->firsttime == TRUE)
        return (1);
    return (0);
}

/*
 * Arm the 'firsttime' flag of the record stream attached to 'xdrs',
 * but only when the input buffer holds no unconsumed bytes
 * (in_finger == in_boundry). With data still buffered the flag is
 * cleared instead; otherwise the first read from the network could
 * skip a poll.
 *
 * Always returns 1.
 */
int
__xdrrec_setfirst(XDR *xdrs)
{
    RECSTREAM *rs = (RECSTREAM *)(xdrs->x_private);

    rs->firsttime = (rs->in_finger == rs->in_boundry) ? TRUE : FALSE;
    return (1);
}

/*
 * Unconditionally clear the 'firsttime' flag of the record stream
 * attached to 'xdrs'.
 *
 * Always returns 1.
 */
int
__xdrrec_resetfirst(XDR *xdrs)
{
    RECSTREAM *rs = (RECSTREAM *)(xdrs->x_private);

    rs->firsttime = FALSE;
    return (1);
}


/*
 * Normalize a requested buffer size.
 *
 * A request smaller than 100 is replaced by 4000; the resulting
 * value is then rounded up with RNDUP() and returned.
 */
static uint_t
fix_buf_size(uint_t s)
{
    uint_t wanted = s;
    uint_t rounded;

    trace2(TR_fix_buf_size, 0, s);
    /* Requests below the threshold fall back to the default size */
    if (wanted < 100)
        wanted = 4000;
    rounded = RNDUP(wanted);
    trace1(TR_fix_buf_size, 1);
    return (rounded);
}


/*
 * Control operation for record streams.
 *
 * The only request handled is XDR_GET_BYTES_AVAIL, for which 'info'
 * is treated as a pointer to an xdr_bytesrec that is filled in with:
 *   xc_is_last_record - the stream's last_frag flag
 *   xc_num_avail      - the stream's fbtbc value
 *
 * Returns TRUE when the request was satisfied; FALSE for any other
 * request, or when set_input_fragment() fails.
 */
static bool_t
xdrrec_control(XDR *xdrs, int request, void *info)
{
    RECSTREAM *rs = (RECSTREAM *)(xdrs->x_private);
    xdr_bytesrec *avail;

    if (request != XDR_GET_BYTES_AVAIL)
        return (FALSE);

    /*
     * At the end of a fragment that is not the last one, move on
     * to the next fragment before reporting.
     */
    if (rs->fbtbc == 0 && !rs->last_frag && !set_input_fragment(rs))
        return (FALSE);

    avail = (xdr_bytesrec *)info;
    avail->xc_is_last_record = rs->last_frag;
    avail->xc_num_avail = rs->fbtbc;

    return (TRUE);
}

static struct xdr_ops *
xdrrec_ops()
{
    static struct xdr_ops ops;
    extern mutex_t  ops_lock;

/* VARIABLES PROTECTED BY ops_lock: ops */

    trace1(TR_xdrrec_ops, 0);
    mutex_lock(&ops_lock);
    if (ops.x_getlong == NULL) {
        ops.x_getlong = xdrrec_getlong;
        ops.x_putlong = xdrrec_putlong;
        ops.x_getbytes = xdrrec_getbytes;
        ops.x_putbytes = xdrrec_putbytes;
        ops.x_getpostn = xdrrec_getpos;
        ops.x_setpostn = xdrrec_setpos;
        ops.x_inline = xdrrec_inline;
        ops.x_destroy = xdrrec_destroy;
        ops.x_control = xdrrec_control;
#if defined(_LP64)
        ops.x_getint32 = xdrrec_getint32;
        ops.x_putint32 = xdrrec_putint32;
#endif
    }
    mutex_unlock(&ops_lock);
    trace1(TR_xdrrec_ops, 1);
    return (&ops);
}