inet/ipf/fil.c

/*
 * Copyright (C) 1993-2003 by Darren Reed.
 *
 * See the IPFILTER.LICENCE file for details on licencing.
 *
 * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
 *
 * Copyright (c) 2014, Joyent, Inc.  All rights reserved.
 */

#if defined(KERNEL) || defined(_KERNEL)
# undef KERNEL
# undef _KERNEL
# define        KERNEL  1
# define        _KERNEL 1
#endif
#include <sys/errno.h>
#include <sys/types.h>
#include <sys/param.h>
#include <sys/time.h>
#if defined(__NetBSD__)
# if (NetBSD >= 199905) && !defined(IPFILTER_LKM) && defined(_KERNEL)
#  include "opt_ipfilter_log.h"
# endif
#endif
#if defined(_KERNEL) && defined(__FreeBSD_version) && \
    (__FreeBSD_version >= 220000)
# if (__FreeBSD_version >= 400000)
#  if !defined(IPFILTER_LKM)
#   include "opt_inet6.h"
#  endif
#  if (__FreeBSD_version == 400019)
#   define CSUM_DELAY_DATA
#  endif
# endif
# include <sys/filio.h>
#else
# include <sys/ioctl.h>
#endif
#if !defined(_AIX51)
# include <sys/fcntl.h>
#endif
#if defined(_KERNEL)
# include <sys/systm.h>
# include <sys/file.h>
#else
# include <stdio.h>
# include <string.h>
# include <stdlib.h>
# include <stddef.h>
# include <sys/file.h>
# define _KERNEL
# ifdef __OpenBSD__
struct file;
# endif
# include <sys/uio.h>
# undef _KERNEL
#endif
#if !defined(__SVR4) && !defined(__svr4__) && !defined(__hpux) && \
    !defined(linux)
# include <sys/mbuf.h>
#else
# if !defined(linux)
#  include <sys/byteorder.h>
# endif
# if (SOLARIS2 < 5) && defined(sun)
#  include <sys/dditypes.h>
# endif
#endif
#ifdef __hpux
# define _NET_ROUTE_INCLUDED
#endif
#if !defined(linux)
# include <sys/protosw.h>
#endif
#include <sys/socket.h>
#include <net/if.h>
#ifdef sun
# include <net/af.h>
#endif
#if !defined(_KERNEL) && defined(__FreeBSD__)
# include "radix_ipf.h"
#endif
#include <net/route.h>
#include <netinet/in.h>
#include <netinet/in_systm.h>
#include <netinet/ip.h>
#if !defined(linux)
# include <netinet/ip_var.h>
#endif
#if defined(__sgi) && defined(IFF_DRVRLOCK) /* IRIX 6 */
# include <sys/hashing.h>
# include <netinet/in_var.h>
#endif
#include <netinet/tcp.h>
#if (!defined(__sgi) && !defined(AIX)) || defined(_KERNEL)
# include <netinet/udp.h>
# include <netinet/ip_icmp.h>
#endif
#ifdef __hpux
# undef _NET_ROUTE_INCLUDED
#endif
#include "netinet/ip_compat.h"
#ifdef  USE_INET6
# include <netinet/icmp6.h>
# if !SOLARIS && defined(_KERNEL) && !defined(__osf__) && !defined(__hpux)
#  include <netinet6/in6_var.h>
# endif
#endif
#include <netinet/tcpip.h>
#include "netinet/ip_fil.h"
#include "netinet/ip_nat.h"
#include "netinet/ip_frag.h"
#include "netinet/ip_state.h"
#include "netinet/ip_proxy.h"
#include "netinet/ip_auth.h"
#include "netinet/ipf_stack.h"
#ifdef IPFILTER_SCAN
# include "netinet/ip_scan.h"
#endif
#ifdef IPFILTER_SYNC
# include "netinet/ip_sync.h"
#endif
#include "netinet/ip_pool.h"
#include "netinet/ip_htable.h"
#ifdef IPFILTER_COMPILED
# include "netinet/ip_rules.h"
#endif
#if defined(IPFILTER_BPF) && defined(_KERNEL)
# include <net/bpf.h>
#endif
#if defined(__FreeBSD_version) && (__FreeBSD_version >= 300000)
# include <sys/malloc.h>
# if defined(_KERNEL) && !defined(IPFILTER_LKM)
#  include "opt_ipfilter.h"
# endif
#endif
#include "netinet/ipl.h"
#if defined(_KERNEL)
#include <sys/sunddi.h>
#endif
/* END OF INCLUDES */

#if !defined(lint)
static const char sccsid[] = "@(#)fil.c 1.36 6/5/96 (C) 1993-2000 Darren Reed";
static const char rcsid[] = "@(#)$Id: fil.c,v 2.243.2.64 2005/08/13 05:19:59 darrenr Exp $";
#endif

#ifndef _KERNEL
# include "ipf.h"
# include "ipt.h"
# include "bpf-ipf.h"
extern  int opts;

# define    FR_VERBOSE(verb_pr)         verbose verb_pr
# define    FR_DEBUG(verb_pr)           debug verb_pr
#else /* #ifndef _KERNEL */
# define    FR_VERBOSE(verb_pr)
# define    FR_DEBUG(verb_pr)
#endif /* _KERNEL */


char    ipfilter_version[] = IPL_VERSION;
int fr_features = 0
#ifdef  IPFILTER_LKM
        | IPF_FEAT_LKM
#endif
#ifdef  IPFILTER_LOG
        | IPF_FEAT_LOG
#endif
#ifdef  IPFILTER_LOOKUP
        | IPF_FEAT_LOOKUP
#endif
#ifdef  IPFILTER_BPF
        | IPF_FEAT_BPF
#endif
#ifdef  IPFILTER_COMPILED
        | IPF_FEAT_COMPILED
#endif
#ifdef  IPFILTER_CKSUM
        | IPF_FEAT_CKSUM
#endif
#ifdef  IPFILTER_SYNC
        | IPF_FEAT_SYNC
#endif
#ifdef  IPFILTER_SCAN
        | IPF_FEAT_SCAN
#endif
#ifdef  USE_INET6
        | IPF_FEAT_IPV6
#endif
    ;

#define IPF_BUMP(x) (x)++

static  INLINE int  fr_ipfcheck __P((fr_info_t *, frentry_t *, int));
static  INLINE int  fr_ipfcheck __P((fr_info_t *, frentry_t *, int));
static  int     fr_portcheck __P((frpcmp_t *, u_short *));
static  int     frflushlist __P((int, minor_t, int *, frentry_t **,
                     ipf_stack_t *));
static  ipfunc_t    fr_findfunc __P((ipfunc_t));
static  frentry_t   *fr_firewall __P((fr_info_t *, u_32_t *));
static  int     fr_funcinit __P((frentry_t *fr, ipf_stack_t *));
static  INLINE void frpr_ah __P((fr_info_t *));
static  INLINE void frpr_esp __P((fr_info_t *));
static  INLINE void frpr_gre __P((fr_info_t *));
static  INLINE void frpr_udp __P((fr_info_t *));
static  INLINE void frpr_tcp __P((fr_info_t *));
static  INLINE void frpr_icmp __P((fr_info_t *));
static  INLINE void frpr_ipv4hdr __P((fr_info_t *));
static  INLINE int  frpr_pullup __P((fr_info_t *, int));
static  INLINE void frpr_short __P((fr_info_t *, int));
static  INLINE void frpr_tcpcommon __P((fr_info_t *));
static  INLINE void frpr_udpcommon __P((fr_info_t *));
static  INLINE int  fr_updateipid __P((fr_info_t *));
#ifdef  IPFILTER_LOOKUP
static  int     fr_grpmapinit __P((frentry_t *fr, ipf_stack_t *));
static  INLINE void *fr_resolvelookup __P((u_int, u_int, lookupfunc_t *,
                           ipf_stack_t *));
#endif
static  void        frsynclist __P((int, int, void *, char *, frentry_t *,
    ipf_stack_t *));
static  void        *fr_ifsync __P((int, int, char *, char *,
                    void *, void *, ipf_stack_t *));
static  ipftuneable_t   *fr_findtunebyname __P((const char *, ipf_stack_t *));
static  ipftuneable_t   *fr_findtunebycookie __P((void *, void **, ipf_stack_t *));

/*
 * bit values for identifying presence of individual IP options
 * All of these tables should be ordered by increasing key value on the left
 * hand side to allow for binary searching of the array and include a trailer
 * with a 0 for the bitmask for linear searches to easily find the end with.
 */
const   struct  optlist ipopts[20] = {
    { IPOPT_NOP,    0x000001 },
    { IPOPT_RR, 0x000002 },
    { IPOPT_ZSU,    0x000004 },
    { IPOPT_MTUP,   0x000008 },
    { IPOPT_MTUR,   0x000010 },
    { IPOPT_ENCODE, 0x000020 },
    { IPOPT_TS, 0x000040 },
    { IPOPT_TR, 0x000080 },
    { IPOPT_SECURITY, 0x000100 },
    { IPOPT_LSRR,   0x000200 },
    { IPOPT_E_SEC,  0x000400 },
    { IPOPT_CIPSO,  0x000800 },
    { IPOPT_SATID,  0x001000 },
    { IPOPT_SSRR,   0x002000 },
    { IPOPT_ADDEXT, 0x004000 },
    { IPOPT_VISA,   0x008000 },
    { IPOPT_IMITD,  0x010000 },
    { IPOPT_EIP,    0x020000 },
    { IPOPT_FINN,   0x040000 },
    { 0,        0x000000 }
};

#ifdef USE_INET6
struct optlist ip6exthdr[] = {
    { IPPROTO_HOPOPTS,      0x000001 },
    { IPPROTO_IPV6,         0x000002 },
    { IPPROTO_ROUTING,      0x000004 },
    { IPPROTO_FRAGMENT,     0x000008 },
    { IPPROTO_ESP,          0x000010 },
    { IPPROTO_AH,           0x000020 },
    { IPPROTO_NONE,         0x000040 },
    { IPPROTO_DSTOPTS,      0x000080 },
    { 0,                0 }
};
#endif

struct optlist tcpopts[] = {
    { TCPOPT_NOP,           0x000001 },
    { TCPOPT_MAXSEG,        0x000002 },
    { TCPOPT_WINDOW,        0x000004 },
    { TCPOPT_SACK_PERMITTED,    0x000008 },
    { TCPOPT_SACK,          0x000010 },
    { TCPOPT_TIMESTAMP,     0x000020 },
    { 0,                0x000000 }
};

/*
 * bit values for identifying presence of individual IP security options
 */
const   struct  optlist secopt[8] = {
    { IPSO_CLASS_RES4,  0x01 },
    { IPSO_CLASS_TOPS,  0x02 },
    { IPSO_CLASS_SECR,  0x04 },
    { IPSO_CLASS_RES3,  0x08 },
    { IPSO_CLASS_CONF,  0x10 },
    { IPSO_CLASS_UNCL,  0x20 },
    { IPSO_CLASS_RES2,  0x40 },
    { IPSO_CLASS_RES1,  0x80 }
};


/*
 * Table of functions available for use with call rules.
 */
static ipfunc_resolve_t fr_availfuncs[] = {
#ifdef  IPFILTER_LOOKUP
    { "fr_srcgrpmap", fr_srcgrpmap, fr_grpmapinit },
    { "fr_dstgrpmap", fr_dstgrpmap, fr_grpmapinit },
#endif
    { "", NULL }
};


/*
 * Below we declare a list of constants used only by the ipf_extraflush()
 * routine.  We are placing it here, instead of in ipf_extraflush() itself,
 * because we want to make it visible to tools such as mdb, nm etc., so the
 * values can easily be altered during debugging.
 */
static  const   int idletime_tab[] = {
    IPF_TTLVAL(30),     /* 30 seconds */
    IPF_TTLVAL(1800),   /* 30 minutes */
    IPF_TTLVAL(43200),  /* 12 hours */
    IPF_TTLVAL(345600), /* 4 days */
};


/*
 * The next section of code is a a collection of small routines that set
 * fields in the fr_info_t structure passed based on properties of the
 * current packet.  There are different routines for the same protocol
 * for each of IPv4 and IPv6.  Adding a new protocol, for which there
 * will "special" inspection for setup, is now more easily done by adding
 * a new routine and expanding the frpr_ipinit*() function rather than by
 * adding more code to a growing switch statement.
 */
#ifdef USE_INET6
static  INLINE int  frpr_ah6 __P((fr_info_t *));
static  INLINE void frpr_esp6 __P((fr_info_t *));
static  INLINE void frpr_gre6 __P((fr_info_t *));
static  INLINE void frpr_udp6 __P((fr_info_t *));
static  INLINE void frpr_tcp6 __P((fr_info_t *));
static  INLINE void frpr_icmp6 __P((fr_info_t *));
static  INLINE void frpr_ipv6hdr __P((fr_info_t *));
static  INLINE void frpr_short6 __P((fr_info_t *, int));
static  INLINE int  frpr_hopopts6 __P((fr_info_t *));
static  INLINE int  frpr_routing6 __P((fr_info_t *));
static  INLINE int  frpr_dstopts6 __P((fr_info_t *));
static  INLINE int  frpr_fragment6 __P((fr_info_t *));
static  INLINE int  frpr_ipv6exthdr __P((fr_info_t *, int, int));


/* ------------------------------------------------------------------------ */
/* Function:    frpr_short6                                                 */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* This is function enforces the 'is a packet too short to be legit' rule   */
/* for IPv6 and marks the packet with FI_SHORT if so.  See function comment */
/* for frpr_short() for more details.                                       */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_short6(fin, xmin)
fr_info_t *fin;
int xmin;
{

    if (fin->fin_dlen < xmin)
        fin->fin_flx |= FI_SHORT;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_ipv6hdr                                                */
/* Returns:     Nil                                                         */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Copy values from the IPv6 header into the fr_info_t struct and call the  */
/* per-protocol analyzer if it exists.                                      */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_ipv6hdr(fin)
fr_info_t *fin;
{
    ip6_t *ip6 = (ip6_t *)fin->fin_ip;
    int p, go = 1, i, hdrcount;
    fr_ip_t *fi = &fin->fin_fi;

    fin->fin_off = 0;

    fi->fi_tos = 0;
    fi->fi_optmsk = 0;
    fi->fi_secmsk = 0;
    fi->fi_auth = 0;

    p = ip6->ip6_nxt;
    fi->fi_ttl = ip6->ip6_hlim;
    fi->fi_src.in6 = ip6->ip6_src;
    fi->fi_dst.in6 = ip6->ip6_dst;
    fin->fin_id = 0;

    hdrcount = 0;
    while (go && !(fin->fin_flx & (FI_BAD|FI_SHORT))) {
        switch (p)
        {
        case IPPROTO_UDP :
            frpr_udp6(fin);
            go = 0;
            break;

        case IPPROTO_TCP :
            frpr_tcp6(fin);
            go = 0;
            break;

        case IPPROTO_ICMPV6 :
            frpr_icmp6(fin);
            go = 0;
            break;

        case IPPROTO_GRE :
            frpr_gre6(fin);
            go = 0;
            break;

        case IPPROTO_HOPOPTS :
            /*
             * hop by hop ext header is only allowed
             * right after IPv6 header.
             */
            if (hdrcount != 0) {
                fin->fin_flx |= FI_BAD;
                p = IPPROTO_NONE;
            } else {
                p = frpr_hopopts6(fin);
            }
            break;

        case IPPROTO_DSTOPTS :
            p = frpr_dstopts6(fin);
            break;

        case IPPROTO_ROUTING :
            p = frpr_routing6(fin);
            break;

        case IPPROTO_AH :
            p = frpr_ah6(fin);
            break;

        case IPPROTO_ESP :
            frpr_esp6(fin);
            go = 0;
            break;

        case IPPROTO_IPV6 :
            for (i = 0; ip6exthdr[i].ol_bit != 0; i++)
                if (ip6exthdr[i].ol_val == p) {
                    fin->fin_flx |= ip6exthdr[i].ol_bit;
                    break;
                }
            go = 0;
            break;

        case IPPROTO_NONE :
            go = 0;
            break;

        case IPPROTO_FRAGMENT :
            p = frpr_fragment6(fin);
            if (fin->fin_off != 0)  /* Not the first frag */
                go = 0;
            break;

        default :
            go = 0;
            break;
        }
        hdrcount++;

        /*
         * It is important to note that at this point, for the
         * extension headers (go != 0), the entire header may not have
         * been pulled up when the code gets to this point.  This is
         * only done for "go != 0" because the other header handlers
         * will all pullup their complete header.  The other indicator
         * of an incomplete packet is that this was just an extension
         * header.
         */
        if ((go != 0) && (p != IPPROTO_NONE) &&
            (frpr_pullup(fin, 0) == -1)) {
            p = IPPROTO_NONE;
            go = 0;
        }
    }
    fi->fi_p = p;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_ipv6exthdr                                             */
/* Returns:     int    - value of the next header or IPPROTO_NONE if error  */
/* Parameters:  fin(I)      - pointer to packet information                 */
/*              multiple(I) - flag indicating yes/no if multiple occurances */
/*                            of this extension header are allowed.         */
/*              proto(I)    - protocol number for this extension header     */
/*                                                                          */
/* IPv6 Only                                                                */
/* This function expects to find an IPv6 extension header at fin_dp.        */
/* There must be at least 8 bytes of data at fin_dp for there to be a valid */
/* extension header present. If a good one is found, fin_dp is advanced to  */
/* point at the first piece of data after the extension header, fin_exthdr  */
/* points to the start of the extension header and the "protocol" of the    */
/* *NEXT* header is returned.                                               */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_ipv6exthdr(fin, multiple, proto)
fr_info_t *fin;
int multiple, proto;
{
    struct ip6_ext *hdr;
    u_short shift;
    int i;

    fin->fin_flx |= FI_V6EXTHDR;

                /* 8 is default length of extension hdr */
    if ((fin->fin_dlen - 8) < 0) {
        fin->fin_flx |= FI_SHORT;
        return IPPROTO_NONE;
    }

    if (frpr_pullup(fin, 8) == -1)
        return IPPROTO_NONE;

    hdr = fin->fin_dp;
    shift = 8 + (hdr->ip6e_len << 3);
    if (shift > fin->fin_dlen) {    /* Nasty extension header length? */
        fin->fin_flx |= FI_BAD;
        return IPPROTO_NONE;
    }

    for (i = 0; ip6exthdr[i].ol_bit != 0; i++)
        if (ip6exthdr[i].ol_val == proto) {
            /*
             * Most IPv6 extension headers are only allowed once.
             */
            if ((multiple == 0) &&
                ((fin->fin_optmsk & ip6exthdr[i].ol_bit) != 0))
                fin->fin_flx |= FI_BAD;
            else
                fin->fin_optmsk |= ip6exthdr[i].ol_bit;
            break;
        }

    fin->fin_dp = (char *)fin->fin_dp + shift;
    fin->fin_dlen -= shift;

    return hdr->ip6e_nxt;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_hopopts6                                               */
/* Returns:     int    - value of the next header or IPPROTO_NONE if error  */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* This is function checks pending hop by hop options extension header      */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_hopopts6(fin)
fr_info_t *fin;
{
    return frpr_ipv6exthdr(fin, 0, IPPROTO_HOPOPTS);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_routing6                                               */
/* Returns:     int    - value of the next header or IPPROTO_NONE if error  */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* This is function checks pending routing extension header                 */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_routing6(fin)
fr_info_t *fin;
{
    struct ip6_ext *hdr;
    int shift;

    hdr = fin->fin_dp;
    if (frpr_ipv6exthdr(fin, 0, IPPROTO_ROUTING) == IPPROTO_NONE)
        return IPPROTO_NONE;

    shift = 8 + (hdr->ip6e_len << 3);
    /*
     * Nasty extension header length?
     */
    if ((hdr->ip6e_len << 3) & 15) {
        fin->fin_flx |= FI_BAD;
        /*
         * Compensate for the changes made in frpr_ipv6exthdr()
         */
        fin->fin_dlen += shift;
        fin->fin_dp = (char *)fin->fin_dp - shift;
        return IPPROTO_NONE;
    }

    return hdr->ip6e_nxt;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_fragment6                                              */
/* Returns:     int    - value of the next header or IPPROTO_NONE if error  */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Examine the IPv6 fragment header and extract fragment offset information.*/
/*                                                                          */
/* We don't know where the transport layer header (or whatever is next is), */
/* as it could be behind destination options (amongst others).  Because     */
/* there is no fragment cache, there is no knowledge about whether or not an*/
/* upper layer header has been seen (or where it ends) and thus we are not  */
/* able to continue processing beyond this header with any confidence.      */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_fragment6(fin)
fr_info_t *fin;
{
    struct ip6_frag *frag;

    fin->fin_flx |= FI_FRAG;

    /*
     * A fragmented IPv6 packet implies that there must be something
     * else after the fragment.
     */
    if (frpr_ipv6exthdr(fin, 0, IPPROTO_FRAGMENT) == IPPROTO_NONE)
        return IPPROTO_NONE;

    frag = (struct ip6_frag *)((char *)fin->fin_dp - sizeof(*frag));

    /*
     * If this fragment isn't the last then the packet length must
     * be a multiple of 8.
     */
    if ((frag->ip6f_offlg & IP6F_MORE_FRAG) != 0) {
        fin->fin_flx |= FI_MOREFRAG;

        if ((fin->fin_plen & 0x7) != 0)
            fin->fin_flx |= FI_BAD;
    }

    fin->fin_id = frag->ip6f_ident;
    fin->fin_off = ntohs(frag->ip6f_offlg & IP6F_OFF_MASK);
    if (fin->fin_off != 0)
        fin->fin_flx |= FI_FRAGBODY;

    return frag->ip6f_nxt;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_dstopts6                                               */
/* Returns:     int    - value of the next header or IPPROTO_NONE if error  */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              nextheader(I) - stores next header value                    */
/*                                                                          */
/* IPv6 Only                                                                */
/* This is function checks pending destination options extension header     */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_dstopts6(fin)
fr_info_t *fin;
{
    return frpr_ipv6exthdr(fin, 1, IPPROTO_DSTOPTS);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_icmp6                                                  */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* This routine is mainly concerned with determining the minimum valid size */
/* for an ICMPv6 packet.                                                    */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_icmp6(fin)
fr_info_t *fin;
{
    int minicmpsz = sizeof(struct icmp6_hdr);
    struct icmp6_hdr *icmp6;

    if (frpr_pullup(fin, ICMP6ERR_MINPKTLEN - sizeof(ip6_t)) == -1)
        return;

    if (fin->fin_dlen > 1) {
        icmp6 = fin->fin_dp;

        fin->fin_data[0] = *(u_short *)icmp6;

        if ((icmp6->icmp6_type & ICMP6_INFOMSG_MASK) != 0)
            fin->fin_flx |= FI_ICMPQUERY;

        switch (icmp6->icmp6_type)
        {
        case ICMP6_ECHO_REPLY :
        case ICMP6_ECHO_REQUEST :
            if (fin->fin_dlen >= 6)
                fin->fin_data[1] = icmp6->icmp6_id;
            minicmpsz = ICMP6ERR_MINPKTLEN - sizeof(ip6_t);
            break;
        case ICMP6_DST_UNREACH :
        case ICMP6_PACKET_TOO_BIG :
        case ICMP6_TIME_EXCEEDED :
        case ICMP6_PARAM_PROB :
            if ((fin->fin_m != NULL) &&
                (M_LEN(fin->fin_m) < fin->fin_plen)) {
                if (fr_coalesce(fin) != 1)
                    return;
            }
            fin->fin_flx |= FI_ICMPERR;
            minicmpsz = ICMP6ERR_IPICMPHLEN - sizeof(ip6_t);
            break;
        default :
            break;
        }
    }

    frpr_short6(fin, minicmpsz);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_udp6                                                   */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Analyse the packet for IPv6/UDP properties.                              */
/* Is not expected to be called for fragmented packets.                     */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_udp6(fin)
fr_info_t *fin;
{

    fr_checkv6sum(fin);

    frpr_short6(fin, sizeof(struct udphdr));
    if (frpr_pullup(fin, sizeof(struct udphdr)) == -1)
        return;

    frpr_udpcommon(fin);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_tcp6                                                   */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Analyse the packet for IPv6/TCP properties.                              */
/* Is not expected to be called for fragmented packets.                     */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_tcp6(fin)
fr_info_t *fin;
{

    fr_checkv6sum(fin);

    frpr_short6(fin, sizeof(struct tcphdr));
    if (frpr_pullup(fin, sizeof(struct tcphdr)) == -1)
        return;

    frpr_tcpcommon(fin);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_esp6                                                   */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Analyse the packet for ESP properties.                                   */
/* The minimum length is taken to be the SPI (32bits) plus a tail (32bits)  */
/* even though the newer ESP packets must also have a sequence number that  */
/* is 32bits as well, it is not possible(?) to determine the version from a */
/* simple packet header.                                                    */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_esp6(fin)
fr_info_t *fin;
{
    int i;
    frpr_short6(fin, sizeof(grehdr_t));

    (void) frpr_pullup(fin, 8);

    for (i = 0; ip6exthdr[i].ol_bit != 0; i++)
        if (ip6exthdr[i].ol_val == IPPROTO_ESP) {
            fin->fin_optmsk |= ip6exthdr[i].ol_bit;
            break;
        }
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_ah6                                                    */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv6 Only                                                                */
/* Analyse the packet for AH properties.                                    */
/* The minimum length is taken to be the combination of all fields in the   */
/* header being present and no authentication data (null algorithm used.)   */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_ah6(fin)
fr_info_t *fin;
{
    authhdr_t *ah;
    int i, shift;

    frpr_short6(fin, 12);

    if (frpr_pullup(fin, sizeof(*ah)) == -1)
        return IPPROTO_NONE;

    for (i = 0; ip6exthdr[i].ol_bit != 0; i++)
        if (ip6exthdr[i].ol_val == IPPROTO_AH) {
            fin->fin_optmsk |= ip6exthdr[i].ol_bit;
            break;
        }

    ah = (authhdr_t *)fin->fin_dp;

    shift = (ah->ah_plen + 2) * 4;
    fin->fin_dlen -= shift;
    fin->fin_dp = (char*)fin->fin_dp + shift;

    return ah->ah_next;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_gre6                                                   */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Analyse the packet for GRE properties.                                   */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_gre6(fin)
fr_info_t *fin;
{
    grehdr_t *gre;

    frpr_short6(fin, sizeof(grehdr_t));

    if (frpr_pullup(fin, sizeof(grehdr_t)) == -1)
        return;

    gre = fin->fin_dp;
    if (GRE_REV(gre->gr_flags) == 1)
        fin->fin_data[0] = gre->gr_call;
}
#endif  /* USE_INET6 */


/* ------------------------------------------------------------------------ */
/* Function:    frpr_pullup                                                 */
/* Returns:     int     - 0 == pullup succeeded, -1 == failure              */
/* Parameters:  fin(I)  - pointer to packet information                     */
/*              plen(I) - length (excluding L3 header) to pullup            */
/*                                                                          */
/* Short inline function to cut down on code duplication to perform a call  */
/* to fr_pullup to ensure there is the required amount of data,             */
/* consecutively in the packet buffer.                                      */
/* ------------------------------------------------------------------------ */
static INLINE int frpr_pullup(fin, plen)
fr_info_t *fin;
int plen;
{
#if defined(_KERNEL)
    if (fin->fin_m != NULL) {
        int ipoff;

        ipoff = (char *)fin->fin_ip - MTOD(fin->fin_m, char *);

        if (fin->fin_dp != NULL)
            plen += (char *)fin->fin_dp -
                ((char *)fin->fin_ip + fin->fin_hlen);
        plen += fin->fin_hlen;
        /*
         * We don't do 'plen += ipoff;' here. The fr_pullup() will
         * do it for us.
         */
        if (M_LEN(fin->fin_m) < plen + ipoff) {
            if (fr_pullup(fin->fin_m, fin, plen) == NULL)
                return -1;
        }
    }
#endif
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_short                                                  */
/* Returns:     void                                                        */
/* Parameters:  fin(I)  - pointer to packet information                     */
/*              xmin(I) - minimum header size                               */
/*                                                                          */
/* Check if a packet is "short" as defined by xmin.  The rule we are        */
/* applying here is that the packet must not be fragmented within the layer */
/* 4 header.  That is, it must not be a fragment that has its offset set to */
/* start within the layer 4 header (hdrmin) or if it is at offset 0, the    */
/* entire layer 4 header must be present (min).                             */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_short(fin, xmin)
fr_info_t *fin;
int xmin;
{

    if (fin->fin_off == 0) {
        if (fin->fin_dlen < xmin)
            fin->fin_flx |= FI_SHORT;
    } else if (fin->fin_off < xmin) {
        fin->fin_flx |= FI_SHORT;
    }
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_icmp                                                   */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv4 Only                                                                */
/* Do a sanity check on the packet for ICMP (v4).  In nearly all cases,     */
/* except extrememly bad packets, both type and code will be present.       */
/* The expected minimum size of an ICMP packet is very much dependent on    */
/* the type of it.                                                          */
/*                                                                          */
/* XXX - other ICMP sanity checks?                                          */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_icmp(fin)
fr_info_t *fin;
{
    int minicmpsz = sizeof(struct icmp);
    icmphdr_t *icmp;
    ip_t *oip;
    ipf_stack_t *ifs = fin->fin_ifs;

    if (fin->fin_off != 0) {
        frpr_short(fin, ICMPERR_ICMPHLEN);
        return;
    }

    if (frpr_pullup(fin, ICMPERR_ICMPHLEN) == -1)
        return;

    fr_checkv4sum(fin);

    /*
     * This is a right place to set icmp pointer, since the memory
     * referenced by fin_dp could get reallocated. The code down below can
     * rely on fact icmp variable always points to ICMP header.
     */
    icmp = fin->fin_dp;
    fin->fin_data[0] = *(u_short *)icmp;
    fin->fin_data[1] = icmp->icmp_id;

    switch (icmp->icmp_type)
    {
    case ICMP_ECHOREPLY :
    case ICMP_ECHO :
    /* Router discovery messaes - RFC 1256 */
    case ICMP_ROUTERADVERT :
    case ICMP_ROUTERSOLICIT :
        minicmpsz = ICMP_MINLEN;
        break;
    /*
     * type(1) + code(1) + cksum(2) + id(2) seq(2) +
     * 3 * timestamp(3 * 4)
     */
    case ICMP_TSTAMP :
    case ICMP_TSTAMPREPLY :
        minicmpsz = 20;
        break;
    /*
     * type(1) + code(1) + cksum(2) + id(2) seq(2) +
     * mask(4)
     */
    case ICMP_MASKREQ :
    case ICMP_MASKREPLY :
            minicmpsz = 12;
            break;
    /*
     * type(1) + code(1) + cksum(2) + id(2) seq(2) + ip(20+)
     */
    case ICMP_UNREACH :
        if (icmp->icmp_code == ICMP_UNREACH_NEEDFRAG) {
            if (icmp->icmp_nextmtu < ifs->ifs_fr_icmpminfragmtu)
                fin->fin_flx |= FI_BAD;
        }
        /* FALLTHRU */
    case ICMP_SOURCEQUENCH :
    case ICMP_REDIRECT :
    case ICMP_TIMXCEED :
    case ICMP_PARAMPROB :
        fin->fin_flx |= FI_ICMPERR;
        if (fr_coalesce(fin) != 1)
            return;
        /*
         * ICMP error packets should not be generated for IP
         * packets that are a fragment that isn't the first
         * fragment.
         */
        oip = (ip_t *)((char *)fin->fin_dp + ICMPERR_ICMPHLEN);
        if ((ntohs(oip->ip_off) & IP_OFFMASK) != 0)
            fin->fin_flx |= FI_BAD;
        break;
    default :
        break;
    }

    frpr_short(fin, minicmpsz);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_tcpcommon                                              */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* TCP header sanity checking.  Look for bad combinations of TCP flags,     */
/* and make some checks with how they interact with other fields.           */
/* If compiled with IPFILTER_CKSUM, check to see if the TCP checksum is     */
/* valid and mark the packet as bad if not.                                 */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_tcpcommon(fin)
fr_info_t *fin;
{
    int flags, tlen;
    tcphdr_t *tcp;

    fin->fin_flx |= FI_TCPUDP;
    if (fin->fin_off != 0)
        return;

    if (frpr_pullup(fin, sizeof(*tcp)) == -1)
        return;
    tcp = fin->fin_dp;

    if (fin->fin_dlen > 3) {
        fin->fin_sport = ntohs(tcp->th_sport);
        fin->fin_dport = ntohs(tcp->th_dport);
    }

    if ((fin->fin_flx & FI_SHORT) != 0)
        return;

    /*
     * Use of the TCP data offset *must* result in a value that is at
     * least the same size as the TCP header.
     */
    tlen = TCP_OFF(tcp) << 2;
    if (tlen < sizeof(tcphdr_t)) {
        fin->fin_flx |= FI_BAD;
        return;
    }

    flags = tcp->th_flags;
    fin->fin_tcpf = tcp->th_flags;

    /*
     * If the urgent flag is set, then the urgent pointer must
     * also be set and vice versa.  Good TCP packets do not have
     * just one of these set.
     */
    if ((flags & TH_URG) != 0 && (tcp->th_urp == 0)) {
        fin->fin_flx |= FI_BAD;
    } else if ((flags & TH_URG) == 0 && (tcp->th_urp != 0)) {
        /* Ignore this case, it shows up in "real" traffic with */
        /* bogus values in the urgent pointer field. */
        flags = flags; /* LINT */
    } else if (((flags & (TH_SYN|TH_FIN)) != 0) &&
           ((flags & (TH_RST|TH_ACK)) == TH_RST)) {
        /* TH_FIN|TH_RST|TH_ACK seems to appear "naturally" */
        fin->fin_flx |= FI_BAD;
    } else if (!(flags & TH_ACK)) {
        /*
         * If the ack bit isn't set, then either the SYN or
         * RST bit must be set.  If the SYN bit is set, then
         * we expect the ACK field to be 0.  If the ACK is
         * not set and if URG, PSH or FIN are set, consdier
         * that to indicate a bad TCP packet.
         */
        if ((flags == TH_SYN) && (tcp->th_ack != 0)) {
            /*
             * Cisco PIX sets the ACK field to a random value.
             * In light of this, do not set FI_BAD until a patch
             * is available from Cisco to ensure that
             * interoperability between existing systems is
             * achieved.
             */
            /*fin->fin_flx |= FI_BAD*/;
            flags = flags; /* LINT */
        } else if (!(flags & (TH_RST|TH_SYN))) {
            fin->fin_flx |= FI_BAD;
        } else if ((flags & (TH_URG|TH_PUSH|TH_FIN)) != 0) {
            fin->fin_flx |= FI_BAD;
        }
    }

    /*
     * At this point, it's not exactly clear what is to be gained by
     * marking up which TCP options are and are not present.  The one we
     * are most interested in is the TCP window scale.  This is only in
     * a SYN packet [RFC1323] so we don't need this here...?
     * Now if we were to analyse the header for passive fingerprinting,
     * then that might add some weight to adding this...
     */
    if (tlen == sizeof(tcphdr_t))
        return;

    if (frpr_pullup(fin, tlen) == -1)
        return;

#if 0
    ip = fin->fin_ip;
    s = (u_char *)(tcp + 1);
    off = IP_HL(ip) << 2;
# ifdef _KERNEL
    if (fin->fin_mp != NULL) {
        mb_t *m = *fin->fin_mp;

        if (off + tlen > M_LEN(m))
            return;
    }
# endif
    for (tlen -= (int)sizeof(*tcp); tlen > 0; ) {
        opt = *s;
        if (opt == '\0')
            break;
        else if (opt == TCPOPT_NOP)
            ol = 1;
        else {
            if (tlen < 2)
                break;
            ol = (int)*(s + 1);
            if (ol < 2 || ol > tlen)
                break;
        }

        for (i = 9, mv = 4; mv >= 0; ) {
            op = ipopts + i;
            if (opt == (u_char)op->ol_val) {
                optmsk |= op->ol_bit;
                break;
            }
        }
        tlen -= ol;
        s += ol;
    }
#endif /* 0 */
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_udpcommon                                              */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Extract the UDP source and destination ports, if present.  If compiled   */
/* with IPFILTER_CKSUM, check to see if the UDP checksum is valid.          */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_udpcommon(fin)
fr_info_t *fin;
{
    udphdr_t *udp;

    fin->fin_flx |= FI_TCPUDP;

    if (!fin->fin_off && (fin->fin_dlen > 3)) {
        if (frpr_pullup(fin, sizeof(*udp)) == -1) {
            fin->fin_flx |= FI_SHORT;
            return;
        }

        udp = fin->fin_dp;

        fin->fin_sport = ntohs(udp->uh_sport);
        fin->fin_dport = ntohs(udp->uh_dport);
    }
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_tcp                                                    */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv4 Only                                                                */
/* Analyse the packet for IPv4/TCP properties.                              */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_tcp(fin)
fr_info_t *fin;
{

    fr_checkv4sum(fin);

    frpr_short(fin, sizeof(tcphdr_t));

    frpr_tcpcommon(fin);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_udp                                                    */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv4 Only                                                                */
/* Analyse the packet for IPv4/UDP properties.                              */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_udp(fin)
fr_info_t *fin;
{

    fr_checkv4sum(fin);

    frpr_short(fin, sizeof(udphdr_t));

    frpr_udpcommon(fin);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_esp                                                    */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Analyse the packet for ESP properties.                                   */
/* The minimum length is taken to be the SPI (32bits) plus a tail (32bits)  */
/* even though the newer ESP packets must also have a sequence number that  */
/* is 32bits as well, it is not possible(?) to determine the version from a */
/* simple packet header.                                                    */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_esp(fin)
fr_info_t *fin;
{
    if ((fin->fin_off == 0) && (frpr_pullup(fin, 8) == -1))
        return;

    frpr_short(fin, 8);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_ah                                                     */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Analyse the packet for AH properties.                                    */
/* The minimum length is taken to be the combination of all fields in the   */
/* header being present and no authentication data (null algorithm used.)   */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_ah(fin)
fr_info_t *fin;
{
    authhdr_t *ah;
    int len;

    if ((fin->fin_off == 0) && (frpr_pullup(fin, sizeof(*ah)) == -1))
        return;

    ah = (authhdr_t *)fin->fin_dp;

    len = (ah->ah_plen + 2) << 2;
    frpr_short(fin, len);
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_gre                                                    */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Analyse the packet for GRE properties.                                   */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_gre(fin)
fr_info_t *fin;
{
    grehdr_t *gre;

    if ((fin->fin_off == 0) && (frpr_pullup(fin, sizeof(grehdr_t)) == -1))
        return;

    frpr_short(fin, sizeof(grehdr_t));

    if (fin->fin_off == 0) {
        gre = fin->fin_dp;
        if (GRE_REV(gre->gr_flags) == 1)
            fin->fin_data[0] = gre->gr_call;
    }
}


/* ------------------------------------------------------------------------ */
/* Function:    frpr_ipv4hdr                                                */
/* Returns:     void                                                        */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* IPv4 Only                                                                */
/* Analyze the IPv4 header and set fields in the fr_info_t structure.       */
/* Check all options present and flag their presence if any exist.          */
/* ------------------------------------------------------------------------ */
static INLINE void frpr_ipv4hdr(fin)
fr_info_t *fin;
{
    u_short optmsk = 0, secmsk = 0, auth = 0;
    int hlen, ol, mv, p, i;
    const struct optlist *op;
    u_char *s, opt;
    u_short off;
    fr_ip_t *fi;
    ip_t *ip;

    fi = &fin->fin_fi;
    hlen = fin->fin_hlen;

    ip = fin->fin_ip;
    p = ip->ip_p;
    fi->fi_p = p;
    fi->fi_tos = ip->ip_tos;
    fin->fin_id = ip->ip_id;
    off = ip->ip_off;

    /* Get both TTL and protocol */
    fi->fi_p = ip->ip_p;
    fi->fi_ttl = ip->ip_ttl;
#if 0
    (*(((u_short *)fi) + 1)) = (*(((u_short *)ip) + 4));
#endif

    /* Zero out bits not used in IPv6 address */
    fi->fi_src.i6[1] = 0;
    fi->fi_src.i6[2] = 0;
    fi->fi_src.i6[3] = 0;
    fi->fi_dst.i6[1] = 0;
    fi->fi_dst.i6[2] = 0;
    fi->fi_dst.i6[3] = 0;

    fi->fi_saddr = ip->ip_src.s_addr;
    fi->fi_daddr = ip->ip_dst.s_addr;

    /*
     * set packet attribute flags based on the offset and
     * calculate the byte offset that it represents.
     */
    off &= IP_MF|IP_OFFMASK;
    if (off != 0) {
        int morefrag = off & IP_MF;

        fi->fi_flx |= FI_FRAG;
        if (morefrag)
            fi->fi_flx |= FI_MOREFRAG;
        off &= IP_OFFMASK;
        if (off != 0) {
            fin->fin_flx |= FI_FRAGBODY;
            off <<= 3;
            if ((off + fin->fin_dlen > 65535) ||
                (fin->fin_dlen == 0) ||
                ((morefrag != 0) && ((fin->fin_dlen & 7) != 0))) {
                /*
                 * The length of the packet, starting at its
                 * offset cannot exceed 65535 (0xffff) as the
                 * length of an IP packet is only 16 bits.
                 *
                 * Any fragment that isn't the last fragment
                 * must have a length greater than 0 and it
                 * must be an even multiple of 8.
                 */
                fi->fi_flx |= FI_BAD;
            }
        }
    }
    fin->fin_off = off;

    /*
     * Call per-protocol setup and checking
     */
    switch (p)
    {
    case IPPROTO_UDP :
        frpr_udp(fin);
        break;
    case IPPROTO_TCP :
        frpr_tcp(fin);
        break;
    case IPPROTO_ICMP :
        frpr_icmp(fin);
        break;
    case IPPROTO_AH :
        frpr_ah(fin);
        break;
    case IPPROTO_ESP :
        frpr_esp(fin);
        break;
    case IPPROTO_GRE :
        frpr_gre(fin);
        break;
    }

    ip = fin->fin_ip;
    if (ip == NULL)
        return;

    /*
     * If it is a standard IP header (no options), set the flag fields
     * which relate to options to 0.
     */
    if (hlen == sizeof(*ip)) {
        fi->fi_optmsk = 0;
        fi->fi_secmsk = 0;
        fi->fi_auth = 0;
        return;
    }

    /*
     * So the IP header has some IP options attached.  Walk the entire
     * list of options present with this packet and set flags to indicate
     * which ones are here and which ones are not.  For the somewhat out
     * of date and obscure security classification options, set a flag to
     * represent which classification is present.
     */
    fi->fi_flx |= FI_OPTIONS;

    for (s = (u_char *)(ip + 1), hlen -= (int)sizeof(*ip); hlen > 0; ) {
        opt = *s;
        if (opt == '\0')
            break;
        else if (opt == IPOPT_NOP)
            ol = 1;
        else {
            if (hlen < 2)
                break;
            ol = (int)*(s + 1);
            if (ol < 2 || ol > hlen)
                break;
        }
        for (i = 9, mv = 4; mv >= 0; ) {
            op = ipopts + i;
            if ((opt == (u_char)op->ol_val) && (ol > 4)) {
                optmsk |= op->ol_bit;
                if (opt == IPOPT_SECURITY) {
                    const struct optlist *sp;
                    u_char  sec;
                    int j, m;

                    sec = *(s + 2); /* classification */
                    for (j = 3, m = 2; m >= 0; ) {
                        sp = secopt + j;
                        if (sec == sp->ol_val) {
                            secmsk |= sp->ol_bit;
                            auth = *(s + 3);
                            auth *= 256;
                            auth += *(s + 4);
                            break;
                        }
                        if (sec < sp->ol_val)
                            j -= m;
                        else
                            j += m;
                        m--;
                    }
                }
                break;
            }
            if (opt < op->ol_val)
                i -= mv;
            else
                i += mv;
            mv--;
        }
        hlen -= ol;
        s += ol;
    }

    /*
     *
     */
    if (auth && !(auth & 0x0100))
        auth &= 0xff00;
    fi->fi_optmsk = optmsk;
    fi->fi_secmsk = secmsk;
    fi->fi_auth = auth;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_makefrip                                                 */
/* Returns:     int - 1 == hdr checking error, 0 == OK                      */
/* Parameters:  hlen(I) - length of IP packet header                        */
/*              ip(I)   - pointer to the IP header                          */
/*              fin(IO) - pointer to packet information                     */
/*                                                                          */
/* Compact the IP header into a structure which contains just the info.     */
/* which is useful for comparing IP headers with and store this information */
/* in the fr_info_t structure pointer to by fin.  At present, it is assumed */
/* this function will be called with either an IPv4 or IPv6 packet.         */
/* ------------------------------------------------------------------------ */
int fr_makefrip(hlen, ip, fin)
int hlen;
ip_t *ip;
fr_info_t *fin;
{
    int v;

    fin->fin_depth = 0;
    fin->fin_hlen = (u_short)hlen;
    fin->fin_ip = ip;
    fin->fin_rule = 0xffffffff;
    fin->fin_group[0] = -1;
    fin->fin_group[1] = '\0';
    fin->fin_dlen = fin->fin_plen - hlen;
    fin->fin_dp = (char *)ip + hlen;

    v = fin->fin_v;
    if (v == 4)
        frpr_ipv4hdr(fin);
#ifdef  USE_INET6
    else if (v == 6)
        frpr_ipv6hdr(fin);
#endif
    if (fin->fin_ip == NULL)
        return -1;
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_portcheck                                                */
/* Returns:     int - 1 == port matched, 0 == port match failed             */
/* Parameters:  frp(I) - pointer to port check `expression'                 */
/*              pop(I) - pointer to port number to evaluate                 */
/*                                                                          */
/* Perform a comparison of a port number against some other(s), using a     */
/* structure with compare information stored in it.                         */
/* ------------------------------------------------------------------------ */
static INLINE int fr_portcheck(frp, pop)
frpcmp_t *frp;
u_short *pop;
{
    u_short tup, po;
    int err = 1;

    tup = *pop;
    po = frp->frp_port;

    /*
     * Do opposite test to that required and continue if that succeeds.
     */
    switch (frp->frp_cmp)
    {
    case FR_EQUAL :
        if (tup != po) /* EQUAL */
            err = 0;
        break;
    case FR_NEQUAL :
        if (tup == po) /* NOTEQUAL */
            err = 0;
        break;
    case FR_LESST :
        if (tup >= po) /* LESSTHAN */
            err = 0;
        break;
    case FR_GREATERT :
        if (tup <= po) /* GREATERTHAN */
            err = 0;
        break;
    case FR_LESSTE :
        if (tup > po) /* LT or EQ */
            err = 0;
        break;
    case FR_GREATERTE :
        if (tup < po) /* GT or EQ */
            err = 0;
        break;
    case FR_OUTRANGE :
        if (tup >= po && tup <= frp->frp_top) /* Out of range */
            err = 0;
        break;
    case FR_INRANGE :
        if (tup <= po || tup >= frp->frp_top) /* In range */
            err = 0;
        break;
    case FR_INCRANGE :
        if (tup < po || tup > frp->frp_top) /* Inclusive range */
            err = 0;
        break;
    default :
        break;
    }
    return err;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_tcpudpchk                                                */
/* Returns:     int - 1 == protocol matched, 0 == check failed              */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              ft(I)  - pointer to structure with comparison data          */
/*                                                                          */
/* Compares the current pcket (assuming it is TCP/UDP) information with a   */
/* structure containing information that we want to match against.          */
/* ------------------------------------------------------------------------ */
int fr_tcpudpchk(fin, ft)
fr_info_t *fin;
frtuc_t *ft;
{
    int err = 1;

    /*
     * Both ports should *always* be in the first fragment.
     * So far, I cannot find any cases where they can not be.
     *
     * compare destination ports
     */
    if (ft->ftu_dcmp)
        err = fr_portcheck(&ft->ftu_dst, &fin->fin_dport);

    /*
     * compare source ports
     */
    if (err && ft->ftu_scmp)
        err = fr_portcheck(&ft->ftu_src, &fin->fin_sport);

    /*
     * If we don't have all the TCP/UDP header, then how can we
     * expect to do any sort of match on it ?  If we were looking for
     * TCP flags, then NO match.  If not, then match (which should
     * satisfy the "short" class too).
     */
    if (err && (fin->fin_p == IPPROTO_TCP)) {
        if (fin->fin_flx & FI_SHORT)
            return !(ft->ftu_tcpf | ft->ftu_tcpfm);
        /*
         * Match the flags ?  If not, abort this match.
         */
        if (ft->ftu_tcpfm &&
            ft->ftu_tcpf != (fin->fin_tcpf & ft->ftu_tcpfm)) {
            FR_DEBUG(("f. %#x & %#x != %#x\n", fin->fin_tcpf,
                 ft->ftu_tcpfm, ft->ftu_tcpf));
            err = 0;
        }
    }
    return err;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_ipfcheck                                                 */
/* Returns:     int - 0 == match, 1 == no match                             */
/* Parameters:  fin(I)     - pointer to packet information                  */
/*              fr(I)      - pointer to filter rule                         */
/*              portcmp(I) - flag indicating whether to attempt matching on */
/*                           TCP/UDP port data.                             */
/*                                                                          */
/* Check to see if a packet matches an IPFilter rule.  Checks of addresses, */
/* port numbers, etc, for "standard" IPFilter rules are all orchestrated in */
/* this function.                                                           */
/* ------------------------------------------------------------------------ */
static INLINE int fr_ipfcheck(fin, fr, portcmp)
fr_info_t *fin;
frentry_t *fr;
int portcmp;
{
    u_32_t  *ld, *lm, *lip;
    fripf_t *fri;
    fr_ip_t *fi;
    int i;
    ipf_stack_t *ifs = fin->fin_ifs;

    fi = &fin->fin_fi;
    fri = fr->fr_ipf;
    lip = (u_32_t *)fi;
    lm = (u_32_t *)&fri->fri_mip;
    ld = (u_32_t *)&fri->fri_ip;

    /*
     * first 32 bits to check coversion:
     * IP version, TOS, TTL, protocol
     */
    i = ((*lip & *lm) != *ld);
    FR_DEBUG(("0. %#08x & %#08x != %#08x\n",
           *lip, *lm, *ld));
    if (i)
        return 1;

    /*
     * Next 32 bits is a constructed bitmask indicating which IP options
     * are present (if any) in this packet.
     */
    lip++, lm++, ld++;
    i |= ((*lip & *lm) != *ld);
    FR_DEBUG(("1. %#08x & %#08x != %#08x\n",
           *lip, *lm, *ld));
    if (i)
        return 1;

    lip++, lm++, ld++;
    /*
     * Unrolled loops (4 each, for 32 bits) for address checks.
     */
    /*
     * Check the source address.
     */
#ifdef  IPFILTER_LOOKUP
    if (fr->fr_satype == FRI_LOOKUP) {
        fin->fin_flx |= FI_DONTCACHE;
        i = (*fr->fr_srcfunc)(fr->fr_srcptr, fi->fi_v, lip, fin, ifs);
        if (i == -1)
            return 1;
        lip += 3;
        lm += 3;
        ld += 3;
    } else {
#endif
        i = ((*lip & *lm) != *ld);
        FR_DEBUG(("2a. %#08x & %#08x != %#08x\n",
               *lip, *lm, *ld));
        if (fi->fi_v == 6) {
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("2b. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("2c. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("2d. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
        } else {
            lip += 3;
            lm += 3;
            ld += 3;
        }
#ifdef  IPFILTER_LOOKUP
    }
#endif
    i ^= (fr->fr_flags & FR_NOTSRCIP) >> 6;
    if (i)
        return 1;

    /*
     * Check the destination address.
     */
    lip++, lm++, ld++;
#ifdef  IPFILTER_LOOKUP
    if (fr->fr_datype == FRI_LOOKUP) {
        fin->fin_flx |= FI_DONTCACHE;
        i = (*fr->fr_dstfunc)(fr->fr_dstptr, fi->fi_v, lip, fin, ifs);
        if (i == -1)
            return 1;
        lip += 3;
        lm += 3;
        ld += 3;
    } else {
#endif
        i = ((*lip & *lm) != *ld);
        FR_DEBUG(("3a. %#08x & %#08x != %#08x\n",
               *lip, *lm, *ld));
        if (fi->fi_v == 6) {
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("3b. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("3c. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
            lip++, lm++, ld++;
            i |= ((*lip & *lm) != *ld);
            FR_DEBUG(("3d. %#08x & %#08x != %#08x\n",
                   *lip, *lm, *ld));
        } else {
            lip += 3;
            lm += 3;
            ld += 3;
        }
#ifdef  IPFILTER_LOOKUP
    }
#endif
    i ^= (fr->fr_flags & FR_NOTDSTIP) >> 7;
    if (i)
        return 1;
    /*
     * IP addresses matched.  The next 32bits contains:
     * mast of old IP header security & authentication bits.
     */
    lip++, lm++, ld++;
    i |= ((*lip & *lm) != *ld);
    FR_DEBUG(("4. %#08x & %#08x != %#08x\n",
           *lip, *lm, *ld));

    /*
     * Next we have 32 bits of packet flags.
     */
    lip++, lm++, ld++;
    i |= ((*lip & *lm) != *ld);
    FR_DEBUG(("5. %#08x & %#08x != %#08x\n",
           *lip, *lm, *ld));

    if (i == 0) {
        /*
         * If a fragment, then only the first has what we're
         * looking for here...
         */
        if (portcmp) {
            if (!fr_tcpudpchk(fin, &fr->fr_tuc))
                i = 1;
        } else {
            if (fr->fr_dcmp || fr->fr_scmp ||
                fr->fr_tcpf || fr->fr_tcpfm)
                i = 1;
            if (fr->fr_icmpm || fr->fr_icmp) {
                if (((fi->fi_p != IPPROTO_ICMP) &&
                     (fi->fi_p != IPPROTO_ICMPV6)) ||
                    fin->fin_off || (fin->fin_dlen < 2))
                    i = 1;
                else if ((fin->fin_data[0] & fr->fr_icmpm) !=
                     fr->fr_icmp) {
                    FR_DEBUG(("i. %#x & %#x != %#x\n",
                         fin->fin_data[0],
                         fr->fr_icmpm, fr->fr_icmp));
                    i = 1;
                }
            }
        }
    }
    return i;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_scanlist                                                 */
/* Returns:     int - result flags of scanning filter list                  */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              pass(I) - default result to return for filtering            */
/*                                                                          */
/* Check the input/output list of rules for a match to the current packet.  */
/* If a match is found, the value of fr_flags from the rule becomes the     */
/* return value and fin->fin_fr points to the matched rule.                 */
/*                                                                          */
/* This function may be called recusively upto 16 times (limit inbuilt.)    */
/* When unwinding, it should finish up with fin_depth as 0.                 */
/*                                                                          */
/* Could be per interface, but this gets real nasty when you don't have,    */
/* or can't easily change, the kernel source code to .                      */
/* ------------------------------------------------------------------------ */
int fr_scanlist(fin, pass)
fr_info_t *fin;
u_32_t pass;
{
    int rulen, portcmp, off, logged, skip;
    struct frentry *fr, *fnext;
    u_32_t passt, passo;
    ipf_stack_t *ifs = fin->fin_ifs;

    /*
     * Do not allow nesting deeper than 16 levels.
     */
    if (fin->fin_depth >= 16)
        return pass;

    fr = fin->fin_fr;

    /*
     * If there are no rules in this list, return now.
     */
    if (fr == NULL)
        return pass;

    skip = 0;
    logged = 0;
    portcmp = 0;
    fin->fin_depth++;
    fin->fin_fr = NULL;
    off = fin->fin_off;

    if ((fin->fin_flx & FI_TCPUDP) && (fin->fin_dlen > 3) && !off)
        portcmp = 1;

    for (rulen = 0; fr; fr = fnext, rulen++) {
        fnext = fr->fr_next;
        if (skip != 0) {
            FR_VERBOSE(("%d (%#x)\n", skip, fr->fr_flags));
            skip--;
            continue;
        }

        /*
         * In all checks below, a null (zero) value in the
         * filter struture is taken to mean a wildcard.
         *
         * check that we are working for the right interface
         */
#ifdef  _KERNEL
        if (fr->fr_ifa && fr->fr_ifa != fin->fin_ifp)
            continue;
#else
        if (opts & (OPT_VERBOSE|OPT_DEBUG))
            printf("\n");
        FR_VERBOSE(("%c", FR_ISSKIP(pass) ? 's' :
                  FR_ISPASS(pass) ? 'p' :
                  FR_ISACCOUNT(pass) ? 'A' :
                  FR_ISAUTH(pass) ? 'a' :
                  (pass & FR_NOMATCH) ? 'n' :'b'));
        if (fr->fr_ifa && fr->fr_ifa != fin->fin_ifp)
            continue;
        FR_VERBOSE((":i"));
#endif

        switch (fr->fr_type)
        {
        case FR_T_IPF :
        case FR_T_IPF|FR_T_BUILTIN :
            if (fr_ipfcheck(fin, fr, portcmp))
                continue;
            break;
#if defined(IPFILTER_BPF)
        case FR_T_BPFOPC :
        case FR_T_BPFOPC|FR_T_BUILTIN :
            {
            u_char *mc;

            if (*fin->fin_mp == NULL)
                continue;
            if (fin->fin_v != fr->fr_v)
                continue;
            mc = (u_char *)fin->fin_m;
            if (!bpf_filter(fr->fr_data, mc, fin->fin_plen, 0))
                continue;
            break;
            }
#endif
        case FR_T_CALLFUNC|FR_T_BUILTIN :
            {
            frentry_t *f;

            f = (*fr->fr_func)(fin, &pass);
            if (f != NULL)
                fr = f;
            else
                continue;
            break;
            }
        default :
            break;
        }

        if ((fin->fin_out == 0) && (fr->fr_nattag.ipt_num[0] != 0)) {
            if (fin->fin_nattag == NULL)
                continue;
            if (fr_matchtag(&fr->fr_nattag, fin->fin_nattag) == 0)
                continue;
        }
        FR_VERBOSE(("=%s.%d *", fr->fr_group, rulen));

        passt = fr->fr_flags;

        /*
         * Allowing a rule with the "keep state" flag set to match
         * packets that have been tagged "out of window" by the TCP
         * state tracking is foolish as the attempt to add a new
         * state entry to the table will fail.
         */
        if ((passt & FR_KEEPSTATE) && (fin->fin_flx & FI_OOW))
            continue;

        /*
         * If the rule is a "call now" rule, then call the function
         * in the rule, if it exists and use the results from that.
         * If the function pointer is bad, just make like we ignore
         * it, except for increasing the hit counter.
         */
        IPF_BUMP(fr->fr_hits);
        fr->fr_bytes += (U_QUAD_T)fin->fin_plen;
        if ((passt & FR_CALLNOW) != 0) {
            if ((fr->fr_func != NULL) &&
                (fr->fr_func != (ipfunc_t)-1)) {
                frentry_t *frs;

                frs = fin->fin_fr;
                fin->fin_fr = fr;
                fr = (*fr->fr_func)(fin, &passt);
                if (fr == NULL) {
                    fin->fin_fr = frs;
                    continue;
                }
                passt = fr->fr_flags;
                fin->fin_fr = fr;
            }
        } else {
            fin->fin_fr = fr;
        }

#ifdef  IPFILTER_LOG
        /*
         * Just log this packet...
         */
        if ((passt & FR_LOGMASK) == FR_LOG) {
            if (ipflog(fin, passt) == -1) {
                if (passt & FR_LOGORBLOCK) {
                    passt &= ~FR_CMDMASK;
                    passt |= FR_BLOCK|FR_QUICK;
                }
                IPF_BUMP(ifs->ifs_frstats[fin->fin_out].fr_skip);
            }
            IPF_BUMP(ifs->ifs_frstats[fin->fin_out].fr_pkl);
            logged = 1;
        }
#endif /* IPFILTER_LOG */
        passo = pass;
        if (FR_ISSKIP(passt))
            skip = fr->fr_arg;
        else if ((passt & FR_LOGMASK) != FR_LOG)
            pass = passt;
        if (passt & (FR_RETICMP|FR_FAKEICMP))
            fin->fin_icode = fr->fr_icode;
        FR_DEBUG(("pass %#x\n", pass));
        fin->fin_rule = rulen;
        (void) strncpy(fin->fin_group, fr->fr_group, FR_GROUPLEN);
        if (fr->fr_grp != NULL) {
            fin->fin_fr = *fr->fr_grp;
            pass = fr_scanlist(fin, pass);
            if (fin->fin_fr == NULL) {
                fin->fin_rule = rulen;
                (void) strncpy(fin->fin_group, fr->fr_group,
                           FR_GROUPLEN);
                fin->fin_fr = fr;
            }
            if (fin->fin_flx & FI_DONTCACHE)
                logged = 1;
        }

        if (pass & FR_QUICK) {
            /*
             * Finally, if we've asked to track state for this
             * packet, set it up.  Add state for "quick" rules
             * here so that if the action fails we can consider
             * the rule to "not match" and keep on processing
             * filter rules.
             */
            if ((pass & FR_KEEPSTATE) &&
                !(fin->fin_flx & FI_STATE)) {
                int out = fin->fin_out;

                if (fr_addstate(fin, NULL, 0) != NULL) {
                    IPF_BUMP(ifs->ifs_frstats[out].fr_ads);
                } else {
                    IPF_BUMP(ifs->ifs_frstats[out].fr_bads);
                    pass = passo;
                    continue;
                }
            }
            break;
        }
    }
    if (logged)
        fin->fin_flx |= FI_DONTCACHE;
    fin->fin_depth--;
    return pass;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_acctpkt                                                  */
/* Returns:     frentry_t* - always returns NULL                            */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              passp(IO) - pointer to current/new filter decision (unused) */
/*                                                                          */
/* Checks a packet against accounting rules, if there are any for the given */
/* IP protocol version.                                                     */
/*                                                                          */
/* N.B.: this function returns NULL to match the prototype used by other    */
/* functions called from the IPFilter "mainline" in fr_check().             */
/* ------------------------------------------------------------------------ */
frentry_t *fr_acctpkt(fin, passp)
fr_info_t *fin;
u_32_t *passp;
{
    char group[FR_GROUPLEN];
    frentry_t *fr, *frsave;
    u_32_t pass, rulen;
    ipf_stack_t *ifs = fin->fin_ifs;

    passp = passp;
#ifdef  USE_INET6
    if (fin->fin_v == 6)
        fr = ifs->ifs_ipacct6[fin->fin_out][ifs->ifs_fr_active];
    else
#endif
        fr = ifs->ifs_ipacct[fin->fin_out][ifs->ifs_fr_active];

    if (fr != NULL) {
        frsave = fin->fin_fr;
        bcopy(fin->fin_group, group, FR_GROUPLEN);
        rulen = fin->fin_rule;
        fin->fin_fr = fr;
        pass = fr_scanlist(fin, FR_NOMATCH);
        if (FR_ISACCOUNT(pass)) {
            IPF_BUMP(ifs->ifs_frstats[0].fr_acct);
        }
        fin->fin_fr = frsave;
        bcopy(group, fin->fin_group, FR_GROUPLEN);
        fin->fin_rule = rulen;
    }
    return NULL;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_firewall                                                 */
/* Returns:     frentry_t* - returns pointer to matched rule, if no matches */
/*                           were found, returns NULL.                      */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              passp(IO) - pointer to current/new filter decision (unused) */
/*                                                                          */
/* Applies an appropriate set of firewall rules to the packet, to see if    */
/* there are any matches.  The first check is to see if a match can be seen */
/* in the cache.  If not, then search an appropriate list of rules.  Once a */
/* matching rule is found, take any appropriate actions as defined by the   */
/* rule - except logging.                                                   */
/* ------------------------------------------------------------------------ */
static frentry_t *fr_firewall(fin, passp)
fr_info_t *fin;
u_32_t *passp;
{
    frentry_t *fr;
    fr_info_t *fc;
    u_32_t pass;
    int out;
    ipf_stack_t *ifs = fin->fin_ifs;

    out = fin->fin_out;
    pass = *passp;

#ifdef  USE_INET6
    if (fin->fin_v == 6)
        fin->fin_fr = ifs->ifs_ipfilter6[out][ifs->ifs_fr_active];
    else
#endif
        fin->fin_fr = ifs->ifs_ipfilter[out][ifs->ifs_fr_active];

    /*
     * If there are no rules loaded skip all checks and return.
     */
    if (fin->fin_fr == NULL) {

        if ((pass & FR_NOMATCH)) {
            IPF_BUMP(ifs->ifs_frstats[out].fr_nom);
        }

        return (NULL);
    }

    fc = &ifs->ifs_frcache[out][CACHE_HASH(fin)];
    READ_ENTER(&ifs->ifs_ipf_frcache);
    if (!bcmp((char *)fin, (char *)fc, FI_CSIZE)) {
        /*
         * copy cached data so we can unlock the mutexes earlier.
         */
        bcopy((char *)fc, (char *)fin, FI_COPYSIZE);
        RWLOCK_EXIT(&ifs->ifs_ipf_frcache);
        IPF_BUMP(ifs->ifs_frstats[out].fr_chit);

        if ((fr = fin->fin_fr) != NULL) {
            IPF_BUMP(fr->fr_hits);
            fr->fr_bytes += (U_QUAD_T)fin->fin_plen;
            pass = fr->fr_flags;
        }
    } else {
        RWLOCK_EXIT(&ifs->ifs_ipf_frcache);

        pass = fr_scanlist(fin, ifs->ifs_fr_pass);

        if (((pass & FR_KEEPSTATE) == 0) &&
            ((fin->fin_flx & FI_DONTCACHE) == 0)) {
            WRITE_ENTER(&ifs->ifs_ipf_frcache);
            bcopy((char *)fin, (char *)fc, FI_COPYSIZE);
            RWLOCK_EXIT(&ifs->ifs_ipf_frcache);
        }

        fr = fin->fin_fr;
    }

    if ((pass & FR_NOMATCH)) {
        IPF_BUMP(ifs->ifs_frstats[out].fr_nom);
    }

    /*
     * Apply packets per second rate-limiting to a rule as required.
     */
    if ((fr != NULL) && (fr->fr_pps != 0) &&
        !ppsratecheck(&fr->fr_lastpkt, &fr->fr_curpps, fr->fr_pps)) {
        pass &= ~(FR_CMDMASK|FR_DUP|FR_RETICMP|FR_RETRST);
        pass |= FR_BLOCK;
        IPF_BUMP(ifs->ifs_frstats[out].fr_ppshit);
    }

    /*
     * If we fail to add a packet to the authorization queue, then we
     * drop the packet later.  However, if it was added then pretend
     * we've dropped it already.
     */
    if (FR_ISAUTH(pass)) {
        if (fr_newauth(fin->fin_m, fin) != 0) {
#ifdef  _KERNEL
            fin->fin_m = *fin->fin_mp = NULL;
#else
            ;
#endif
            fin->fin_error = 0;
        } else
            fin->fin_error = ENOSPC;
    }

    if ((fr != NULL) && (fr->fr_func != NULL) &&
        (fr->fr_func != (ipfunc_t)-1) && !(pass & FR_CALLNOW))
        (void) (*fr->fr_func)(fin, &pass);

    /*
     * If a rule is a pre-auth rule, check again in the list of rules
     * loaded for authenticated use.  It does not particulary matter
     * if this search fails because a "preauth" result, from a rule,
     * is treated as "not a pass", hence the packet is blocked.
     */
    if (FR_ISPREAUTH(pass)) {
        if ((fin->fin_fr = ifs->ifs_ipauth) != NULL)
            pass = fr_scanlist(fin, ifs->ifs_fr_pass);
    }

    /*
     * If the rule has "keep frag" and the packet is actually a fragment,
     * then create a fragment state entry.
     */
    if ((pass & (FR_KEEPFRAG|FR_KEEPSTATE)) == FR_KEEPFRAG) {
        if (fin->fin_flx & FI_FRAG) {
            if (fr_newfrag(fin, pass) == -1) {
                IPF_BUMP(ifs->ifs_frstats[out].fr_bnfr);
            } else {
                IPF_BUMP(ifs->ifs_frstats[out].fr_nfr);
            }
        } else {
            IPF_BUMP(ifs->ifs_frstats[out].fr_cfr);
        }
    }

    /*
     * Finally, if we've asked to track state for this packet, set it up.
     */
    if ((pass & FR_KEEPSTATE) && !(fin->fin_flx & FI_STATE)) {
        if (fr_addstate(fin, NULL, 0) != NULL) {
            IPF_BUMP(ifs->ifs_frstats[out].fr_ads);
        } else {
            IPF_BUMP(ifs->ifs_frstats[out].fr_bads);
            if (FR_ISPASS(pass)) {
                pass &= ~FR_CMDMASK;
                pass |= FR_BLOCK;
            }
        }
    }

    fr = fin->fin_fr;

    if (passp != NULL)
        *passp = pass;

    return fr;
}

/* ------------------------------------------------------------------------ */
/* Function:    fr_check                                                    */
/* Returns:     int -  0 == packet allowed through,                         */
/*              User space:                                                 */
/*                    -1 == packet blocked                                  */
/*                     1 == packet not matched                              */
/*                    -2 == requires authentication                         */
/*              Kernel:                                                     */
/*                   > 0 == filter error # for packet                       */
/* Parameters: ip(I)   - pointer to start of IPv4/6 packet                  */
/*             hlen(I) - length of header                                   */
/*             ifp(I)  - pointer to interface this packet is on             */
/*             out(I)  - 0 == packet going in, 1 == packet going out        */
/*             mp(IO)  - pointer to caller's buffer pointer that holds this */
/*                       IP packet.                                         */
/* Solaris & HP-UX ONLY :                                                   */
/*             qpi(I)  - pointer to STREAMS queue information for this      */
/*                       interface & direction.                             */
/*                                                                          */
/* fr_check() is the master function for all IPFilter packet processing.    */
/* It orchestrates: Network Address Translation (NAT), checking for packet  */
/* authorisation (or pre-authorisation), presence of related state info.,   */
/* generating log entries, IP packet accounting, routing of packets as      */
/* directed by firewall rules and of course whether or not to allow the     */
/* packet to be further processed by the kernel.                            */
/*                                                                          */
/* For packets blocked, the contents of "mp" will be NULL'd and the buffer  */
/* freed.  Packets passed may be returned with the pointer pointed to by    */
/* by "mp" changed to a new buffer.                                         */
/* ------------------------------------------------------------------------ */
int fr_check(ip, hlen, ifp, out
#if defined(_KERNEL) && defined(MENTAT)
, qif, mp, ifs)
void *qif;
#else
, mp, ifs)
#endif
mb_t **mp;
ip_t *ip;
int hlen;
void *ifp;
int out;
ipf_stack_t *ifs;
{
    /*
     * The above really sucks, but short of writing a diff
     */
    fr_info_t frinfo;
    fr_info_t *fin = &frinfo;
    u_32_t pass;
    frentry_t *fr = NULL;
    int v = IP_V(ip);
    mb_t *mc = NULL;
    mb_t *m;
#ifdef USE_INET6
    ip6_t *ip6;
#endif
#ifdef  _KERNEL
# ifdef MENTAT
    qpktinfo_t *qpi = qif;
#endif
#endif

    SPL_INT(s);
    pass = ifs->ifs_fr_pass;

    /*
     * The first part of fr_check() deals with making sure that what goes
     * into the filtering engine makes some sense.  Information about the
     * the packet is distilled, collected into a fr_info_t structure and
     * the an attempt to ensure the buffer the packet is in is big enough
     * to hold all the required packet headers.
     */
#ifdef  _KERNEL
# ifdef MENTAT
    if (!OK_32PTR(ip))
        return 2;
# endif


    if (ifs->ifs_fr_running <= 0) {
        return 0;
    }

    bzero((char *)fin, sizeof(*fin));

# ifdef MENTAT
    fin->fin_flx = qpi->qpi_flags & (FI_NOCKSUM|FI_MBCAST|FI_MULTICAST|
                     FI_BROADCAST);
    m = qpi->qpi_m;
    fin->fin_qfm = m;
    fin->fin_qpi = qpi;
# else /* MENTAT */

    m = *mp;

#  if defined(M_MCAST)
    if ((m->m_flags & M_MCAST) != 0)
        fin->fin_flx |= FI_MBCAST|FI_MULTICAST;
#  endif
#  if defined(M_MLOOP)
    if ((m->m_flags & M_MLOOP) != 0)
        fin->fin_flx |= FI_MBCAST|FI_MULTICAST;
#  endif
#  if defined(M_BCAST)
    if ((m->m_flags & M_BCAST) != 0)
        fin->fin_flx |= FI_MBCAST|FI_BROADCAST;
#  endif
#  ifdef M_CANFASTFWD
    /*
     * XXX For now, IP Filter and fast-forwarding of cached flows
     * XXX are mutually exclusive.  Eventually, IP Filter should
     * XXX get a "can-fast-forward" filter rule.
     */
    m->m_flags &= ~M_CANFASTFWD;
#  endif /* M_CANFASTFWD */
#  ifdef CSUM_DELAY_DATA
    /*
     * disable delayed checksums.
     */
    if (m->m_pkthdr.csum_flags & CSUM_DELAY_DATA) {
        in_delayed_cksum(m);
        m->m_pkthdr.csum_flags &= ~CSUM_DELAY_DATA;
    }
#  endif /* CSUM_DELAY_DATA */
# endif /* MENTAT */
#else

    bzero((char *)fin, sizeof(*fin));
    m = *mp;
#endif /* _KERNEL */

    fin->fin_v = v;
    fin->fin_m = m;
    fin->fin_ip = ip;
    fin->fin_mp = mp;
    fin->fin_out = out;
    fin->fin_ifp = ifp;
    fin->fin_error = ENETUNREACH;
    fin->fin_hlen = (u_short)hlen;
    fin->fin_dp = (char *)ip + hlen;
    fin->fin_ipoff = (char *)ip - MTOD(m, char *);
    fin->fin_ifs = ifs;

    SPL_NET(s);

#ifdef  USE_INET6
    if (v == 6) {
        IPF_BUMP(ifs->ifs_frstats[out].fr_ipv6);
        /*
         * Jumbo grams are quite likely too big for internal buffer
         * structures to handle comfortably, for now, so just drop
         * them.
         */
        ip6 = (ip6_t *)ip;
        fin->fin_plen = ntohs(ip6->ip6_plen);
        if (fin->fin_plen == 0) {
            READ_ENTER(&ifs->ifs_ipf_mutex);
            pass = FR_BLOCK|FR_NOMATCH;
            goto filtered;
        }
        fin->fin_plen += sizeof(ip6_t);
    } else
#endif
    {
#if (OpenBSD >= 200311) && defined(_KERNEL)
        ip->ip_len = ntohs(ip->ip_len);
        ip->ip_off = ntohs(ip->ip_off);
#endif
        fin->fin_plen = ip->ip_len;
    }

    if (fr_makefrip(hlen, ip, fin) == -1) {
        READ_ENTER(&ifs->ifs_ipf_mutex);
        pass = FR_BLOCK;
        goto filtered;
    }

    /*
     * For at least IPv6 packets, if a m_pullup() fails then this pointer
     * becomes NULL and so we have no packet to free.
     */
    if (*fin->fin_mp == NULL)
        goto finished;

    if (!out) {
        if (v == 4) {
#ifdef _KERNEL
            if (ifs->ifs_fr_chksrc && !fr_verifysrc(fin)) {
                IPF_BUMP(ifs->ifs_frstats[0].fr_badsrc);
                fin->fin_flx |= FI_BADSRC;
            }
#endif
            if (fin->fin_ip->ip_ttl < ifs->ifs_fr_minttl) {
                IPF_BUMP(ifs->ifs_frstats[0].fr_badttl);
                fin->fin_flx |= FI_LOWTTL;
            }
        }
#ifdef USE_INET6
        else  if (v == 6) {
            ip6 = (ip6_t *)ip;
#ifdef _KERNEL
            if (ifs->ifs_fr_chksrc && !fr_verifysrc(fin)) {
                IPF_BUMP(ifs->ifs_frstats[0].fr_badsrc);
                fin->fin_flx |= FI_BADSRC;
            }
#endif
            if (ip6->ip6_hlim < ifs->ifs_fr_minttl) {
                IPF_BUMP(ifs->ifs_frstats[0].fr_badttl);
                fin->fin_flx |= FI_LOWTTL;
            }
        }
#endif
    }

    if (fin->fin_flx & FI_SHORT) {
        IPF_BUMP(ifs->ifs_frstats[out].fr_short);
    }

    READ_ENTER(&ifs->ifs_ipf_mutex);

    /*
     * Check auth now.  This, combined with the check below to see if apass
     * is 0 is to ensure that we don't count the packet twice, which can
     * otherwise occur when we reprocess it.  As it is, we only count it
     * after it has no auth. table matchup.  This also stops NAT from
     * occuring until after the packet has been auth'd.
     */
    fr = fr_checkauth(fin, &pass);
    if (!out) {
        switch (fin->fin_v)
        {
        case 4 :
            if (fr_checknatin(fin, &pass) == -1) {
                RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
                goto finished;
            }
            break;
#ifdef  USE_INET6
        case 6 :
            if (fr_checknat6in(fin, &pass) == -1) {
                RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
                goto finished;
            }
            break;
#endif
        default :
            break;
        }
    }
    if (!out)
        (void) fr_acctpkt(fin, NULL);

    if (fr == NULL)
        if ((fin->fin_flx & (FI_FRAG|FI_BAD)) == FI_FRAG)
            fr = fr_knownfrag(fin, &pass);
    if (fr == NULL)
        fr = fr_checkstate(fin, &pass);

    if ((pass & FR_NOMATCH) || (fr == NULL))
        fr = fr_firewall(fin, &pass);

    fin->fin_fr = fr;

    /*
     * Only count/translate packets which will be passed on, out the
     * interface.
     */
    if (out && FR_ISPASS(pass)) {
        (void) fr_acctpkt(fin, NULL);

        switch (fin->fin_v)
        {
        case 4 :
            if (fr_checknatout(fin, &pass) == -1) {
                RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
                goto finished;
            }
            break;
#ifdef  USE_INET6
        case 6 :
            if (fr_checknat6out(fin, &pass) == -1) {
                RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
                goto finished;
            }
            break;
#endif
        default :
            break;
        }

        if ((ifs->ifs_fr_update_ipid != 0) && (v == 4)) {
            if (fr_updateipid(fin) == -1) {
                IPF_BUMP(ifs->ifs_frstats[1].fr_ipud);
                pass &= ~FR_CMDMASK;
                pass |= FR_BLOCK;
            } else {
                IPF_BUMP(ifs->ifs_frstats[0].fr_ipud);
            }
        }
    }

#ifdef  IPFILTER_LOG
    if ((ifs->ifs_fr_flags & FF_LOGGING) || (pass & FR_LOGMASK)) {
        (void) fr_dolog(fin, &pass);
    }
#endif

    /*
     * The FI_STATE flag is cleared here so that calling fr_checkstate
     * will work when called from inside of fr_fastroute.  Although
     * there is a similar flag, FI_NATED, for NAT, it does have the same
     * impact on code execution.
     */
    fin->fin_flx &= ~FI_STATE;

    /*
     * Only allow FR_DUP to work if a rule matched - it makes no sense to
     * set FR_DUP as a "default" as there are no instructions about where
     * to send the packet.  Use fin_m here because it may have changed
     * (without an update of 'm') in prior processing.
     */
    if ((fr != NULL) && (pass & FR_DUP)) {
        mc = M_DUPLICATE(fin->fin_m);
#ifdef _KERNEL
        mc->b_rptr += fin->fin_ipoff;
#endif
    }

    /*
     * We don't want to send RST for packets, which are going to be
     * dropped, just because they don't fit into TCP window. Those packets
     * will be dropped silently. In other words, we want to drop packet,
     * while keeping session alive.
     */
    if ((pass & (FR_RETRST|FR_RETICMP)) && ((fin->fin_flx & FI_OOW) == 0)) {
        /*
         * Should we return an ICMP packet to indicate error
         * status passing through the packet filter ?
         * WARNING: ICMP error packets AND TCP RST packets should
         * ONLY be sent in repsonse to incoming packets.  Sending them
         * in response to outbound packets can result in a panic on
         * some operating systems.
         */
        if (!out) {
            if (pass & FR_RETICMP) {
                int dst;

                if ((pass & FR_RETMASK) == FR_FAKEICMP)
                    dst = 1;
                else
                    dst = 0;
#if defined(_KERNEL) && (SOLARIS2 >= 10)
                /*
                 * Assume it's possible to enter insane rule:
                 *  pass return-icmp in proto udp ...
                 * then we have no other option than to forward
                 * packet on loopback and give up any attempt
                 * to create a fake response.
                 */
                if (IPF_IS_LOOPBACK(qpi->qpi_flags) &&
                    FR_ISBLOCK(pass)) {

                    if (fr_make_icmp(fin) == 0) {
                        IPF_BUMP(
                        ifs->ifs_frstats[out].fr_ret);
                    }
                    /*
                     * we drop packet silently in case we
                     * failed assemble fake response for it
                     */
                    else if (*mp != NULL) {
                        FREE_MB_T(*mp);
                        m = *mp = NULL;
                    }

                    IPF_BUMP(
                        ifs->ifs_frstats[out].fr_block);
                    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

                    return (0);
                }
#endif  /* _KERNEL && SOLARIS2 >= 10 */

                (void) fr_send_icmp_err(ICMP_UNREACH, fin, dst);
                IPF_BUMP(ifs->ifs_frstats[out].fr_ret);

            } else if (((pass & FR_RETMASK) == FR_RETRST) &&
                   !(fin->fin_flx & FI_SHORT)) {

#if defined(_KERNEL) && (SOLARIS2 >= 10)
                /*
                 * Assume it's possible to enter insane rule:
                 *  pass return-rst in proto tcp ...
                 * then we have no other option than to forward
                 * packet on loopback and give up any attempt
                 * to create a fake response.
                 */
                if (IPF_IS_LOOPBACK(qpi->qpi_flags) &&
                    FR_ISBLOCK(pass)) {
                    if (fr_make_rst(fin) == 0) {
                        IPF_BUMP(
                        ifs->ifs_frstats[out].fr_ret);
                    }
                    else if (mp != NULL) {
                    /*
                     * we drop packet silently in case we
                     * failed assemble fake response for it
                     */
                        FREE_MB_T(*mp);
                        m = *mp = NULL;
                    }

                    IPF_BUMP(
                        ifs->ifs_frstats[out].fr_block);
                    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

                    return (0);
                 }
#endif /* _KERNEL && _SOLARIS2 >= 10 */
                if (fr_send_reset(fin) == 0) {
                    IPF_BUMP(ifs->ifs_frstats[1].fr_ret);
                }
            }
        } else {
            if (pass & FR_RETRST)
                fin->fin_error = ECONNRESET;
        }
    }

    /*
     * If we didn't drop off the bottom of the list of rules (and thus
     * the 'current' rule fr is not NULL), then we may have some extra
     * instructions about what to do with a packet.
     * Once we're finished return to our caller, freeing the packet if
     * we are dropping it (* BSD ONLY *).
     * Reassign m from fin_m as we may have a new buffer, now.
     */
filtered:
    m = fin->fin_m;

    if (fr != NULL) {
        frdest_t *fdp;

        fdp = &fr->fr_tifs[fin->fin_rev];

        if (!out && (pass & FR_FASTROUTE)) {
            /*
             * For fastroute rule, no destioation interface defined
             * so pass NULL as the frdest_t parameter
             */
            (void) fr_fastroute(m, mp, fin, NULL);
            m = *mp = NULL;
        } else if ((fdp->fd_ifp != NULL) &&
               (fdp->fd_ifp != (struct ifnet *)-1)) {
            /* this is for to rules: */
            (void) fr_fastroute(m, mp, fin, fdp);
            m = *mp = NULL;
        }

        /*
         * Send a duplicated packet.
         */
        if (mc != NULL) {
#if defined(_KERNEL) && (SOLARIS2 >= 10)
            /*
             * We are going to compute chksum for copies of loopback packets
             * only. IP stack does not compute chksums at all for loopback
             * packets. We want to get it fixed in their copies, since those
             * are going to be sent to network.
             */
            if (IPF_IS_LOOPBACK(qpi->qpi_flags))
                fr_calc_chksum(fin, mc);
#endif
            (void) fr_fastroute(mc, &mc, fin, &fr->fr_dif);
        }
    }

    if (FR_ISBLOCK(pass) && (fin->fin_flx & FI_NEWNAT))
        nat_uncreate(fin);

    /*
     * This late because the likes of fr_fastroute() use fin_fr.
     */
    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

finished:
    if (!FR_ISPASS(pass)) {
        IPF_BUMP(ifs->ifs_frstats[out].fr_block);
        if (*mp != NULL) {
            FREE_MB_T(*mp);
            m = *mp = NULL;
        }
    } else {
        IPF_BUMP(ifs->ifs_frstats[out].fr_pass);
#if defined(_KERNEL) && defined(__sgi)
        if ((fin->fin_hbuf != NULL) &&
            (mtod(fin->fin_m, struct ip *) != fin->fin_ip)) {
            COPYBACK(m, 0, fin->fin_plen, fin->fin_hbuf);
        }
#endif
    }

    SPL_X(s);

#ifdef _KERNEL
# if OpenBSD >= 200311
    if (FR_ISPASS(pass) && (v == 4)) {
        ip = fin->fin_ip;
        ip->ip_len = ntohs(ip->ip_len);
        ip->ip_off = ntohs(ip->ip_off);
    }
# endif
    return (FR_ISPASS(pass)) ? 0 : fin->fin_error;
#else /* _KERNEL */
    FR_VERBOSE(("fin_flx %#x pass %#x ", fin->fin_flx, pass));
    if ((pass & FR_NOMATCH) != 0)
        return 1;

    if ((pass & FR_RETMASK) != 0)
        switch (pass & FR_RETMASK)
        {
        case FR_RETRST :
            return 3;
        case FR_RETICMP :
            return 4;
        case FR_FAKEICMP :
            return 5;
        }

    switch (pass & FR_CMDMASK)
    {
    case FR_PASS :
        return 0;
    case FR_BLOCK :
        return -1;
    case FR_AUTH :
        return -2;
    case FR_ACCOUNT :
        return -3;
    case FR_PREAUTH :
        return -4;
    }
    return 2;
#endif /* _KERNEL */
}


#ifdef  IPFILTER_LOG
/* ------------------------------------------------------------------------ */
/* Function:    fr_dolog                                                    */
/* Returns:     frentry_t* - returns contents of fin_fr (no change made)    */
/* Parameters:  fin(I) - pointer to packet information                      */
/*              passp(IO) - pointer to current/new filter decision (unused) */
/*                                                                          */
/* Checks flags set to see how a packet should be logged, if it is to be    */
/* logged.  Adjust statistics based on its success or not.                  */
/* ------------------------------------------------------------------------ */
frentry_t *fr_dolog(fin, passp)
fr_info_t *fin;
u_32_t *passp;
{
    u_32_t pass;
    int out;
    ipf_stack_t *ifs = fin->fin_ifs;

    out = fin->fin_out;
    pass = *passp;

    if ((ifs->ifs_fr_flags & FF_LOGNOMATCH) && (pass & FR_NOMATCH)) {
        pass |= FF_LOGNOMATCH;
        IPF_BUMP(ifs->ifs_frstats[out].fr_npkl);
        goto logit;
    } else if (((pass & FR_LOGMASK) == FR_LOGP) ||
        (FR_ISPASS(pass) && (ifs->ifs_fr_flags & FF_LOGPASS))) {
        if ((pass & FR_LOGMASK) != FR_LOGP)
            pass |= FF_LOGPASS;
        IPF_BUMP(ifs->ifs_frstats[out].fr_ppkl);
        goto logit;
    } else if (((pass & FR_LOGMASK) == FR_LOGB) ||
           (FR_ISBLOCK(pass) && (ifs->ifs_fr_flags & FF_LOGBLOCK))) {
        if ((pass & FR_LOGMASK) != FR_LOGB)
            pass |= FF_LOGBLOCK;
        IPF_BUMP(ifs->ifs_frstats[out].fr_bpkl);
logit:
        if (ipflog(fin, pass) == -1) {
            IPF_BUMP(ifs->ifs_frstats[out].fr_skip);

            /*
             * If the "or-block" option has been used then
             * block the packet if we failed to log it.
             */
            if ((pass & FR_LOGORBLOCK) &&
                FR_ISPASS(pass)) {
                pass &= ~FR_CMDMASK;
                pass |= FR_BLOCK;
            }
        }
        *passp = pass;
    }

    return fin->fin_fr;
}
#endif /* IPFILTER_LOG */


/* ------------------------------------------------------------------------ */
/* Function:    ipf_cksum                                                   */
/* Returns:     u_short - IP header checksum                                */
/* Parameters:  addr(I) - pointer to start of buffer to checksum            */
/*              len(I)  - length of buffer in bytes                         */
/*                                                                          */
/* Calculate the two's complement 16 bit checksum of the buffer passed.     */
/*                                                                          */
/* N.B.: addr should be 16bit aligned.                                      */
/* ------------------------------------------------------------------------ */
u_short ipf_cksum(addr, len)
u_short *addr;
int len;
{
    u_32_t sum = 0;

    for (sum = 0; len > 1; len -= 2)
        sum += *addr++;

    /* mop up an odd byte, if necessary */
    if (len == 1)
        sum += *(u_char *)addr;

    /*
     * add back carry outs from top 16 bits to low 16 bits
     */
    sum = (sum >> 16) + (sum & 0xffff); /* add hi 16 to low 16 */
    sum += (sum >> 16);         /* add carry */
    return (u_short)(~sum);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_cksum                                                    */
/* Returns:     u_short - layer 4 checksum                                  */
/* Parameters:  m(I  )     - pointer to buffer holding packet               */
/*              ip(I)      - pointer to IP header                           */
/*              l4proto(I) - protocol to caclulate checksum for             */
/*              l4hdr(I)   - pointer to layer 4 header                      */
/*                                                                          */
/* Calculates the TCP checksum for the packet held in "m", using the data   */
/* in the IP header "ip" to seed it.                                        */
/*                                                                          */
/* NB: This function assumes we've pullup'd enough for all of the IP header */
/* and the TCP header.  We also assume that data blocks aren't allocated in */
/* odd sizes.                                                               */
/*                                                                          */
/* Expects ip_len to be in host byte order when called.                     */
/* ------------------------------------------------------------------------ */
u_short fr_cksum(m, ip, l4proto, l4hdr)
mb_t *m;
ip_t *ip;
int l4proto;
void *l4hdr;
{
    u_short *sp, slen, sumsave, l4hlen, *csump;
    u_int sum, sum2;
    int hlen;
#ifdef  USE_INET6
    ip6_t *ip6;
#endif

    csump = NULL;
    sumsave = 0;
    l4hlen = 0;
    sp = NULL;
    slen = 0;
    hlen = 0;
    sum = 0;

    /*
     * Add up IP Header portion
     */
#ifdef  USE_INET6
    if (IP_V(ip) == 4) {
#endif
        hlen = IP_HL(ip) << 2;
        slen = ip->ip_len - hlen;
        sum = htons((u_short)l4proto);
        sum += htons(slen);
        sp = (u_short *)&ip->ip_src;
        sum += *sp++;   /* ip_src */
        sum += *sp++;
        sum += *sp++;   /* ip_dst */
        sum += *sp++;
#ifdef  USE_INET6
    } else if (IP_V(ip) == 6) {
        ip6 = (ip6_t *)ip;
        hlen = sizeof(*ip6);
        slen = ntohs(ip6->ip6_plen);
        sum = htons((u_short)l4proto);
        sum += htons(slen);
        sp = (u_short *)&ip6->ip6_src;
        sum += *sp++;   /* ip6_src */
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;   /* ip6_dst */
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
        sum += *sp++;
    }
#endif

    switch (l4proto)
    {
    case IPPROTO_UDP :
        csump = &((udphdr_t *)l4hdr)->uh_sum;
        l4hlen = sizeof(udphdr_t);
        break;

    case IPPROTO_TCP :
        csump = &((tcphdr_t *)l4hdr)->th_sum;
        l4hlen = sizeof(tcphdr_t);
        break;
    case IPPROTO_ICMP :
        csump = &((icmphdr_t *)l4hdr)->icmp_cksum;
        l4hlen = 4;
        sum = 0;
        break;
    default :
        break;
    }

    if (csump != NULL) {
        sumsave = *csump;
        *csump = 0;
    }

    l4hlen = l4hlen;    /* LINT */

#ifdef  _KERNEL
# ifdef MENTAT
    {
    void *rp = m->b_rptr;

    if ((unsigned char *)ip > m->b_rptr && (unsigned char *)ip < m->b_wptr)
        m->b_rptr = (u_char *)ip;
    sum2 = ip_cksum(m, hlen, sum);  /* hlen == offset */
    m->b_rptr = rp;
    sum2 = (sum2 & 0xffff) + (sum2 >> 16);
    sum2 = ~sum2 & 0xffff;
    }
# else /* MENTAT */
#  if defined(BSD) || defined(sun)
#   if BSD >= 199103
    m->m_data += hlen;
#   else
    m->m_off += hlen;
#   endif
    m->m_len -= hlen;
    sum2 = in_cksum(m, slen);
    m->m_len += hlen;
#   if BSD >= 199103
    m->m_data -= hlen;
#   else
    m->m_off -= hlen;
#   endif
    /*
     * Both sum and sum2 are partial sums, so combine them together.
     */
    sum += ~sum2 & 0xffff;
    while (sum > 0xffff)
        sum = (sum & 0xffff) + (sum >> 16);
    sum2 = ~sum & 0xffff;
#  else /* defined(BSD) || defined(sun) */
{
    union {
        u_char  c[2];
        u_short s;
    } bytes;
    u_short len = ip->ip_len;
#   if defined(__sgi)
    int add;
#   endif

    /*
     * Add up IP Header portion
     */
    if (sp != (u_short *)l4hdr)
        sp = (u_short *)l4hdr;

    switch (l4proto)
    {
    case IPPROTO_UDP :
        sum += *sp++;   /* sport */
        sum += *sp++;   /* dport */
        sum += *sp++;   /* udp length */
        sum += *sp++;   /* checksum */
        break;

    case IPPROTO_TCP :
        sum += *sp++;   /* sport */
        sum += *sp++;   /* dport */
        sum += *sp++;   /* seq */
        sum += *sp++;
        sum += *sp++;   /* ack */
        sum += *sp++;
        sum += *sp++;   /* off */
        sum += *sp++;   /* win */
        sum += *sp++;   /* checksum */
        sum += *sp++;   /* urp */
        break;
    case IPPROTO_ICMP :
        sum = *sp++;    /* type/code */
        sum += *sp++;   /* checksum */
        break;
    }

#   ifdef   __sgi
    /*
     * In case we had to copy the IP & TCP header out of mbufs,
     * skip over the mbuf bits which are the header
     */
    if ((caddr_t)ip != mtod(m, caddr_t)) {
        hlen = (caddr_t)sp - (caddr_t)ip;
        while (hlen) {
            add = MIN(hlen, m->m_len);
            sp = (u_short *)(mtod(m, caddr_t) + add);
            hlen -= add;
            if (add == m->m_len) {
                m = m->m_next;
                if (!hlen) {
                    if (!m)
                        break;
                    sp = mtod(m, u_short *);
                }
                PANIC((!m),("fr_cksum(1): not enough data"));
            }
        }
    }
#   endif

    len -= (l4hlen + hlen);
    if (len <= 0)
        goto nodata;

    while (len > 1) {
        if (((caddr_t)sp - mtod(m, caddr_t)) >= m->m_len) {
            m = m->m_next;
            PANIC((!m),("fr_cksum(2): not enough data"));
            sp = mtod(m, u_short *);
        }
        if (((caddr_t)(sp + 1) - mtod(m, caddr_t)) > m->m_len) {
            bytes.c[0] = *(u_char *)sp;
            m = m->m_next;
            PANIC((!m),("fr_cksum(3): not enough data"));
            sp = mtod(m, u_short *);
            bytes.c[1] = *(u_char *)sp;
            sum += bytes.s;
            sp = (u_short *)((u_char *)sp + 1);
        }
        if ((u_long)sp & 1) {
            bcopy((char *)sp++, (char *)&bytes.s, sizeof(bytes.s));
            sum += bytes.s;
        } else
            sum += *sp++;
        len -= 2;
    }

    if (len != 0)
        sum += ntohs(*(u_char *)sp << 8);
nodata:
    while (sum > 0xffff)
        sum = (sum & 0xffff) + (sum >> 16);
    sum2 = (u_short)(~sum & 0xffff);
}
#  endif /*  defined(BSD) || defined(sun) */
# endif /* MENTAT */
#else /* _KERNEL */
    for (; slen > 1; slen -= 2)
            sum += *sp++;
    if (slen)
        sum += ntohs(*(u_char *)sp << 8);
    while (sum > 0xffff)
        sum = (sum & 0xffff) + (sum >> 16);
    sum2 = (u_short)(~sum & 0xffff);
#endif /* _KERNEL */
    if (csump != NULL)
        *csump = sumsave;
    return sum2;
}


#if defined(_KERNEL) && ( ((BSD < 199103) && !defined(MENTAT)) || \
    defined(__sgi) ) && !defined(linux) && !defined(_AIX51)
/*
 * Copyright (c) 1982, 1986, 1988, 1991, 1993
 *  The Regents of the University of California.  All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 * 3. Neither the name of the University nor the names of its contributors
 *    may be used to endorse or promote products derived from this software
 *    without specific prior written permission.
 *
 * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 *
 *  @(#)uipc_mbuf.c 8.2 (Berkeley) 1/4/94
 * $Id: fil.c,v 2.243.2.64 2005/08/13 05:19:59 darrenr Exp $
 */
/*
 * Copy data from an mbuf chain starting "off" bytes from the beginning,
 * continuing for "len" bytes, into the indicated buffer.
 */
void
m_copydata(m, off, len, cp)
    mb_t *m;
    int off;
    int len;
    caddr_t cp;
{
    unsigned count;

    if (off < 0 || len < 0)
        panic("m_copydata");
    while (off > 0) {
        if (m == 0)
            panic("m_copydata");
        if (off < m->m_len)
            break;
        off -= m->m_len;
        m = m->m_next;
    }
    while (len > 0) {
        if (m == 0)
            panic("m_copydata");
        count = MIN(m->m_len - off, len);
        bcopy(mtod(m, caddr_t) + off, cp, count);
        len -= count;
        cp += count;
        off = 0;
        m = m->m_next;
    }
}


/*
 * Copy data from a buffer back into the indicated mbuf chain,
 * starting "off" bytes from the beginning, extending the mbuf
 * chain if necessary.
 */
void
m_copyback(m0, off, len, cp)
    struct  mbuf *m0;
    int off;
    int len;
    caddr_t cp;
{
    int mlen;
    struct mbuf *m = m0, *n;
    int totlen = 0;

    if (m0 == 0)
        return;
    while (off > (mlen = m->m_len)) {
        off -= mlen;
        totlen += mlen;
        if (m->m_next == 0) {
            n = m_getclr(M_DONTWAIT, m->m_type);
            if (n == 0)
                goto out;
            n->m_len = min(MLEN, len + off);
            m->m_next = n;
        }
        m = m->m_next;
    }
    while (len > 0) {
        mlen = min(m->m_len - off, len);
        bcopy(cp, off + mtod(m, caddr_t), (unsigned)mlen);
        cp += mlen;
        len -= mlen;
        mlen += off;
        off = 0;
        totlen += mlen;
        if (len == 0)
            break;
        if (m->m_next == 0) {
            n = m_get(M_DONTWAIT, m->m_type);
            if (n == 0)
                break;
            n->m_len = min(MLEN, len);
            m->m_next = n;
        }
        m = m->m_next;
    }
out:
#if 0
    if (((m = m0)->m_flags & M_PKTHDR) && (m->m_pkthdr.len < totlen))
        m->m_pkthdr.len = totlen;
#endif
    return;
}
#endif /* (_KERNEL) && ( ((BSD < 199103) && !MENTAT) || __sgi) */


/* ------------------------------------------------------------------------ */
/* Function:    fr_findgroup                                                */
/* Returns:     frgroup_t * - NULL = group not found, else pointer to group */
/* Parameters:  group(I) - group name to search for                         */
/*              unit(I)  - device to which this group belongs               */
/*              set(I)   - which set of rules (inactive/inactive) this is   */
/*              fgpp(O)  - pointer to place to store pointer to the pointer */
/*                         to where to add the next (last) group or where   */
/*                         to delete group from.                            */
/*                                                                          */
/* Search amongst the defined groups for a particular group number.         */
/* ------------------------------------------------------------------------ */
frgroup_t *fr_findgroup(group, unit, set, fgpp, ifs)
char *group;
minor_t unit;
int set;
frgroup_t ***fgpp;
ipf_stack_t *ifs;
{
    frgroup_t *fg, **fgp;

    /*
     * Which list of groups to search in is dependent on which list of
     * rules are being operated on.
     */
    fgp = &ifs->ifs_ipfgroups[unit][set];

    while ((fg = *fgp) != NULL) {
        if (strncmp(group, fg->fg_name, FR_GROUPLEN) == 0)
            break;
        else
            fgp = &fg->fg_next;
    }
    if (fgpp != NULL)
        *fgpp = fgp;
    return fg;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_addgroup                                                 */
/* Returns:     frgroup_t * - NULL == did not create group,                 */
/*                            != NULL == pointer to the group               */
/* Parameters:  num(I)   - group number to add                              */
/*              head(I)  - rule pointer that is using this as the head      */
/*              flags(I) - rule flags which describe the type of rule it is */
/*              unit(I)  - device to which this group will belong to        */
/*              set(I)   - which set of rules (inactive/inactive) this is   */
/* Write Locks: ipf_mutex                                                   */
/*                                                                          */
/* Add a new group head, or if it already exists, increase the reference    */
/* count to it.                                                             */
/* ------------------------------------------------------------------------ */
frgroup_t *fr_addgroup(group, head, flags, unit, set, ifs)
char *group;
void *head;
u_32_t flags;
minor_t unit;
int set;
ipf_stack_t *ifs;
{
    frgroup_t *fg, **fgp;
    u_32_t gflags;

    if (group == NULL)
        return NULL;

    if (unit == IPL_LOGIPF && *group == '\0')
        return NULL;

    fgp = NULL;
    gflags = flags & FR_INOUT;

    fg = fr_findgroup(group, unit, set, &fgp, ifs);
    if (fg != NULL) {
        if (fg->fg_flags == 0)
            fg->fg_flags = gflags;
        else if (gflags != fg->fg_flags)
            return NULL;
        fg->fg_ref++;
        return fg;
    }
    KMALLOC(fg, frgroup_t *);
    if (fg != NULL) {
        fg->fg_head = head;
        fg->fg_start = NULL;
        fg->fg_next = *fgp;
        bcopy(group, fg->fg_name, FR_GROUPLEN);
        fg->fg_flags = gflags;
        fg->fg_ref = 1;
        *fgp = fg;
    }
    return fg;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_delgroup                                                 */
/* Returns:     Nil                                                         */
/* Parameters:  group(I) - group name to delete                             */
/*              unit(I)  - device to which this group belongs               */
/*              set(I)   - which set of rules (inactive/inactive) this is   */
/* Write Locks: ipf_mutex                                                   */
/*                                                                          */
/* Attempt to delete a group head.                                          */
/* Only do this when its reference count reaches 0.                         */
/* ------------------------------------------------------------------------ */
void fr_delgroup(group, unit, set, ifs)
char *group;
minor_t unit;
int set;
ipf_stack_t *ifs;
{
    frgroup_t *fg, **fgp;

    fg = fr_findgroup(group, unit, set, &fgp, ifs);
    if (fg == NULL)
        return;

    fg->fg_ref--;
    if (fg->fg_ref == 0) {
        *fgp = fg->fg_next;
        KFREE(fg);
    }
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_getrulen                                                 */
/* Returns:     frentry_t * - NULL == not found, else pointer to rule n     */
/* Parameters:  unit(I)  - device for which to count the rule's number      */
/*              flags(I) - which set of rules to find the rule in           */
/*              group(I) - group name                                       */
/*              n(I)     - rule number to find                              */
/*                                                                          */
/* Find rule # n in group # g and return a pointer to it.  Return NULl if   */
/* group # g doesn't exist or there are less than n rules in the group.     */
/* ------------------------------------------------------------------------ */
frentry_t *fr_getrulen(unit, group, n, ifs)
int unit;
char *group;
u_32_t n;
ipf_stack_t *ifs;
{
    frentry_t *fr;
    frgroup_t *fg;

    fg = fr_findgroup(group, unit, ifs->ifs_fr_active, NULL, ifs);
    if (fg == NULL)
        return NULL;
    for (fr = fg->fg_head; fr && n; fr = fr->fr_next, n--)
        ;
    if (n != 0)
        return NULL;
    return fr;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_rulen                                                    */
/* Returns:     int - >= 0 - rule number, -1 == search failed               */
/* Parameters:  unit(I) - device for which to count the rule's number       */
/*              fr(I)   - pointer to rule to match                          */
/*                                                                          */
/* Return the number for a rule on a specific filtering device.             */
/* ------------------------------------------------------------------------ */
int fr_rulen(unit, fr, ifs)
int unit;
frentry_t *fr;
ipf_stack_t *ifs;
{
    frentry_t *fh;
    frgroup_t *fg;
    u_32_t n = 0;

    if (fr == NULL)
        return -1;
    fg = fr_findgroup(fr->fr_group, unit, ifs->ifs_fr_active, NULL, ifs);
    if (fg == NULL)
        return -1;
    for (fh = fg->fg_head; fh; n++, fh = fh->fr_next)
        if (fh == fr)
            break;
    if (fh == NULL)
        return -1;
    return n;
}


/* ------------------------------------------------------------------------ */
/* Function:    frflushlist                                                 */
/* Returns:     int - >= 0 - number of flushed rules                        */
/* Parameters:  set(I)   - which set of rules (inactive/inactive) this is   */
/*              unit(I)  - device for which to flush rules                  */
/*              flags(I) - which set of rules to flush                      */
/*              nfreedp(O) - pointer to int where flush count is stored     */
/*              listp(I)   - pointer to list to flush pointer               */
/* Write Locks: ipf_mutex                                                   */
/*                                                                          */
/* Recursively flush rules from the list, descending groups as they are     */
/* encountered.  if a rule is the head of a group and it has lost all its   */
/* group members, then also delete the group reference.  nfreedp is needed  */
/* to store the accumulating count of rules removed, whereas the returned   */
/* value is just the number removed from the current list.  The latter is   */
/* needed to correctly adjust reference counts on rules that define groups. */
/*                                                                          */
/* NOTE: Rules not loaded from user space cannot be flushed.                */
/* ------------------------------------------------------------------------ */
static int frflushlist(set, unit, nfreedp, listp, ifs)
int set;
minor_t unit;
int *nfreedp;
frentry_t **listp;
ipf_stack_t *ifs;
{
    int freed = 0;
    frentry_t *fp;

    while ((fp = *listp) != NULL) {
        if ((fp->fr_type & FR_T_BUILTIN) ||
            !(fp->fr_flags & FR_COPIED)) {
            listp = &fp->fr_next;
            continue;
        }
        *listp = fp->fr_next;
        if (fp->fr_grp != NULL) {
            (void) frflushlist(set, unit, nfreedp, fp->fr_grp, ifs);
        }

        if (fp->fr_grhead != NULL) {
            fr_delgroup(fp->fr_grhead, unit, set, ifs);
            *fp->fr_grhead = '\0';
        }

        ASSERT(fp->fr_ref > 0);
        fp->fr_next = NULL;
        if (fr_derefrule(&fp, ifs) == 0)
            freed++;
    }
    *nfreedp += freed;
    return freed;
}


/* ------------------------------------------------------------------------ */
/* Function:    frflush                                                     */
/* Returns:     int - >= 0 - number of flushed rules                        */
/* Parameters:  unit(I)  - device for which to flush rules                  */
/*              flags(I) - which set of rules to flush                      */
/*                                                                          */
/* Calls flushlist() for all filter rules (accounting, firewall - both IPv4 */
/* and IPv6) as defined by the value of flags.                              */
/* ------------------------------------------------------------------------ */
int frflush(unit, proto, flags, ifs)
minor_t unit;
int proto, flags;
ipf_stack_t *ifs;
{
    int flushed = 0, set;

    WRITE_ENTER(&ifs->ifs_ipf_mutex);
    bzero((char *)ifs->ifs_frcache, sizeof (ifs->ifs_frcache));

    set = ifs->ifs_fr_active;
    if ((flags & FR_INACTIVE) == FR_INACTIVE)
        set = 1 - set;

    if (flags & FR_OUTQUE) {
        if (proto == 0 || proto == 6) {
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipfilter6[1][set], ifs);
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipacct6[1][set], ifs);
        }
        if (proto == 0 || proto == 4) {
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipfilter[1][set], ifs);
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipacct[1][set], ifs);
        }
    }
    if (flags & FR_INQUE) {
        if (proto == 0 || proto == 6) {
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipfilter6[0][set], ifs);
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipacct6[0][set], ifs);
        }
        if (proto == 0 || proto == 4) {
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipfilter[0][set], ifs);
            (void) frflushlist(set, unit,
                &flushed, &ifs->ifs_ipacct[0][set], ifs);
        }
    }
    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

    if (unit == IPL_LOGIPF) {
        int tmp;

        tmp = frflush(IPL_LOGCOUNT, proto, flags, ifs);
        if (tmp >= 0)
            flushed += tmp;
    }
    return flushed;
}


/* ------------------------------------------------------------------------ */
/* Function:    memstr                                                      */
/* Returns:     char *  - NULL if failed, != NULL pointer to matching bytes */
/* Parameters:  src(I)  - pointer to byte sequence to match                 */
/*              dst(I)  - pointer to byte sequence to search                */
/*              slen(I) - match length                                      */
/*              dlen(I) - length available to search in                     */
/*                                                                          */
/* Search dst for a sequence of bytes matching those at src and extend for  */
/* slen bytes.                                                              */
/* ------------------------------------------------------------------------ */
char *memstr(src, dst, slen, dlen)
char *src, *dst;
int slen, dlen;
{
    char *s = NULL;

    while (dlen >= slen) {
        if (bcmp(src, dst, slen) == 0) {
            s = dst;
            break;
        }
        dst++;
        dlen--;
    }
    return s;
}
/* ------------------------------------------------------------------------ */
/* Function:    fr_fixskip                                                  */
/* Returns:     Nil                                                         */
/* Parameters:  listp(IO)    - pointer to start of list with skip rule      */
/*              rp(I)        - rule added/removed with skip in it.          */
/*              addremove(I) - adjustment (-1/+1) to make to skip count,    */
/*                             depending on whether a rule was just added   */
/*                             or removed.                                  */
/*                                                                          */
/* Adjust all the rules in a list which would have skip'd past the position */
/* where we are inserting to skip to the right place given the change.      */
/* ------------------------------------------------------------------------ */
void fr_fixskip(listp, rp, addremove)
frentry_t **listp, *rp;
int addremove;
{
    int rules, rn;
    frentry_t *fp;

    rules = 0;
    for (fp = *listp; (fp != NULL) && (fp != rp); fp = fp->fr_next)
        rules++;

    if (!fp)
        return;

    for (rn = 0, fp = *listp; fp && (fp != rp); fp = fp->fr_next, rn++)
        if (FR_ISSKIP(fp->fr_flags) && (rn + fp->fr_arg >= rules))
            fp->fr_arg += addremove;
}


#ifdef  _KERNEL
/* ------------------------------------------------------------------------ */
/* Function:    count4bits                                                  */
/* Returns:     int - >= 0 - number of consecutive bits in input            */
/* Parameters:  ip(I) - 32bit IP address                                    */
/*                                                                          */
/* IPv4 ONLY                                                                */
/* count consecutive 1's in bit mask.  If the mask generated by counting    */
/* consecutive 1's is different to that passed, return -1, else return #    */
/* of bits.                                                                 */
/* ------------------------------------------------------------------------ */
int count4bits(ip)
u_32_t  ip;
{
    u_32_t  ipn;
    int cnt = 0, i, j;

    ip = ipn = ntohl(ip);
    for (i = 32; i; i--, ipn *= 2)
        if (ipn & 0x80000000)
            cnt++;
        else
            break;
    ipn = 0;
    for (i = 32, j = cnt; i; i--, j--) {
        ipn *= 2;
        if (j > 0)
            ipn++;
    }
    if (ipn == ip)
        return cnt;
    return -1;
}


#ifdef USE_INET6
/* ------------------------------------------------------------------------ */
/* Function:    count6bits                                                  */
/* Returns:     int - >= 0 - number of consecutive bits in input            */
/* Parameters:  msk(I) - pointer to start of IPv6 bitmask                   */
/*                                                                          */
/* IPv6 ONLY                                                                */
/* count consecutive 1's in bit mask.                                       */
/* ------------------------------------------------------------------------ */
int count6bits(msk)
u_32_t *msk;
{
    int i = 0, k;
    u_32_t j;

    for (k = 3; k >= 0; k--)
        if (msk[k] == 0xffffffff)
            i += 32;
        else {
            for (j = msk[k]; j; j <<= 1)
                if (j & 0x80000000)
                    i++;
        }
    return i;
}
# endif
#endif /* _KERNEL */


/* ------------------------------------------------------------------------ */
/* Function:    fr_ifsync                                                   */
/* Returns:     void *    - new interface identifier                        */
/* Parameters:  action(I)  - type of synchronisation to do                  */
/*              v(I)       - IP version being sync'd (v4 or v6)             */
/*              newifp(I)  - interface identifier being introduced/removed  */
/*              oldifp(I)  - interface identifier in a filter rule          */
/*              newname(I) - name associated with newifp interface          */
/*              oldname(I) - name associated with oldifp interface          */
/*      ifs       - pointer to IPF stack instance           */
/*                                                                          */
/* This function returns what the new value for "oldifp" should be for its  */
/* caller.  In some cases it will not change, in some it will.              */
/* action == IPFSYNC_RESYNC                                                 */
/*   a new value for oldifp will always be looked up, according to oldname, */
/*   the values of newname and newifp are ignored.                          */
/* action == IPFSYNC_NEWIFP                                                 */
/*   if oldname matches newname then we are doing a sync for the matching   */
/*   interface, so we return newifp to be used in place of oldifp.  If the  */
/*   the names don't match, just return oldifp.                             */
/* action == IPFSYNC_OLDIFP                                                 */
/*   if oldifp matches newifp then we are are doing a sync to remove any    */
/*   references to oldifp, so we return "-1".                               */
/* -----                                    */
/* NOTE:                                    */
/* This function processes NIC event from PF_HOOKS. The action parameter    */
/* is set in ipf_nic_event_v4()/ipf_nic_event_v6() function. There is       */
/* one single switch statement() in ipf_nic_event_vx() function, which      */
/* translates the HOOK event type to action parameter passed to fr_ifsync.  */
/* The translation table looks as follows:                  */
/*  event       | action                        */
/*  ----------------+-------------                      */
/*  NE_PLUMB    | IPFSYNC_NEWIFP                    */
/*  NE_UNPLUMB  | IPFSYNC_OLDIFP                    */
/*    NE_ADDRESS_CHANGE | IPFSYNC_RESYNC                    */
/*                                      */
/* The oldname and oldifp parameters are taken from IPF entry (rule, state  */
/* table entry, NAT table entry, fragment ...). The newname and newifp      */
/* parameters come from hook event data, parameters are taken from event    */
/* in ipf_nic_event_vx() functions. Any time NIC changes, the IPF is        */
/* notified by hook function.                           */
/*                                      */
/* We get NE_UNPLUMB event from PF_HOOKS even if someone coincidently tries */
/* to plumb the interface, which is already plumbed. In such case we always */
/* get the event from PF_HOOKS as follows:                  */
/*  event:  NE_PLUMB                            */
/*  NIC:    0x0                             */
/* ------------------------------------------------------------------------ */
static void *fr_ifsync(action, v, newname, oldname, newifp, oldifp, ifs)
int action, v;
char *newname, *oldname;
void *newifp, *oldifp;
ipf_stack_t *ifs;
{
    void *rval = oldifp;

    switch (action)
    {
    case IPFSYNC_RESYNC :
        if (oldname[0] != '\0') {
            rval = fr_resolvenic(oldname, v, ifs);
        }
        break;
    case IPFSYNC_NEWIFP :
        if (!strncmp(newname, oldname, LIFNAMSIZ))
            rval = newifp;
        break;
    case IPFSYNC_OLDIFP :
        /*
         * If interface gets unplumbed it must be invalidated, which
         * means set all existing references to the interface to -1.
         * We don't want to invalidate references for wildcard
         * (unbound) rules (entries).
         */
        if (newifp == oldifp)
            rval = (oldifp) ? (void *)-1 : NULL;
        break;
    }

    return rval;
}


/* ------------------------------------------------------------------------ */
/* Function:    frsynclist                                                  */
/* Returns:     void                                                        */
/* Parameters:  action(I) - type of synchronisation to do                   */
/*              v(I)      - IP version being sync'd (v4 or v6)              */
/*              ifp(I)    - interface identifier associated with action     */
/*              ifname(I) - name associated with ifp parameter              */
/*              fr(I)     - pointer to filter rule                          */
/*      ifs       - pointer to IPF stack instance           */
/* Write Locks: ipf_mutex                                                   */
/*                                                                          */
/* Walk through a list of filter rules and resolve any interface names into */
/* pointers.  Where dynamic addresses are used, also update the IP address  */
/* used in the rule.  The interface pointer is used to limit the lookups to */
/* a specific set of matching names if it is non-NULL.                      */
/* ------------------------------------------------------------------------ */
static void frsynclist(action, v, ifp, ifname, fr, ifs)
int action, v;
void *ifp;
char *ifname;
frentry_t *fr;
ipf_stack_t *ifs;
{
    frdest_t *fdp;
    int rv, i;

    for (; fr; fr = fr->fr_next) {
        rv = fr->fr_v;
        if (v != 0 && v != rv)
            continue;

        /*
         * Lookup all the interface names that are part of the rule.
         */
        for (i = 0; i < 4; i++) {
            fr->fr_ifas[i] = fr_ifsync(action, rv, ifname,
                           fr->fr_ifnames[i],
                           ifp, fr->fr_ifas[i],
                           ifs);
        }

        fdp = &fr->fr_tifs[0];
        fdp->fd_ifp = fr_ifsync(action, rv, ifname, fdp->fd_ifname,
                       ifp, fdp->fd_ifp, ifs);

        fdp = &fr->fr_tifs[1];
        fdp->fd_ifp = fr_ifsync(action, rv, ifname, fdp->fd_ifname,
                       ifp, fdp->fd_ifp, ifs);

        fdp = &fr->fr_dif;
        fdp->fd_ifp = fr_ifsync(action, rv, ifname, fdp->fd_ifname,
                       ifp, fdp->fd_ifp, ifs);

        if (action != IPFSYNC_RESYNC)
            continue;

        if (fr->fr_type == FR_T_IPF) {
            if (fr->fr_satype != FRI_NORMAL &&
                fr->fr_satype != FRI_LOOKUP) {
                (void)fr_ifpaddr(rv, fr->fr_satype,
                         fr->fr_ifas[fr->fr_sifpidx],
                         &fr->fr_src, &fr->fr_smsk,
                         ifs);
            }
            if (fr->fr_datype != FRI_NORMAL &&
                fr->fr_datype != FRI_LOOKUP) {
                (void)fr_ifpaddr(rv, fr->fr_datype,
                         fr->fr_ifas[fr->fr_difpidx],
                         &fr->fr_dst, &fr->fr_dmsk,
                         ifs);
            }
        }

#ifdef  IPFILTER_LOOKUP
        if (fr->fr_type == FR_T_IPF && fr->fr_satype == FRI_LOOKUP &&
            fr->fr_srcptr == NULL) {
            fr->fr_srcptr = fr_resolvelookup(fr->fr_srctype,
                             fr->fr_srcnum,
                             &fr->fr_srcfunc, ifs);
        }
        if (fr->fr_type == FR_T_IPF && fr->fr_datype == FRI_LOOKUP &&
            fr->fr_dstptr == NULL) {
            fr->fr_dstptr = fr_resolvelookup(fr->fr_dsttype,
                             fr->fr_dstnum,
                             &fr->fr_dstfunc, ifs);
        }
#endif
    }
}


#ifdef  _KERNEL
/* ------------------------------------------------------------------------ */
/* Function:    frsync                                                      */
/* Returns:     void                                                        */
/* Parameters:  action(I) - type of synchronisation to do                   */
/*              v(I)      - IP version being sync'd (v4 or v6)              */
/*              ifp(I)    - interface identifier associated with action     */
/*              name(I)   - name associated with ifp parameter              */
/*                                                                          */
/* frsync() is called when we suspect that the interface list or            */
/* information about interfaces (like IP#) has changed.  Go through all     */
/* filter rules, NAT entries and the state table and check if anything      */
/* needs to be changed/updated.                                             */
/* With the filtering hooks added to Solaris, we needed to change the manner*/
/* in which this was done to support three different types of sync:         */
/* - complete resync of all interface name/identifiers                      */
/* - new interface being announced with its name and identifier             */
/* - interface removal being announced by only its identifier               */
/* ------------------------------------------------------------------------ */
void frsync(action, v, ifp, name, ifs)
int action, v;
void *ifp;
char *name;
ipf_stack_t *ifs;
{
    int i;

    WRITE_ENTER(&ifs->ifs_ipf_mutex);
    frsynclist(action, v, ifp, name, ifs->ifs_ipacct[0][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipacct[1][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipfilter[0][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipfilter[1][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipacct6[0][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipacct6[1][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipfilter6[0][ifs->ifs_fr_active], ifs);
    frsynclist(action, v, ifp, name, ifs->ifs_ipfilter6[1][ifs->ifs_fr_active], ifs);

    for (i = 0; i < IPL_LOGSIZE; i++) {
        frgroup_t *g;

        for (g = ifs->ifs_ipfgroups[i][0]; g != NULL; g = g->fg_next)
            frsynclist(action, v, ifp, name, g->fg_start, ifs);
        for (g = ifs->ifs_ipfgroups[i][1]; g != NULL; g = g->fg_next)
            frsynclist(action, v, ifp, name, g->fg_start, ifs);
    }
    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
}

#if SOLARIS2 >= 10
/* ------------------------------------------------------------------------ */
/* Function:    fr_syncindex                            */
/* Returns:     void                                */
/* Parameters:  rules     - list of rules to be sync'd              */
/*      ifp   - interface, which is being sync'd            */
/*      newifp    - new ifindex value for interface         */
/*                                                                          */
/* Function updates all NIC indecis, which match ifp, in every rule. Every  */
/* NIC index matching ifp, will be updated to newifp.               */
/* ------------------------------------------------------------------------ */
static void fr_syncindex(rules, ifp, newifp)
frentry_t *rules;
void *ifp;
void *newifp;
{
    int i;
    frentry_t *fr;

    for (fr = rules; fr != NULL; fr = fr->fr_next) {
        /*
         * Lookup all the interface names that are part of the rule.
         */
        for (i = 0; i < 4; i++)
            if (fr->fr_ifas[i] == ifp)
                fr->fr_ifas[i] = newifp;

        for (i = 0; i < 2; i++) {
            if (fr->fr_tifs[i].fd_ifp == ifp)
                fr->fr_tifs[i].fd_ifp = newifp;
        }

        if (fr->fr_dif.fd_ifp == ifp)
            fr->fr_dif.fd_ifp = newifp;
    }
}

/* ------------------------------------------------------------------------ */
/* Function:    fr_ifindexsync                          */
/* Returns:     void                                */
/* Parameters:  ifp   - interface, which is being sync'd            */
/*      newifp    - new ifindex value for interface         */
/*              ifs   - IPF's stack                     */
/*                                                                          */
/* Function assumes ipf_mutex is locked exclusively.                */
/*                                      */
/* Function updates the NIC references in rules with new interfaces index   */
/* (newifp). Function must process active lists:                */
/*  with accounting rules (IPv6 and IPv4)                   */
/*  with inbound rules (IPv6 and IPv4)                  */
/*  with outbound rules (IPv6 and IPv4)                 */
/* Function also has to take care of rule groups.               */
/*                                                                          */
/* NOTE: The ipf_mutex is grabbed exclusively by caller (which is always    */
/* nic_event_hook). The hook function also updates state entries, NAT rules */
/* and NAT entries. We want to do all these update atomically to keep the   */
/* NIC references consistent. The ipf_mutex will synchronize event with     */
/* fr_check(), which processes packets, so no packet will enter fr_check(), */
/* while NIC references will be synchronized.                   */
/* ------------------------------------------------------------------------ */
void fr_ifindexsync(ifp, newifp, ifs)
void *ifp;
void *newifp;
ipf_stack_t *ifs;
{
    unsigned int    i;
    frentry_t *rule_lists[8];
    unsigned int    rules = sizeof (rule_lists) / sizeof (frentry_t *);

    rule_lists[0] = ifs->ifs_ipacct[0][ifs->ifs_fr_active];
    rule_lists[1] = ifs->ifs_ipacct[1][ifs->ifs_fr_active];
    rule_lists[2] = ifs->ifs_ipfilter[0][ifs->ifs_fr_active];
    rule_lists[3] = ifs->ifs_ipfilter[1][ifs->ifs_fr_active];
    rule_lists[4] = ifs->ifs_ipacct6[0][ifs->ifs_fr_active];
    rule_lists[5] = ifs->ifs_ipacct6[1][ifs->ifs_fr_active];
    rule_lists[6] = ifs->ifs_ipfilter6[0][ifs->ifs_fr_active];
    rule_lists[7] = ifs->ifs_ipfilter6[1][ifs->ifs_fr_active];

    for (i = 0; i < rules; i++) {
        fr_syncindex(rule_lists[i], ifp, newifp);
    }

    /*
     * Update rule groups.
     */
    for (i = 0; i < IPL_LOGSIZE; i++) {
        frgroup_t *g;

        for (g = ifs->ifs_ipfgroups[i][0]; g != NULL; g = g->fg_next)
            fr_syncindex(g->fg_start, ifp, newifp);
        for (g = ifs->ifs_ipfgroups[i][1]; g != NULL; g = g->fg_next)
            fr_syncindex(g->fg_start, ifp, newifp);
    }
}
#endif

/*
 * In the functions below, bcopy() is called because the pointer being
 * copied _from_ in this instance is a pointer to a char buf (which could
 * end up being unaligned) and on the kernel's local stack.
 */
/* ------------------------------------------------------------------------ */
/* Function:    copyinptr                                                   */
/* Returns:     int - 0 = success, else failure                             */
/* Parameters:  src(I)  - pointer to the source address                     */
/*              dst(I)  - destination address                               */
/*              size(I) - number of bytes to copy                           */
/*                                                                          */
/* Copy a block of data in from user space, given a pointer to the pointer  */
/* to start copying from (src) and a pointer to where to store it (dst).    */
/* NB: src - pointer to user space pointer, dst - kernel space pointer      */
/* ------------------------------------------------------------------------ */
int copyinptr(src, dst, size)
void *src, *dst;
size_t size;
{
    caddr_t ca;
    int err;

# if SOLARIS
    err = COPYIN(src, (caddr_t)&ca, sizeof(ca));
    if (err != 0)
        return err;
# else
    bcopy(src, (caddr_t)&ca, sizeof(ca));
# endif
    err = COPYIN(ca, dst, size);
    return err;
}


/* ------------------------------------------------------------------------ */
/* Function:    copyoutptr                                                  */
/* Returns:     int - 0 = success, else failure                             */
/* Parameters:  src(I)  - pointer to the source address                     */
/*              dst(I)  - destination address                               */
/*              size(I) - number of bytes to copy                           */
/*                                                                          */
/* Copy a block of data out to user space, given a pointer to the pointer   */
/* to start copying from (src) and a pointer to where to store it (dst).    */
/* NB: src - kernel space pointer, dst - pointer to user space pointer.     */
/* ------------------------------------------------------------------------ */
int copyoutptr(src, dst, size)
void *src, *dst;
size_t size;
{
    caddr_t ca;
    int err;

# if SOLARIS
    err = COPYIN(dst, (caddr_t)&ca, sizeof(ca));
    if (err != 0)
        return err;
# else
    bcopy(dst, (caddr_t)&ca, sizeof(ca));
# endif
    err = COPYOUT(src, ca, size);
    return err;
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    fr_lock                                                     */
/* Returns: int - 0 = success, else error                   */
/* Parameters:  data(I)  - pointer to lock value to set                     */
/*              lockp(O) - pointer to location to store old lock value      */
/*                                                                          */
/* Get the new value for the lock integer, set it and return the old value  */
/* in *lockp.                                                               */
/* ------------------------------------------------------------------------ */
int fr_lock(data, lockp)
caddr_t data;
int *lockp;
{
    int arg, err;

    err = BCOPYIN(data, (caddr_t)&arg, sizeof(arg));
    if (err != 0)
        return (EFAULT);
    err = BCOPYOUT((caddr_t)lockp, data, sizeof(*lockp));
    if (err != 0)
        return (EFAULT);
    *lockp = arg;
    return (0);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_getstat                                                  */
/* Returns:     Nil                                                         */
/* Parameters:  fiop(I)  - pointer to ipfilter stats structure              */
/*                                                                          */
/* Stores a copy of current pointers, counters, etc, in the friostat        */
/* structure.                                                               */
/* ------------------------------------------------------------------------ */
void fr_getstat(fiop, ifs)
friostat_t *fiop;
ipf_stack_t *ifs;
{
    int i, j;

    bcopy((char *)&ifs->ifs_frstats, (char *)fiop->f_st,
        sizeof(filterstats_t) * 2);
    fiop->f_locks[IPL_LOGSTATE] = ifs->ifs_fr_state_lock;
    fiop->f_locks[IPL_LOGNAT] = ifs->ifs_fr_nat_lock;
    fiop->f_locks[IPL_LOGIPF] = ifs->ifs_fr_frag_lock;
    fiop->f_locks[IPL_LOGAUTH] = ifs->ifs_fr_auth_lock;

    for (i = 0; i < 2; i++)
        for (j = 0; j < 2; j++) {
            fiop->f_ipf[i][j] = ifs->ifs_ipfilter[i][j];
            fiop->f_acct[i][j] = ifs->ifs_ipacct[i][j];
            fiop->f_ipf6[i][j] = ifs->ifs_ipfilter6[i][j];
            fiop->f_acct6[i][j] = ifs->ifs_ipacct6[i][j];
        }

    fiop->f_ticks = ifs->ifs_fr_ticks;
    fiop->f_active = ifs->ifs_fr_active;
    fiop->f_froute[0] = ifs->ifs_fr_frouteok[0];
    fiop->f_froute[1] = ifs->ifs_fr_frouteok[1];

    fiop->f_running = ifs->ifs_fr_running;
    for (i = 0; i < IPL_LOGSIZE; i++) {
        fiop->f_groups[i][0] = ifs->ifs_ipfgroups[i][0];
        fiop->f_groups[i][1] = ifs->ifs_ipfgroups[i][1];
    }
#ifdef  IPFILTER_LOG
    fiop->f_logging = 1;
#else
    fiop->f_logging = 0;
#endif
    fiop->f_defpass = ifs->ifs_fr_pass;
    fiop->f_features = fr_features;
    (void) strncpy(fiop->f_version, ipfilter_version,
               sizeof(fiop->f_version));
}


#ifdef  USE_INET6
int icmptoicmp6types[ICMP_MAXTYPE+1] = {
    ICMP6_ECHO_REPLY,   /* 0: ICMP_ECHOREPLY */
    -1,         /* 1: UNUSED */
    -1,         /* 2: UNUSED */
    ICMP6_DST_UNREACH,  /* 3: ICMP_UNREACH */
    -1,         /* 4: ICMP_SOURCEQUENCH */
    ND_REDIRECT,        /* 5: ICMP_REDIRECT */
    -1,         /* 6: UNUSED */
    -1,         /* 7: UNUSED */
    ICMP6_ECHO_REQUEST, /* 8: ICMP_ECHO */
    -1,         /* 9: UNUSED */
    -1,         /* 10: UNUSED */
    ICMP6_TIME_EXCEEDED,    /* 11: ICMP_TIMXCEED */
    ICMP6_PARAM_PROB,   /* 12: ICMP_PARAMPROB */
    -1,         /* 13: ICMP_TSTAMP */
    -1,         /* 14: ICMP_TSTAMPREPLY */
    -1,         /* 15: ICMP_IREQ */
    -1,         /* 16: ICMP_IREQREPLY */
    -1,         /* 17: ICMP_MASKREQ */
    -1,         /* 18: ICMP_MASKREPLY */
};


int icmptoicmp6unreach[ICMP_MAX_UNREACH] = {
    ICMP6_DST_UNREACH_ADDR,     /* 0: ICMP_UNREACH_NET */
    ICMP6_DST_UNREACH_ADDR,     /* 1: ICMP_UNREACH_HOST */
    -1,             /* 2: ICMP_UNREACH_PROTOCOL */
    ICMP6_DST_UNREACH_NOPORT,   /* 3: ICMP_UNREACH_PORT */
    -1,             /* 4: ICMP_UNREACH_NEEDFRAG */
    ICMP6_DST_UNREACH_NOTNEIGHBOR,  /* 5: ICMP_UNREACH_SRCFAIL */
    ICMP6_DST_UNREACH_ADDR,     /* 6: ICMP_UNREACH_NET_UNKNOWN */
    ICMP6_DST_UNREACH_ADDR,     /* 7: ICMP_UNREACH_HOST_UNKNOWN */
    -1,             /* 8: ICMP_UNREACH_ISOLATED */
    ICMP6_DST_UNREACH_ADMIN,    /* 9: ICMP_UNREACH_NET_PROHIB */
    ICMP6_DST_UNREACH_ADMIN,    /* 10: ICMP_UNREACH_HOST_PROHIB */
    -1,             /* 11: ICMP_UNREACH_TOSNET */
    -1,             /* 12: ICMP_UNREACH_TOSHOST */
    ICMP6_DST_UNREACH_ADMIN,    /* 13: ICMP_UNREACH_ADMIN_PROHIBIT */
};
int icmpreplytype6[ICMP6_MAXTYPE + 1];
#endif

int icmpreplytype4[ICMP_MAXTYPE + 1];


/* ------------------------------------------------------------------------ */
/* Function:    fr_matchicmpqueryreply                                      */
/* Returns:     int - 1 if "icmp" is a valid reply to "ic" else 0.          */
/* Parameters:  v(I)    - IP protocol version (4 or 6)                      */
/*              ic(I)   - ICMP information                                  */
/*              icmp(I) - ICMP packet header                                */
/*              rev(I)  - direction (0 = forward/1 = reverse) of packet     */
/*                                                                          */
/* Check if the ICMP packet defined by the header pointed to by icmp is a   */
/* reply to one as described by what's in ic.  If it is a match, return 1,  */
/* else return 0 for no match.                                              */
/* ------------------------------------------------------------------------ */
int fr_matchicmpqueryreply(v, ic, icmp, rev)
int v;
icmpinfo_t *ic;
icmphdr_t *icmp;
int rev;
{
    int ictype;

    ictype = ic->ici_type;

    if (v == 4) {
        /*
         * If we matched its type on the way in, then when going out
         * it will still be the same type.
         */
        if ((!rev && (icmp->icmp_type == ictype)) ||
            (rev && (icmpreplytype4[ictype] == icmp->icmp_type))) {
            if (icmp->icmp_type != ICMP_ECHOREPLY)
                return 1;
            if (icmp->icmp_id == ic->ici_id)
                return 1;
        }
    }
#ifdef  USE_INET6
    else if (v == 6) {
        if ((!rev && (icmp->icmp_type == ictype)) ||
            (rev && (icmpreplytype6[ictype] == icmp->icmp_type))) {
            if (icmp->icmp_type != ICMP6_ECHO_REPLY)
                return 1;
            if (icmp->icmp_id == ic->ici_id)
                return 1;
        }
    }
#endif
    return 0;
}


#ifdef  IPFILTER_LOOKUP
/* ------------------------------------------------------------------------ */
/* Function:    fr_resolvelookup                                            */
/* Returns:     void * - NULL = failure, else success.                      */
/* Parameters:  type(I)     - type of lookup these parameters are for.      */
/*              number(I)   - table number to use when searching            */
/*              funcptr(IO) - pointer to pointer for storing IP address     */
/*                searching function.               */
/*      ifs     - ipf stack instance                */
/*                                                                          */
/* Search for the "table" number passed in amongst those configured for     */
/* that particular type.  If the type is recognised then the function to    */
/* call to do the IP address search will be change, regardless of whether   */
/* or not the "table" number exists.                                        */
/* ------------------------------------------------------------------------ */
static void *fr_resolvelookup(type, number, funcptr, ifs)
u_int type, number;
lookupfunc_t *funcptr;
ipf_stack_t *ifs;
{
    char name[FR_GROUPLEN];
    iphtable_t *iph;
    ip_pool_t *ipo;
    void *ptr;

#if defined(SNPRINTF) && defined(_KERNEL)
    (void) SNPRINTF(name, sizeof(name), "%u", number);
#else
    (void) sprintf(name, "%u", number);
#endif

    READ_ENTER(&ifs->ifs_ip_poolrw);

    switch (type)
    {
    case IPLT_POOL :
# if (defined(__osf__) && defined(_KERNEL))
        ptr = NULL;
        *funcptr = NULL;
# else
        ipo = ip_pool_find(IPL_LOGIPF, name, ifs);
        ptr = ipo;
        if (ipo != NULL) {
            ATOMIC_INC32(ipo->ipo_ref);
        }
        *funcptr = ip_pool_search;
# endif
        break;
    case IPLT_HASH :
        iph = fr_findhtable(IPL_LOGIPF, name, ifs);
        ptr = iph;
        if (iph != NULL) {
            ATOMIC_INC32(iph->iph_ref);
        }
        *funcptr = fr_iphmfindip;
        break;
    default:
        ptr = NULL;
        *funcptr = NULL;
        break;
    }
    RWLOCK_EXIT(&ifs->ifs_ip_poolrw);

    return ptr;
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    frrequest                                                   */
/* Returns:     int - 0 == success, > 0 == errno value                      */
/* Parameters:  unit(I)     - device for which this is for                  */
/*              req(I)      - ioctl command (SIOC*)                         */
/*              data(I)     - pointr to ioctl data                          */
/*              set(I)      - 1 or 0 (filter set)                           */
/*              makecopy(I) - flag indicating whether data points to a rule */
/*                            in kernel space & hence doesn't need copying. */
/*                                                                          */
/* This function handles all the requests which operate on the list of      */
/* filter rules.  This includes adding, deleting, insertion.  It is also    */
/* responsible for creating groups when a "head" rule is loaded.  Interface */
/* names are resolved here and other sanity checks are made on the content  */
/* of the rule structure being loaded.  If a rule has user defined timeouts */
/* then make sure they are created and initialised before exiting.          */
/* ------------------------------------------------------------------------ */
int frrequest(unit, req, data, set, makecopy, ifs)
int unit;
ioctlcmd_t req;
int set, makecopy;
caddr_t data;
ipf_stack_t *ifs;
{
    frentry_t frd, *fp, *f, **fprev, **ftail;
    int error = 0, in, v;
    void *ptr, *uptr;
    u_int *p, *pp;
    frgroup_t *fg;
    char *group;

    fg = NULL;
    fp = &frd;
    if (makecopy != 0) {
        error = fr_inobj(data, fp, IPFOBJ_FRENTRY);
        if (error)
            return EFAULT;
        if ((fp->fr_flags & FR_T_BUILTIN) != 0)
            return EINVAL;
        fp->fr_ref = 0;
        fp->fr_flags |= FR_COPIED;
    } else {
        fp = (frentry_t *)data;
        if ((fp->fr_type & FR_T_BUILTIN) == 0)
            return EINVAL;
        fp->fr_flags &= ~FR_COPIED;
    }

    if (((fp->fr_dsize == 0) && (fp->fr_data != NULL)) ||
        ((fp->fr_dsize != 0) && (fp->fr_data == NULL)))
        return EINVAL;

    v = fp->fr_v;
    uptr = fp->fr_data;

    /*
     * Only filter rules for IPv4 or IPv6 are accepted.
     */
    if (v == 4)
        /*EMPTY*/;
#ifdef  USE_INET6
    else if (v == 6)
        /*EMPTY*/;
#endif
    else {
        return EINVAL;
    }

    /*
     * If the rule is being loaded from user space, i.e. we had to copy it
     * into kernel space, then do not trust the function pointer in the
     * rule.
     */
    if ((makecopy == 1) && (fp->fr_func != NULL)) {
        if (fr_findfunc(fp->fr_func) == NULL)
            return ESRCH;
        error = fr_funcinit(fp, ifs);
        if (error != 0)
            return error;
    }

    ptr = NULL;
    /*
     * Check that the group number does exist and that its use (in/out)
     * matches what the rule is.
     */
    if (!strncmp(fp->fr_grhead, "0", FR_GROUPLEN))
        *fp->fr_grhead = '\0';
    group = fp->fr_group;
    if (!strncmp(group, "0", FR_GROUPLEN))
        *group = '\0';

    if (FR_ISACCOUNT(fp->fr_flags))
        unit = IPL_LOGCOUNT;

    if ((req != (int)SIOCZRLST) && (*group != '\0')) {
        fg = fr_findgroup(group, unit, set, NULL, ifs);
        if (fg == NULL)
            return ESRCH;
        if (fg->fg_flags == 0)
            fg->fg_flags = fp->fr_flags & FR_INOUT;
        else if (fg->fg_flags != (fp->fr_flags & FR_INOUT))
            return ESRCH;
    }

    in = (fp->fr_flags & FR_INQUE) ? 0 : 1;

    /*
     * Work out which rule list this change is being applied to.
     */
    ftail = NULL;
    fprev = NULL;
    if (unit == IPL_LOGAUTH)
        fprev = &ifs->ifs_ipauth;
    else if (v == 4) {
        if (FR_ISACCOUNT(fp->fr_flags))
            fprev = &ifs->ifs_ipacct[in][set];
        else if ((fp->fr_flags & (FR_OUTQUE|FR_INQUE)) != 0)
            fprev = &ifs->ifs_ipfilter[in][set];
    } else if (v == 6) {
        if (FR_ISACCOUNT(fp->fr_flags))
            fprev = &ifs->ifs_ipacct6[in][set];
        else if ((fp->fr_flags & (FR_OUTQUE|FR_INQUE)) != 0)
            fprev = &ifs->ifs_ipfilter6[in][set];
    }
    if (fprev == NULL)
        return ESRCH;

    if (*group != '\0') {
        if (!fg && !(fg = fr_findgroup(group, unit, set, NULL, ifs)))
            return ESRCH;
        fprev = &fg->fg_start;
    }

    ftail = fprev;
    for (f = *ftail; (f = *ftail) != NULL; ftail = &f->fr_next) {
        if (fp->fr_collect <= f->fr_collect) {
            ftail = fprev;
            f = NULL;
            break;
        }
        fprev = ftail;
    }

    /*
     * Copy in extra data for the rule.
     */
    if (fp->fr_dsize != 0) {
        if (makecopy != 0) {
            KMALLOCS(ptr, void *, fp->fr_dsize);
            if (!ptr)
                return ENOMEM;
            error = COPYIN(uptr, ptr, fp->fr_dsize);
        } else {
            ptr = uptr;
            error = 0;
        }
        if (error != 0) {
            KFREES(ptr, fp->fr_dsize);
            return EFAULT;
        }
        fp->fr_data = ptr;
    } else
        fp->fr_data = NULL;

    /*
     * Perform per-rule type sanity checks of their members.
     */
    switch (fp->fr_type & ~FR_T_BUILTIN)
    {
#if defined(IPFILTER_BPF)
    case FR_T_BPFOPC :
        if (fp->fr_dsize == 0)
            return EINVAL;
        if (!bpf_validate(ptr, fp->fr_dsize/sizeof(struct bpf_insn))) {
            if (makecopy && fp->fr_data != NULL) {
                KFREES(fp->fr_data, fp->fr_dsize);
            }
            return EINVAL;
        }
        break;
#endif
    case FR_T_IPF :
        if (fp->fr_dsize != sizeof(fripf_t)) {
            if (makecopy && fp->fr_data != NULL) {
                KFREES(fp->fr_data, fp->fr_dsize);
            }
            return EINVAL;
        }

        /*
         * Allowing a rule with both "keep state" and "with oow" is
         * pointless because adding a state entry to the table will
         * fail with the out of window (oow) flag set.
         */
        if ((fp->fr_flags & FR_KEEPSTATE) && (fp->fr_flx & FI_OOW)) {
            if (makecopy && fp->fr_data != NULL) {
                KFREES(fp->fr_data, fp->fr_dsize);
            }
            return EINVAL;
        }

        switch (fp->fr_satype)
        {
        case FRI_BROADCAST :
        case FRI_DYNAMIC :
        case FRI_NETWORK :
        case FRI_NETMASKED :
        case FRI_PEERADDR :
            if (fp->fr_sifpidx < 0 || fp->fr_sifpidx > 3) {
                if (makecopy && fp->fr_data != NULL) {
                    KFREES(fp->fr_data, fp->fr_dsize);
                }
                return EINVAL;
            }
            break;
#ifdef  IPFILTER_LOOKUP
        case FRI_LOOKUP :
            fp->fr_srcptr = fr_resolvelookup(fp->fr_srctype,
                             fp->fr_srcnum,
                             &fp->fr_srcfunc, ifs);
            break;
#endif
        default :
            break;
        }

        switch (fp->fr_datype)
        {
        case FRI_BROADCAST :
        case FRI_DYNAMIC :
        case FRI_NETWORK :
        case FRI_NETMASKED :
        case FRI_PEERADDR :
            if (fp->fr_difpidx < 0 || fp->fr_difpidx > 3) {
                if (makecopy && fp->fr_data != NULL) {
                    KFREES(fp->fr_data, fp->fr_dsize);
                }
                return EINVAL;
            }
            break;
#ifdef  IPFILTER_LOOKUP
        case FRI_LOOKUP :
            fp->fr_dstptr = fr_resolvelookup(fp->fr_dsttype,
                             fp->fr_dstnum,
                             &fp->fr_dstfunc, ifs);
            break;
#endif
        default :
            break;
        }
        break;
    case FR_T_NONE :
        break;
    case FR_T_CALLFUNC :
        break;
    case FR_T_COMPIPF :
        break;
    default :
        if (makecopy && fp->fr_data != NULL) {
            KFREES(fp->fr_data, fp->fr_dsize);
        }
        return EINVAL;
    }

    /*
     * Lookup all the interface names that are part of the rule.
     */
    frsynclist(0, 0, NULL, NULL, fp, ifs);
    fp->fr_statecnt = 0;

    /*
     * Look for an existing matching filter rule, but don't include the
     * next or interface pointer in the comparison (fr_next, fr_ifa).
     * This elminates rules which are indentical being loaded.  Checksum
     * the constant part of the filter rule to make comparisons quicker
     * (this meaning no pointers are included).
     */
    for (fp->fr_cksum = 0, p = (u_int *)&fp->fr_func, pp = &fp->fr_cksum;
         p < pp; p++)
        fp->fr_cksum += *p;
    pp = (u_int *)(fp->fr_caddr + fp->fr_dsize);
    for (p = (u_int *)fp->fr_data; p < pp; p++)
        fp->fr_cksum += *p;

    WRITE_ENTER(&ifs->ifs_ipf_mutex);
    bzero((char *)ifs->ifs_frcache, sizeof (ifs->ifs_frcache));

    for (; (f = *ftail) != NULL; ftail = &f->fr_next) {
        if ((fp->fr_cksum != f->fr_cksum) ||
            (f->fr_dsize != fp->fr_dsize))
            continue;
        if (bcmp((char *)&f->fr_func, (char *)&fp->fr_func, FR_CMPSIZ))
            continue;
        if ((!ptr && !f->fr_data) ||
            (ptr && f->fr_data &&
             !bcmp((char *)ptr, (char *)f->fr_data, f->fr_dsize)))
            break;
    }

    /*
     * If zero'ing statistics, copy current to caller and zero.
     */
    if (req == (ioctlcmd_t)SIOCZRLST) {
        if (f == NULL)
            error = ESRCH;
        else {
            /*
             * Copy and reduce lock because of impending copyout.
             * Well we should, but if we do then the atomicity of
             * this call and the correctness of fr_hits and
             * fr_bytes cannot be guaranteed.  As it is, this code
             * only resets them to 0 if they are successfully
             * copied out into user space.
             */
            bcopy((char *)f, (char *)fp, sizeof(*f));

            /*
             * When we copy this rule back out, set the data
             * pointer to be what it was in user space.
             */
            fp->fr_data = uptr;
            error = fr_outobj(data, fp, IPFOBJ_FRENTRY);

            if (error == 0) {
                if ((f->fr_dsize != 0) && (uptr != NULL))
                    error = COPYOUT(f->fr_data, uptr,
                            f->fr_dsize);
                if (error == 0) {
                    f->fr_hits = 0;
                    f->fr_bytes = 0;
                }
            }
        }

        if ((ptr != NULL) && (makecopy != 0)) {
            KFREES(ptr, fp->fr_dsize);
        }
        RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
        return error;
    }

    if (!f) {
        /*
         * At the end of this, ftail must point to the place where the
         * new rule is to be saved/inserted/added.
         * For SIOCAD*FR, this should be the last rule in the group of
         * rules that have equal fr_collect fields.
         * For SIOCIN*FR, ...
         */
        if (req == (ioctlcmd_t)SIOCADAFR ||
            req == (ioctlcmd_t)SIOCADIFR) {

            for (ftail = fprev; (f = *ftail) != NULL; ) {
                if (f->fr_collect > fp->fr_collect)
                    break;
                ftail = &f->fr_next;
            }
            f = NULL;
            ptr = NULL;
            error = 0;
        } else if (req == (ioctlcmd_t)SIOCINAFR ||
               req == (ioctlcmd_t)SIOCINIFR) {
            while ((f = *fprev) != NULL) {
                if (f->fr_collect >= fp->fr_collect)
                    break;
                fprev = &f->fr_next;
            }
            ftail = fprev;
            if (fp->fr_hits != 0) {
                while (fp->fr_hits && (f = *ftail)) {
                    if (f->fr_collect != fp->fr_collect)
                        break;
                    fprev = ftail;
                    ftail = &f->fr_next;
                    fp->fr_hits--;
                }
            }
            f = NULL;
            ptr = NULL;
            error = 0;
        }
    }

    /*
     * Request to remove a rule.
     */
    if (req == (ioctlcmd_t)SIOCRMAFR || req == (ioctlcmd_t)SIOCRMIFR) {
        if (!f)
            error = ESRCH;
        else {
            /*
             * Do not allow activity from user space to interfere
             * with rules not loaded that way.
             */
            if ((makecopy == 1) && !(f->fr_flags & FR_COPIED)) {
                error = EPERM;
                goto done;
            }

            /*
             * Return EBUSY if the rule is being reference by
             * something else (eg state information.
             */
            if (f->fr_ref > 1) {
                error = EBUSY;
                goto done;
            }
#ifdef  IPFILTER_SCAN
            if (f->fr_isctag[0] != '\0' &&
                (f->fr_isc != (struct ipscan *)-1))
                ipsc_detachfr(f);
#endif
            if (unit == IPL_LOGAUTH) {
                error = fr_preauthcmd(req, f, ftail, ifs);
                goto done;
            }
            if (*f->fr_grhead != '\0')
                fr_delgroup(f->fr_grhead, unit, set, ifs);
            fr_fixskip(ftail, f, -1);
            *ftail = f->fr_next;
            f->fr_next = NULL;
            (void)fr_derefrule(&f, ifs);
        }
    } else {
        /*
         * Not removing, so we must be adding/inserting a rule.
         */
        if (f)
            error = EEXIST;
        else {
            if (unit == IPL_LOGAUTH) {
                error = fr_preauthcmd(req, fp, ftail, ifs);
                goto done;
            }
            if (makecopy) {
                KMALLOC(f, frentry_t *);
            } else
                f = fp;
            if (f != NULL) {
                if (fp != f)
                    bcopy((char *)fp, (char *)f,
                          sizeof(*f));
                MUTEX_NUKE(&f->fr_lock);
                MUTEX_INIT(&f->fr_lock, "filter rule lock");
#ifdef  IPFILTER_SCAN
                if (f->fr_isctag[0] != '\0' &&
                    ipsc_attachfr(f))
                    f->fr_isc = (struct ipscan *)-1;
#endif
                f->fr_hits = 0;
                if (makecopy != 0)
                    f->fr_ref = 1;
                f->fr_next = *ftail;
                *ftail = f;
                if (req == (ioctlcmd_t)SIOCINIFR ||
                    req == (ioctlcmd_t)SIOCINAFR)
                    fr_fixskip(ftail, f, 1);
                f->fr_grp = NULL;
                group = f->fr_grhead;
                if (*group != '\0') {
                    fg = fr_addgroup(group, f, f->fr_flags,
                             unit, set, ifs);
                    if (fg != NULL)
                        f->fr_grp = &fg->fg_start;
                }
            } else
                error = ENOMEM;
        }
    }
done:
    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);
    if ((ptr != NULL) && (error != 0) && (makecopy != 0)) {
        KFREES(ptr, fp->fr_dsize);
    }
    return (error);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_funcinit                                                 */
/* Returns:     int - 0 == success, else ESRCH: cannot resolve rule details */
/* Parameters:  fr(I) - pointer to filter rule                              */
/*                                                                          */
/* If a rule is a call rule, then check if the function it points to needs  */
/* an init function to be called now the rule has been loaded.              */
/* ------------------------------------------------------------------------ */
static int fr_funcinit(fr, ifs)
frentry_t *fr;
ipf_stack_t *ifs;
{
    ipfunc_resolve_t *ft;
    int err;

    err = ESRCH;

    for (ft = fr_availfuncs; ft->ipfu_addr != NULL; ft++)
        if (ft->ipfu_addr == fr->fr_func) {
            err = 0;
            if (ft->ipfu_init != NULL)
                err = (*ft->ipfu_init)(fr, ifs);
            break;
        }
    return err;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_findfunc                                                 */
/* Returns:     ipfunc_t - pointer to function if found, else NULL          */
/* Parameters:  funcptr(I) - function pointer to lookup                     */
/*                                                                          */
/* Look for a function in the table of known functions.                     */
/* ------------------------------------------------------------------------ */
static ipfunc_t fr_findfunc(funcptr)
ipfunc_t funcptr;
{
    ipfunc_resolve_t *ft;

    for (ft = fr_availfuncs; ft->ipfu_addr != NULL; ft++)
        if (ft->ipfu_addr == funcptr)
            return funcptr;
    return NULL;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_resolvefunc                                              */
/* Returns:     int - 0 == success, else error                              */
/* Parameters:  data(IO) - ioctl data pointer to ipfunc_resolve_t struct    */
/*                                                                          */
/* Copy in a ipfunc_resolve_t structure and then fill in the missing field. */
/* This will either be the function name (if the pointer is set) or the     */
/* function pointer if the name is set.  When found, fill in the other one  */
/* so that the entire, complete, structure can be copied back to user space.*/
/* ------------------------------------------------------------------------ */
int fr_resolvefunc(data)
void *data;
{
    ipfunc_resolve_t res, *ft;
    int err;

    err = BCOPYIN(data, &res, sizeof(res));
    if (err != 0)
        return EFAULT;

    if (res.ipfu_addr == NULL && res.ipfu_name[0] != '\0') {
        for (ft = fr_availfuncs; ft->ipfu_addr != NULL; ft++)
            if (strncmp(res.ipfu_name, ft->ipfu_name,
                    sizeof(res.ipfu_name)) == 0) {
                res.ipfu_addr = ft->ipfu_addr;
                res.ipfu_init = ft->ipfu_init;
                if (COPYOUT(&res, data, sizeof(res)) != 0)
                    return EFAULT;
                return 0;
            }
    }
    if (res.ipfu_addr != NULL && res.ipfu_name[0] == '\0') {
        for (ft = fr_availfuncs; ft->ipfu_addr != NULL; ft++)
            if (ft->ipfu_addr == res.ipfu_addr) {
                (void) strncpy(res.ipfu_name, ft->ipfu_name,
                           sizeof(res.ipfu_name));
                res.ipfu_init = ft->ipfu_init;
                if (COPYOUT(&res, data, sizeof(res)) != 0)
                    return EFAULT;
                return 0;
            }
    }
    return ESRCH;
}


#if !defined(_KERNEL) || (!defined(__NetBSD__) && !defined(__OpenBSD__) && !defined(__FreeBSD__)) || \
    (defined(__FreeBSD__) && (__FreeBSD_version < 490000)) || \
    (defined(__NetBSD__) && (__NetBSD_Version__ < 105000000)) || \
    (defined(__OpenBSD__) && (OpenBSD < 200006))
/*
 * From: NetBSD
 * ppsratecheck(): packets (or events) per second limitation.
 */
int
ppsratecheck(lasttime, curpps, maxpps)
    struct timeval *lasttime;
    int *curpps;
    int maxpps; /* maximum pps allowed */
{
    struct timeval tv, delta;
    int rv;

    GETKTIME(&tv);

    delta.tv_sec = tv.tv_sec - lasttime->tv_sec;
    delta.tv_usec = tv.tv_usec - lasttime->tv_usec;
    if (delta.tv_usec < 0) {
        delta.tv_sec--;
        delta.tv_usec += 1000000;
    }

    /*
     * check for 0,0 is so that the message will be seen at least once.
     * if more than one second have passed since the last update of
     * lasttime, reset the counter.
     *
     * we do increment *curpps even in *curpps < maxpps case, as some may
     * try to use *curpps for stat purposes as well.
     */
    if ((lasttime->tv_sec == 0 && lasttime->tv_usec == 0) ||
        delta.tv_sec >= 1) {
        *lasttime = tv;
        *curpps = 0;
        rv = 1;
    } else if (maxpps < 0)
        rv = 1;
    else if (*curpps < maxpps)
        rv = 1;
    else
        rv = 0;
    *curpps = *curpps + 1;

    return (rv);
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    fr_derefrule                                                */
/* Returns:     int   - 0 == rule freed up, else rule not freed             */
/* Parameters:  fr(I) - pointer to filter rule                              */
/*                                                                          */
/* Decrement the reference counter to a rule by one.  If it reaches zero,   */
/* free it and any associated storage space being used by it.               */
/* ------------------------------------------------------------------------ */
int fr_derefrule(frp, ifs)
frentry_t **frp;
ipf_stack_t *ifs;
{
    frentry_t *fr;

    fr = *frp;

    MUTEX_ENTER(&fr->fr_lock);
    fr->fr_ref--;
    if (fr->fr_ref == 0) {
        MUTEX_EXIT(&fr->fr_lock);
        MUTEX_DESTROY(&fr->fr_lock);

#ifdef IPFILTER_LOOKUP
        if (fr->fr_type == FR_T_IPF && fr->fr_satype == FRI_LOOKUP)
            ip_lookup_deref(fr->fr_srctype, fr->fr_srcptr, ifs);
        if (fr->fr_type == FR_T_IPF && fr->fr_datype == FRI_LOOKUP)
            ip_lookup_deref(fr->fr_dsttype, fr->fr_dstptr, ifs);
#endif

        if (fr->fr_dsize) {
            KFREES(fr->fr_data, fr->fr_dsize);
        }
        if ((fr->fr_flags & FR_COPIED) != 0) {
            KFREE(fr);
            return 0;
        }
        return 1;
    } else {
        MUTEX_EXIT(&fr->fr_lock);
    }
    *frp = NULL;
    return -1;
}


#ifdef  IPFILTER_LOOKUP
/* ------------------------------------------------------------------------ */
/* Function:    fr_grpmapinit                                               */
/* Returns:     int - 0 == success, else ESRCH because table entry not found*/
/* Parameters:  fr(I) - pointer to rule to find hash table for              */
/*                                                                          */
/* Looks for group hash table fr_arg and stores a pointer to it in fr_ptr.  */
/* fr_ptr is later used by fr_srcgrpmap and fr_dstgrpmap.                   */
/* ------------------------------------------------------------------------ */
static int fr_grpmapinit(fr, ifs)
frentry_t *fr;
ipf_stack_t *ifs;
{
    char name[FR_GROUPLEN];
    iphtable_t *iph;

#if defined(SNPRINTF) && defined(_KERNEL)
    (void) SNPRINTF(name, sizeof(name), "%d", fr->fr_arg);
#else
    (void) sprintf(name, "%d", fr->fr_arg);
#endif
    iph = fr_findhtable(IPL_LOGIPF, name, ifs);
    if (iph == NULL)
        return ESRCH;
    if ((iph->iph_flags & FR_INOUT) != (fr->fr_flags & FR_INOUT))
        return ESRCH;
    fr->fr_ptr = iph;
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_srcgrpmap                                                */
/* Returns:     frentry_t * - pointer to "new last matching" rule or NULL   */
/* Parameters:  fin(I)    - pointer to packet information                   */
/*              passp(IO) - pointer to current/new filter decision (unused) */
/*                                                                          */
/* Look for a rule group head in a hash table, using the source address as  */
/* the key, and descend into that group and continue matching rules against */
/* the packet.                                                              */
/* ------------------------------------------------------------------------ */
frentry_t *fr_srcgrpmap(fin, passp)
fr_info_t *fin;
u_32_t *passp;
{
    frgroup_t *fg;
    void *rval;
    ipf_stack_t *ifs = fin->fin_ifs;

    rval = fr_iphmfindgroup(fin->fin_fr->fr_ptr, fin->fin_v, &fin->fin_src, ifs);
    if (rval == NULL)
        return NULL;

    fg = rval;
    fin->fin_fr = fg->fg_start;
    (void) fr_scanlist(fin, *passp);
    return fin->fin_fr;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_dstgrpmap                                                */
/* Returns:     frentry_t * - pointer to "new last matching" rule or NULL   */
/* Parameters:  fin(I)    - pointer to packet information                   */
/*              passp(IO) - pointer to current/new filter decision (unused) */
/*                                                                          */
/* Look for a rule group head in a hash table, using the destination        */
/* address as the key, and descend into that group and continue matching    */
/* rules against  the packet.                                               */
/* ------------------------------------------------------------------------ */
frentry_t *fr_dstgrpmap(fin, passp)
fr_info_t *fin;
u_32_t *passp;
{
    frgroup_t *fg;
    void *rval;
    ipf_stack_t *ifs = fin->fin_ifs;

    rval = fr_iphmfindgroup(fin->fin_fr->fr_ptr, fin->fin_v, &fin->fin_dst, ifs);
    if (rval == NULL)
        return NULL;

    fg = rval;
    fin->fin_fr = fg->fg_start;
    (void) fr_scanlist(fin, *passp);
    return fin->fin_fr;
}
#endif /* IPFILTER_LOOKUP */

/*
 * Queue functions
 * ===============
 * These functions manage objects on queues for efficient timeouts.  There are
 * a number of system defined queues as well as user defined timeouts.  It is
 * expected that a lock is held in the domain in which the queue belongs
 * (i.e. either state or NAT) when calling any of these functions that prevents
 * fr_freetimeoutqueue() from being called at the same time as any other.
 */


/* ------------------------------------------------------------------------ */
/* Function:    fr_addtimeoutqueue                                          */
/* Returns:     struct ifqtq * - NULL if malloc fails, else pointer to      */
/*                               timeout queue with given interval.         */
/* Parameters:  parent(I)  - pointer to pointer to parent node of this list */
/*                           of interface queues.                           */
/*              seconds(I) - timeout value in seconds for this queue.       */
/*                                                                          */
/* This routine first looks for a timeout queue that matches the interval   */
/* being requested.  If it finds one, increments the reference counter and  */
/* returns a pointer to it.  If none are found, it allocates a new one and  */
/* inserts it at the top of the list.                                       */
/*                                                                          */
/* Locking.                                                                 */
/* It is assumed that the caller of this function has an appropriate lock   */
/* held (exclusively) in the domain that encompases 'parent'.               */
/* ------------------------------------------------------------------------ */
ipftq_t *fr_addtimeoutqueue(parent, seconds, ifs)
ipftq_t **parent;
u_int seconds;
ipf_stack_t *ifs;
{
    ipftq_t *ifq;
    u_int period;

    period = seconds * IPF_HZ_DIVIDE;

    MUTEX_ENTER(&ifs->ifs_ipf_timeoutlock);
    for (ifq = *parent; ifq != NULL; ifq = ifq->ifq_next) {
        if (ifq->ifq_ttl == period) {
            /*
             * Reset the delete flag, if set, so the structure
             * gets reused rather than freed and reallocated.
             */
            MUTEX_ENTER(&ifq->ifq_lock);
            ifq->ifq_flags &= ~IFQF_DELETE;
            ifq->ifq_ref++;
            MUTEX_EXIT(&ifq->ifq_lock);
            MUTEX_EXIT(&ifs->ifs_ipf_timeoutlock);

            return ifq;
        }
    }

    KMALLOC(ifq, ipftq_t *);
    if (ifq != NULL) {
        ifq->ifq_ttl = period;
        ifq->ifq_head = NULL;
        ifq->ifq_tail = &ifq->ifq_head;
        ifq->ifq_next = *parent;
        ifq->ifq_pnext = parent;
        ifq->ifq_ref = 1;
        ifq->ifq_flags = IFQF_USER;
        *parent = ifq;
        ifs->ifs_fr_userifqs++;
        MUTEX_NUKE(&ifq->ifq_lock);
        MUTEX_INIT(&ifq->ifq_lock, "ipftq mutex");
    }
    MUTEX_EXIT(&ifs->ifs_ipf_timeoutlock);
    return ifq;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_deletetimeoutqueue                                       */
/* Returns:     int    - new reference count value of the timeout queue     */
/* Parameters:  ifq(I) - timeout queue which is losing a reference.         */
/* Locks:       ifq->ifq_lock                                               */
/*                                                                          */
/* This routine must be called when we're discarding a pointer to a timeout */
/* queue object, taking care of the reference counter.                      */
/*                                                                          */
/* Now that this just sets a DELETE flag, it requires the expire code to    */
/* check the list of user defined timeout queues and call the free function */
/* below (currently commented out) to stop memory leaking.  It is done this */
/* way because the locking may not be sufficient to safely do a free when   */
/* this function is called.                                                 */
/* ------------------------------------------------------------------------ */
int fr_deletetimeoutqueue(ifq)
ipftq_t *ifq;
{

    ifq->ifq_ref--;
    if ((ifq->ifq_ref == 0) && ((ifq->ifq_flags & IFQF_USER) != 0)) {
        ifq->ifq_flags |= IFQF_DELETE;
    }

    return ifq->ifq_ref;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_freetimeoutqueue                                         */
/* Parameters:  ifq(I) - timeout queue which is losing a reference.         */
/* Returns:     Nil                                                         */
/*                                                                          */
/* Locking:                                                                 */
/* It is assumed that the caller of this function has an appropriate lock   */
/* held (exclusively) in the domain that encompases the callers "domain".   */
/* The ifq_lock for this structure should not be held.                      */
/*                                                                          */
/* Remove a user definde timeout queue from the list of queues it is in and */
/* tidy up after this is done.                                              */
/* ------------------------------------------------------------------------ */
void fr_freetimeoutqueue(ifq, ifs)
ipftq_t *ifq;
ipf_stack_t *ifs;
{


    if (((ifq->ifq_flags & IFQF_DELETE) == 0) || (ifq->ifq_ref != 0) ||
        ((ifq->ifq_flags & IFQF_USER) == 0)) {
        printf("fr_freetimeoutqueue(%lx) flags 0x%x ttl %d ref %d\n",
               (u_long)ifq, ifq->ifq_flags, ifq->ifq_ttl,
               ifq->ifq_ref);
        return;
    }

    /*
     * Remove from its position in the list.
     */
    *ifq->ifq_pnext = ifq->ifq_next;
    if (ifq->ifq_next != NULL)
        ifq->ifq_next->ifq_pnext = ifq->ifq_pnext;

    MUTEX_DESTROY(&ifq->ifq_lock);
    ifs->ifs_fr_userifqs--;
    KFREE(ifq);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_deletequeueentry                                         */
/* Returns:     Nil                                                         */
/* Parameters:  tqe(I) - timeout queue entry to delete                      */
/*              ifq(I) - timeout queue to remove entry from                 */
/*                                                                          */
/* Remove a tail queue entry from its queue and make it an orphan.          */
/* fr_deletetimeoutqueue is called to make sure the reference count on the  */
/* queue is correct.  We can't, however, call fr_freetimeoutqueue because   */
/* the correct lock(s) may not be held that would make it safe to do so.    */
/* ------------------------------------------------------------------------ */
void fr_deletequeueentry(tqe)
ipftqent_t *tqe;
{
    ipftq_t *ifq;

    ifq = tqe->tqe_ifq;
    if (ifq == NULL)
        return;

    MUTEX_ENTER(&ifq->ifq_lock);

    if (tqe->tqe_pnext != NULL) {
        *tqe->tqe_pnext = tqe->tqe_next;
        if (tqe->tqe_next != NULL)
            tqe->tqe_next->tqe_pnext = tqe->tqe_pnext;
        else    /* we must be the tail anyway */
            ifq->ifq_tail = tqe->tqe_pnext;

        tqe->tqe_pnext = NULL;
        tqe->tqe_ifq = NULL;
    }

    (void) fr_deletetimeoutqueue(ifq);

    MUTEX_EXIT(&ifq->ifq_lock);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_queuefront                                               */
/* Returns:     Nil                                                         */
/* Parameters:  tqe(I) - pointer to timeout queue entry                     */
/*                                                                          */
/* Move a queue entry to the front of the queue, if it isn't already there. */
/* ------------------------------------------------------------------------ */
void fr_queuefront(tqe)
ipftqent_t *tqe;
{
    ipftq_t *ifq;

    ifq = tqe->tqe_ifq;
    if (ifq == NULL)
        return;

    MUTEX_ENTER(&ifq->ifq_lock);
    if (ifq->ifq_head != tqe) {
        *tqe->tqe_pnext = tqe->tqe_next;
        if (tqe->tqe_next)
            tqe->tqe_next->tqe_pnext = tqe->tqe_pnext;
        else
            ifq->ifq_tail = tqe->tqe_pnext;

        tqe->tqe_next = ifq->ifq_head;
        ifq->ifq_head->tqe_pnext = &tqe->tqe_next;
        ifq->ifq_head = tqe;
        tqe->tqe_pnext = &ifq->ifq_head;
    }
    MUTEX_EXIT(&ifq->ifq_lock);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_queueback                                                */
/* Returns:     Nil                                                         */
/* Parameters:  tqe(I) - pointer to timeout queue entry                     */
/*                                                                          */
/* Move a queue entry to the back of the queue, if it isn't already there.  */
/* ------------------------------------------------------------------------ */
void fr_queueback(tqe, ifs)
ipftqent_t *tqe;
ipf_stack_t *ifs;
{
    ipftq_t *ifq;

    ifq = tqe->tqe_ifq;
    if (ifq == NULL)
        return;
    tqe->tqe_die = ifs->ifs_fr_ticks + ifq->ifq_ttl;

    MUTEX_ENTER(&ifq->ifq_lock);
    if (tqe->tqe_next == NULL) {        /* at the end already ? */
        MUTEX_EXIT(&ifq->ifq_lock);
        return;
    }

    /*
     * Remove from list
     */
    *tqe->tqe_pnext = tqe->tqe_next;
    tqe->tqe_next->tqe_pnext = tqe->tqe_pnext;

    /*
     * Make it the last entry.
     */
    tqe->tqe_next = NULL;
    tqe->tqe_pnext = ifq->ifq_tail;
    *ifq->ifq_tail = tqe;
    ifq->ifq_tail = &tqe->tqe_next;
    MUTEX_EXIT(&ifq->ifq_lock);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_queueappend                                              */
/* Returns:     Nil                                                         */
/* Parameters:  tqe(I)    - pointer to timeout queue entry                  */
/*              ifq(I)    - pointer to timeout queue                        */
/*              parent(I) - owing object pointer                            */
/*                                                                          */
/* Add a new item to this queue and put it on the very end.                 */
/* ------------------------------------------------------------------------ */
void fr_queueappend(tqe, ifq, parent, ifs)
ipftqent_t *tqe;
ipftq_t *ifq;
void *parent;
ipf_stack_t *ifs;
{

    MUTEX_ENTER(&ifq->ifq_lock);
    tqe->tqe_parent = parent;
    tqe->tqe_pnext = ifq->ifq_tail;
    *ifq->ifq_tail = tqe;
    ifq->ifq_tail = &tqe->tqe_next;
    tqe->tqe_next = NULL;
    tqe->tqe_ifq = ifq;
    tqe->tqe_die = ifs->ifs_fr_ticks + ifq->ifq_ttl;
    ifq->ifq_ref++;
    MUTEX_EXIT(&ifq->ifq_lock);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_movequeue                                                */
/* Returns:     Nil                                                         */
/* Parameters:  tq(I)   - pointer to timeout queue information              */
/*              oifp(I) - old timeout queue entry was on                    */
/*              nifp(I) - new timeout queue to put entry on                 */
/*      ifs - ipf stack instance                    */
/*                                                                          */
/* Move a queue entry from one timeout queue to another timeout queue.      */
/* If it notices that the current entry is already last and does not need   */
/* to move queue, the return.                                               */
/* ------------------------------------------------------------------------ */
void fr_movequeue(tqe, oifq, nifq, ifs)
ipftqent_t *tqe;
ipftq_t *oifq, *nifq;
ipf_stack_t *ifs;
{
    /*
     * If the queue isn't changing, and the clock hasn't ticked
     * since the last update, the operation will be a no-op.
     */
    if (oifq == nifq && tqe->tqe_touched == ifs->ifs_fr_ticks)
        return;

    /*
     * Grab the lock and update the timers.
     */
    MUTEX_ENTER(&oifq->ifq_lock);
    tqe->tqe_touched = ifs->ifs_fr_ticks;
    tqe->tqe_die = ifs->ifs_fr_ticks + nifq->ifq_ttl;

    /*
     * The remainder of the operation can still be a no-op.
     *
     * If the queue isn't changing, check to see if
     * an update would be meaningless.
     */
    if (oifq == nifq) {
        if ((tqe->tqe_next == NULL) ||
            (tqe->tqe_next->tqe_die == tqe->tqe_die)) {
            MUTEX_EXIT(&oifq->ifq_lock);
            return;
        }
    }

    /*
     * Remove from the old queue
     */
    *tqe->tqe_pnext = tqe->tqe_next;
    if (tqe->tqe_next)
        tqe->tqe_next->tqe_pnext = tqe->tqe_pnext;
    else
        oifq->ifq_tail = tqe->tqe_pnext;
    tqe->tqe_next = NULL;

    /*
     * If we're moving from one queue to another, release the lock on the
     * old queue and get a lock on the new queue.  For user defined queues,
     * if we're moving off it, call delete in case it can now be freed.
     */
    if (oifq != nifq) {
        tqe->tqe_ifq = NULL;

        (void) fr_deletetimeoutqueue(oifq);

        MUTEX_EXIT(&oifq->ifq_lock);

        MUTEX_ENTER(&nifq->ifq_lock);

        tqe->tqe_ifq = nifq;
        nifq->ifq_ref++;
    }

    /*
     * Add to the bottom of the new queue
     */
    tqe->tqe_pnext = nifq->ifq_tail;
    *nifq->ifq_tail = tqe;
    nifq->ifq_tail = &tqe->tqe_next;
    MUTEX_EXIT(&nifq->ifq_lock);
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_updateipid                                               */
/* Returns:     int - 0 == success, -1 == error (packet should be droppped) */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* When we are doing NAT, change the IP of every packet to represent a      */
/* single sequence of packets coming from the host, hiding any host         */
/* specific sequencing that might otherwise be revealed.  If the packet is  */
/* a fragment, then store the 'new' IPid in the fragment cache and look up  */
/* the fragment cache for non-leading fragments.  If a non-leading fragment */
/* has no match in the cache, return an error.                              */
/* ------------------------------------------------------------------------ */
static INLINE int fr_updateipid(fin)
fr_info_t *fin;
{
    u_short id, ido, sums;
    u_32_t sumd, sum;
    ip_t *ip;

    if (fin->fin_off != 0) {
        sum = fr_ipid_knownfrag(fin);
        if (sum == 0xffffffff)
            return -1;
        sum &= 0xffff;
        id = (u_short)sum;
    } else {
        id = fr_nextipid(fin);
        if (fin->fin_off == 0 && (fin->fin_flx & FI_FRAG) != 0)
            (void) fr_ipid_newfrag(fin, (u_32_t)id);
    }

    ip = fin->fin_ip;
    ido = ntohs(ip->ip_id);
    if (id == ido)
        return 0;
    ip->ip_id = htons(id);
    CALC_SUMD(ido, id, sumd);   /* DESTRUCTIVE MACRO! id,ido change */
    sum = (~ntohs(ip->ip_sum)) & 0xffff;
    sum += sumd;
    sum = (sum >> 16) + (sum & 0xffff);
    sum = (sum >> 16) + (sum & 0xffff);
    sums = ~(u_short)sum;
    ip->ip_sum = htons(sums);
    return 0;
}


#ifdef  NEED_FRGETIFNAME
/* ------------------------------------------------------------------------ */
/* Function:    fr_getifname                                                */
/* Returns:     char *    - pointer to interface name                       */
/* Parameters:  ifp(I)    - pointer to network interface                    */
/*              buffer(O) - pointer to where to store interface name        */
/*                                                                          */
/* Constructs an interface name in the buffer passed.  The buffer passed is */
/* expected to be at least LIFNAMSIZ in bytes big.  If buffer is passed in  */
/* as a NULL pointer then return a pointer to a static array.               */
/* ------------------------------------------------------------------------ */
char *fr_getifname(ifp, buffer)
struct ifnet *ifp;
char *buffer;
{
    static char namebuf[LIFNAMSIZ];
# if defined(MENTAT) || defined(__FreeBSD__) || defined(__osf__) || \
     defined(__sgi) || defined(linux) || defined(_AIX51) || \
     (defined(sun) && !defined(__SVR4) && !defined(__svr4__))
    int unit, space;
    char temp[20];
    char *s;
# endif

    ASSERT(buffer != NULL);
#ifdef notdef
    if (buffer == NULL)
        buffer = namebuf;
#endif
    (void) strncpy(buffer, ifp->if_name, LIFNAMSIZ);
    buffer[LIFNAMSIZ - 1] = '\0';
# if defined(MENTAT) || defined(__FreeBSD__) || defined(__osf__) || \
     defined(__sgi) || defined(_AIX51) || \
     (defined(sun) && !defined(__SVR4) && !defined(__svr4__))
    for (s = buffer; *s; s++)
        ;
    unit = ifp->if_unit;
    space = LIFNAMSIZ - (s - buffer);
    if (space > 0) {
#  if defined(SNPRINTF) && defined(_KERNEL)
        (void) SNPRINTF(temp, sizeof(temp), "%d", unit);
#  else
        (void) sprintf(temp, "%d", unit);
#  endif
        (void) strncpy(s, temp, space);
    }
# endif
    return buffer;
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    fr_ioctlswitch                                              */
/* Returns:     int     - -1 continue processing, else ioctl return value   */
/* Parameters:  unit(I) - device unit opened                                */
/*              data(I) - pointer to ioctl data                             */
/*              cmd(I)  - ioctl command                                     */
/*              mode(I) - mode value                                        */
/*                                                                          */
/* Based on the value of unit, call the appropriate ioctl handler or return */
/* EIO if ipfilter is not running.   Also checks if write perms are req'd   */
/* for the device in order to execute the ioctl.                            */
/* ------------------------------------------------------------------------ */
INLINE int fr_ioctlswitch(unit, data, cmd, mode, uid, ctx, ifs)
int unit, mode, uid;
ioctlcmd_t cmd;
void *data, *ctx;
ipf_stack_t *ifs;
{
    int error = 0;

    switch (unit)
    {
    case IPL_LOGIPF :
        error = -1;
        break;
    case IPL_LOGNAT :
        if (ifs->ifs_fr_running > 0)
            error = fr_nat_ioctl(data, cmd, mode, uid, ctx, ifs);
        else
            error = EIO;
        break;
    case IPL_LOGSTATE :
        if (ifs->ifs_fr_running > 0)
            error = fr_state_ioctl(data, cmd, mode, uid, ctx, ifs);
        else
            error = EIO;
        break;
    case IPL_LOGAUTH :
        if (ifs->ifs_fr_running > 0) {
            if ((cmd == (ioctlcmd_t)SIOCADAFR) ||
                (cmd == (ioctlcmd_t)SIOCRMAFR)) {
                if (!(mode & FWRITE)) {
                    error = EPERM;
                } else {
                    error = frrequest(unit, cmd, data,
                          ifs->ifs_fr_active, 1, ifs);
                }
            } else {
                error = fr_auth_ioctl(data, cmd, mode, uid, ctx, ifs);
            }
        } else
            error = EIO;
        break;
    case IPL_LOGSYNC :
#ifdef IPFILTER_SYNC
        if (ifs->ifs_fr_running > 0)
            error = fr_sync_ioctl(data, cmd, mode, ifs);
        else
#endif
            error = EIO;
        break;
    case IPL_LOGSCAN :
#ifdef IPFILTER_SCAN
        if (ifs->ifs_fr_running > 0)
            error = fr_scan_ioctl(data, cmd, mode, ifs);
        else
#endif
            error = EIO;
        break;
    case IPL_LOGLOOKUP :
#ifdef IPFILTER_LOOKUP
        if (ifs->ifs_fr_running > 0)
            error = ip_lookup_ioctl(data, cmd, mode, uid, ctx, ifs);
        else
#endif
            error = EIO;
        break;
    default :
        error = EIO;
        break;
    }

    return error;
}


/*
 * This array defines the expected size of objects coming into the kernel
 * for the various recognised object types.
 */
#define NUM_OBJ_TYPES   19

static  int fr_objbytes[NUM_OBJ_TYPES][2] = {
    { 1,    sizeof(struct frentry) },       /* frentry */
    { 0,    sizeof(struct friostat) },
    { 0,    sizeof(struct fr_info) },
    { 0,    sizeof(struct fr_authstat) },
    { 0,    sizeof(struct ipfrstat) },
    { 0,    sizeof(struct ipnat) },
    { 0,    sizeof(struct natstat) },
    { 0,    sizeof(struct ipstate_save) },
    { 1,    sizeof(struct nat_save) },      /* nat_save */
    { 0,    sizeof(struct natlookup) },
    { 1,    sizeof(struct ipstate) },       /* ipstate */
    { 0,    sizeof(struct ips_stat) },
    { 0,    sizeof(struct frauth) },
    { 0,    sizeof(struct ipftune) },
    { 0,    sizeof(struct nat) },                   /* nat_t */
    { 0,    sizeof(struct ipfruleiter) },
    { 0,    sizeof(struct ipfgeniter) },
    { 0,    sizeof(struct ipftable) },
    { 0,    sizeof(struct ipflookupiter) }
};


/* ------------------------------------------------------------------------ */
/* Function:    fr_getzoneid                                                */
/* Returns:     int     - 0 = success, else failure                         */
/* Parameters:  idsp(I) - pointer to ipf_devstate_t                         */
/*              data(I) - pointer to ioctl data                             */
/*                                                                          */
/* Set the zone ID in idsp based on the zone name in ipfzoneobj.  Further   */
/* ioctls will act on the IPF stack for that zone ID.                       */
/* ------------------------------------------------------------------------ */
#if defined(_KERNEL)
int fr_setzoneid(idsp, data)
ipf_devstate_t *idsp;
void *data;
{
    int error = 0;
    ipfzoneobj_t ipfzo;
    zone_t *zone;

    error = BCOPYIN(data, &ipfzo, sizeof(ipfzo));
    if (error != 0)
        return EFAULT;

    if (memchr(ipfzo.ipfz_zonename, '\0', ZONENAME_MAX) == NULL)
        return EFAULT;

    /*
     * The global zone doesn't have a GZ-controlled stack, so no
     * sense in going any further
     */
    if (strcmp(ipfzo.ipfz_zonename, "global") == 0)
        return ENODEV;

    if ((zone = zone_find_by_name(ipfzo.ipfz_zonename)) == NULL)
        return ENODEV;

    /*
     * Store the zone ID that to control, and whether it's the
     * GZ-controlled stack that's wanted
     */
    idsp->ipfs_zoneid = zone->zone_id;
    idsp->ipfs_gz = (ipfzo.ipfz_gz == 1) ? B_TRUE : B_FALSE;
    zone_rele(zone);

    return error;
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    fr_inobj                                                    */
/* Returns:     int     - 0 = success, else failure                         */
/* Parameters:  data(I) - pointer to ioctl data                             */
/*              ptr(I)  - pointer to store real data in                     */
/*              type(I) - type of structure being moved                     */
/*                                                                          */
/* Copy in the contents of what the ipfobj_t points to.  In future, we      */
/* add things to check for version numbers, sizes, etc, to make it backward */
/* compatible at the ABI for user land.                                     */
/* ------------------------------------------------------------------------ */
int fr_inobj(data, ptr, type)
void *data;
void *ptr;
int type;
{
    ipfobj_t obj;
    int error = 0;

    if ((type < 0) || (type > NUM_OBJ_TYPES-1))
        return EINVAL;

    error = BCOPYIN((caddr_t)data, (caddr_t)&obj, sizeof(obj));
    if (error != 0)
        return EFAULT;

    if (obj.ipfo_type != type)
        return EINVAL;

#ifndef IPFILTER_COMPAT
    if ((fr_objbytes[type][0] & 1) != 0) {
        if (obj.ipfo_size < fr_objbytes[type][1])
            return EINVAL;
    } else if (obj.ipfo_size != fr_objbytes[type][1])
        return EINVAL;
#else
    if (obj.ipfo_rev != IPFILTER_VERSION) {
        error = fr_incomptrans(&obj, ptr);
        return error;
    }

    if ((fr_objbytes[type][0] & 1) != 0 &&
        obj.ipfo_size < fr_objbytes[type][1] ||
        obj.ipfo_size != fr_objbytes[type][1])
        return EINVAL;
#endif

    if ((fr_objbytes[type][0] & 1) != 0) {
        error = COPYIN((caddr_t)obj.ipfo_ptr, (caddr_t)ptr,
                fr_objbytes[type][1]);
    } else {
        error = COPYIN((caddr_t)obj.ipfo_ptr, (caddr_t)ptr,
                obj.ipfo_size);
    }
    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_inobjsz                                                  */
/* Returns:     int     - 0 = success, else failure                         */
/* Parameters:  data(I) - pointer to ioctl data                             */
/*              ptr(I)  - pointer to store real data in                     */
/*              type(I) - type of structure being moved                     */
/*              sz(I)   - size of data to copy                              */
/*                                                                          */
/* As per fr_inobj, except the size of the object to copy in is passed in   */
/* but it must not be smaller than the size defined for the type and the    */
/* type must allow for varied sized objects.  The extra requirement here is */
/* that sz must match the size of the object being passed in - this is not  */
/* not possible nor required in fr_inobj().                                 */
/* ------------------------------------------------------------------------ */
int fr_inobjsz(data, ptr, type, sz)
void *data;
void *ptr;
int type, sz;
{
    ipfobj_t obj;
    int error;

    if ((type < 0) || (type > NUM_OBJ_TYPES-1))
        return EINVAL;
    if (((fr_objbytes[type][0] & 1) == 0) || (sz < fr_objbytes[type][1]))
        return EINVAL;

    error = BCOPYIN((caddr_t)data, (caddr_t)&obj, sizeof(obj));
    if (error != 0)
        return EFAULT;

    if (obj.ipfo_type != type)
        return EINVAL;

#ifndef IPFILTER_COMPAT
    if (obj.ipfo_size != sz)
        return EINVAL;
#else
    if (obj.ipfo_rev != IPFILTER_VERSION)
        /*XXX compatibility hook here */
        /*EMPTY*/;
    if (obj.ipfo_size != sz)
        /* XXX compatibility hook here */
        return EINVAL;
#endif

    error = COPYIN((caddr_t)obj.ipfo_ptr, (caddr_t)ptr, sz);
    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_outobjsz                                                 */
/* Returns:     int     - 0 = success, else failure                         */
/* Parameters:  data(I) - pointer to ioctl data                             */
/*              ptr(I)  - pointer to store real data in                     */
/*              type(I) - type of structure being moved                     */
/*              sz(I)   - size of data to copy                              */
/*                                                                          */
/* As per fr_outobj, except the size of the object to copy out is passed in */
/* but it must not be smaller than the size defined for the type and the    */
/* type must allow for varied sized objects.  The extra requirement here is */
/* that sz must match the size of the object being passed in - this is not  */
/* not possible nor required in fr_outobj().                                */
/* ------------------------------------------------------------------------ */
int fr_outobjsz(data, ptr, type, sz)
void *data;
void *ptr;
int type, sz;
{
    ipfobj_t obj;
    int error;

    if ((type < 0) || (type > NUM_OBJ_TYPES-1) ||
        ((fr_objbytes[type][0] & 1) == 0) ||
        (sz < fr_objbytes[type][1]))
        return EINVAL;

    error = BCOPYIN((caddr_t)data, (caddr_t)&obj, sizeof(obj));
    if (error != 0)
        return EFAULT;

    if (obj.ipfo_type != type)
        return EINVAL;

#ifndef IPFILTER_COMPAT
    if (obj.ipfo_size != sz)
        return EINVAL;
#else
    if (obj.ipfo_rev != IPFILTER_VERSION)
        /* XXX compatibility hook here */
        /*EMPTY*/;
    if (obj.ipfo_size != sz)
        /* XXX compatibility hook here */
        return EINVAL;
#endif

    error = COPYOUT((caddr_t)ptr, (caddr_t)obj.ipfo_ptr, sz);
    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_outobj                                                   */
/* Returns:     int     - 0 = success, else failure                         */
/* Parameters:  data(I) - pointer to ioctl data                             */
/*              ptr(I)  - pointer to store real data in                     */
/*              type(I) - type of structure being moved                     */
/*                                                                          */
/* Copy out the contents of what ptr is to where ipfobj points to.  In      */
/* future, we add things to check for version numbers, sizes, etc, to make  */
/* it backward  compatible at the ABI for user land.                        */
/* ------------------------------------------------------------------------ */
int fr_outobj(data, ptr, type)
void *data;
void *ptr;
int type;
{
    ipfobj_t obj;
    int error;

    if ((type < 0) || (type > NUM_OBJ_TYPES-1))
        return EINVAL;

    error = BCOPYIN((caddr_t)data, (caddr_t)&obj, sizeof(obj));
    if (error != 0)
        return EFAULT;

    if (obj.ipfo_type != type)
        return EINVAL;

#ifndef IPFILTER_COMPAT
    if ((fr_objbytes[type][0] & 1) != 0) {
        if (obj.ipfo_size < fr_objbytes[type][1])
            return EINVAL;
    } else if (obj.ipfo_size != fr_objbytes[type][1])
        return EINVAL;
#else
    if (obj.ipfo_rev != IPFILTER_VERSION) {
        error = fr_outcomptrans(&obj, ptr);
        return error;
    }

    if ((fr_objbytes[type][0] & 1) != 0 &&
        obj.ipfo_size < fr_objbytes[type][1] ||
        obj.ipfo_size != fr_objbytes[type][1])
        return EINVAL;
#endif

    error = COPYOUT((caddr_t)ptr, (caddr_t)obj.ipfo_ptr, obj.ipfo_size);
    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_checkl4sum                                               */
/* Returns:     int     - 0 = good, -1 = bad, 1 = cannot check              */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* If possible, calculate the layer 4 checksum for the packet.  If this is  */
/* not possible, return without indicating a failure or success but in a    */
/* way that is ditinguishable.                                              */
/* ------------------------------------------------------------------------ */
int fr_checkl4sum(fin)
fr_info_t *fin;
{
    u_short sum, hdrsum, *csump;
    udphdr_t *udp;
    int dosum;
    ipf_stack_t *ifs = fin->fin_ifs;

#if SOLARIS && defined(_KERNEL) && (SOLARIS2 >= 6)
    net_handle_t net_data_p;
    if (fin->fin_v == 4)
        net_data_p = ifs->ifs_ipf_ipv4;
    else
        net_data_p = ifs->ifs_ipf_ipv6;
#endif

    if ((fin->fin_flx & FI_NOCKSUM) != 0)
        return 0;

    /*
     * If the TCP packet isn't a fragment, isn't too short and otherwise
     * isn't already considered "bad", then validate the checksum.  If
     * this check fails then considered the packet to be "bad".
     */
    if ((fin->fin_flx & (FI_FRAG|FI_SHORT|FI_BAD)) != 0)
        return 1;

    csump = NULL;
    hdrsum = 0;
    dosum = 0;
    sum = 0;

#if SOLARIS && defined(_KERNEL) && (SOLARIS2 >= 6)
    ASSERT(fin->fin_m != NULL);
    if (NET_IS_HCK_L4_FULL(net_data_p, fin->fin_m) ||
        NET_IS_HCK_L4_PART(net_data_p, fin->fin_m)) {
            hdrsum = 0;
            sum = 0;
    } else {
#endif
        switch (fin->fin_p)
        {
        case IPPROTO_TCP :
            csump = &((tcphdr_t *)fin->fin_dp)->th_sum;
            dosum = 1;
            break;

        case IPPROTO_UDP :
            udp = fin->fin_dp;
            if (udp->uh_sum != 0) {
                csump = &udp->uh_sum;
                dosum = 1;
            }
            break;

        case IPPROTO_ICMP :
            csump = &((struct icmp *)fin->fin_dp)->icmp_cksum;
            dosum = 1;
            break;

        default :
            return 1;
            /*NOTREACHED*/
        }

        if (csump != NULL)
            hdrsum = *csump;

        if (dosum)
            sum = fr_cksum(fin->fin_m, fin->fin_ip,
                       fin->fin_p, fin->fin_dp);
#if SOLARIS && defined(_KERNEL) && (SOLARIS2 >= 6)
    }
#endif
#if !defined(_KERNEL)
    if (sum == hdrsum) {
        FR_DEBUG(("checkl4sum: %hx == %hx\n", sum, hdrsum));
    } else {
        FR_DEBUG(("checkl4sum: %hx != %hx\n", sum, hdrsum));
    }
#endif
    if (hdrsum == sum)
        return 0;
    return -1;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_ifpfillv4addr                                            */
/* Returns:     int     - 0 = address update, -1 = address not updated      */
/* Parameters:  atype(I)   - type of network address update to perform      */
/*              sin(I)     - pointer to source of address information       */
/*              mask(I)    - pointer to source of netmask information       */
/*              inp(I)     - pointer to destination address store           */
/*              inpmask(I) - pointer to destination netmask store           */
/*                                                                          */
/* Given a type of network address update (atype) to perform, copy          */
/* information from sin/mask into inp/inpmask.  If ipnmask is NULL then no  */
/* netmask update is performed unless FRI_NETMASKED is passed as atype, in  */
/* which case the operation fails.  For all values of atype other than      */
/* FRI_NETMASKED, if inpmask is non-NULL then the mask is set to an all 1s  */
/* value.                                                                   */
/* ------------------------------------------------------------------------ */
int fr_ifpfillv4addr(atype, sin, mask, inp, inpmask)
int atype;
struct sockaddr_in *sin, *mask;
struct in_addr *inp, *inpmask;
{
    if (inpmask != NULL && atype != FRI_NETMASKED)
        inpmask->s_addr = 0xffffffff;

    if (atype == FRI_NETWORK || atype == FRI_NETMASKED) {
        if (atype == FRI_NETMASKED) {
            if (inpmask == NULL)
                return -1;
            inpmask->s_addr = mask->sin_addr.s_addr;
        }
        inp->s_addr = sin->sin_addr.s_addr & mask->sin_addr.s_addr;
    } else {
        inp->s_addr = sin->sin_addr.s_addr;
    }
    return 0;
}


#ifdef  USE_INET6
/* ------------------------------------------------------------------------ */
/* Function:    fr_ifpfillv6addr                                            */
/* Returns:     int     - 0 = address update, -1 = address not updated      */
/* Parameters:  atype(I)   - type of network address update to perform      */
/*              sin(I)     - pointer to source of address information       */
/*              mask(I)    - pointer to source of netmask information       */
/*              inp(I)     - pointer to destination address store           */
/*              inpmask(I) - pointer to destination netmask store           */
/*                                                                          */
/* Given a type of network address update (atype) to perform, copy          */
/* information from sin/mask into inp/inpmask.  If ipnmask is NULL then no  */
/* netmask update is performed unless FRI_NETMASKED is passed as atype, in  */
/* which case the operation fails.  For all values of atype other than      */
/* FRI_NETMASKED, if inpmask is non-NULL then the mask is set to an all 1s  */
/* value.                                                                   */
/* ------------------------------------------------------------------------ */
int fr_ifpfillv6addr(atype, sin, mask, inp, inpmask)
int atype;
struct sockaddr_in6 *sin, *mask;
struct in_addr *inp, *inpmask;
{
    i6addr_t *src, *dst, *and, *dmask;

    src = (i6addr_t *)&sin->sin6_addr;
    and = (i6addr_t *)&mask->sin6_addr;
    dst = (i6addr_t *)inp;
    dmask = (i6addr_t *)inpmask;

    if (inpmask != NULL && atype != FRI_NETMASKED) {
        dmask->i6[0] = 0xffffffff;
        dmask->i6[1] = 0xffffffff;
        dmask->i6[2] = 0xffffffff;
        dmask->i6[3] = 0xffffffff;
    }

    if (atype == FRI_NETWORK || atype == FRI_NETMASKED) {
        if (atype == FRI_NETMASKED) {
            if (inpmask == NULL)
                return -1;
            dmask->i6[0] = and->i6[0];
            dmask->i6[1] = and->i6[1];
            dmask->i6[2] = and->i6[2];
            dmask->i6[3] = and->i6[3];
        }

        dst->i6[0] = src->i6[0] & and->i6[0];
        dst->i6[1] = src->i6[1] & and->i6[1];
        dst->i6[2] = src->i6[2] & and->i6[2];
        dst->i6[3] = src->i6[3] & and->i6[3];
    } else {
        dst->i6[0] = src->i6[0];
        dst->i6[1] = src->i6[1];
        dst->i6[2] = src->i6[2];
        dst->i6[3] = src->i6[3];
    }
    return 0;
}
#endif


/* ------------------------------------------------------------------------ */
/* Function:    fr_matchtag                                                 */
/* Returns:     0 == mismatch, 1 == match.                                  */
/* Parameters:  tag1(I) - pointer to first tag to compare                   */
/*              tag2(I) - pointer to second tag to compare                  */
/*                                                                          */
/* Returns true (non-zero) or false(0) if the two tag structures can be     */
/* considered to be a match or not match, respectively.  The tag is 16      */
/* bytes long (16 characters) but that is overlayed with 4 32bit ints so    */
/* compare the ints instead, for speed. tag1 is the master of the           */
/* comparison.  This function should only be called with both tag1 and tag2 */
/* as non-NULL pointers.                                                    */
/* ------------------------------------------------------------------------ */
int fr_matchtag(tag1, tag2)
ipftag_t *tag1, *tag2;
{
    if (tag1 == tag2)
        return 1;

    if ((tag1->ipt_num[0] == 0) && (tag2->ipt_num[0] == 0))
        return 1;

    if ((tag1->ipt_num[0] == tag2->ipt_num[0]) &&
        (tag1->ipt_num[1] == tag2->ipt_num[1]) &&
        (tag1->ipt_num[2] == tag2->ipt_num[2]) &&
        (tag1->ipt_num[3] == tag2->ipt_num[3]))
        return 1;
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_coalesce                                                 */
/* Returns:     1 == success, -1 == failure, 0 == no change                 */
/* Parameters:  fin(I) - pointer to packet information                      */
/*                                                                          */
/* Attempt to get all of the packet data into a single, contiguous buffer.  */
/* If this call returns a failure then the buffers have also been freed.    */
/* ------------------------------------------------------------------------ */
int fr_coalesce(fin)
fr_info_t *fin;
{
    ipf_stack_t *ifs = fin->fin_ifs;
    if ((fin->fin_flx & FI_COALESCE) != 0)
        return 1;

    /*
     * If the mbuf pointers indicate that there is no mbuf to work with,
     * return but do not indicate success or failure.
     */
    if (fin->fin_m == NULL || fin->fin_mp == NULL)
        return 0;

#if defined(_KERNEL)
    if (fr_pullup(fin->fin_m, fin, fin->fin_plen) == NULL) {
        IPF_BUMP(ifs->ifs_fr_badcoalesces[fin->fin_out]);
# ifdef MENTAT
        FREE_MB_T(*fin->fin_mp);
# endif
        *fin->fin_mp = NULL;
        fin->fin_m = NULL;
        return -1;
    }
#else
    fin = fin;  /* LINT */
#endif
    return 1;
}


/*
 * The following table lists all of the tunable variables that can be
 * accessed via SIOCIPFGET/SIOCIPFSET/SIOCIPFGETNEXT.  The format of each row
 * in the table below is as follows:
 *
 * pointer to value, name of value, minimum, maximum, size of the value's
 *     container, value attribute flags
 *
 * For convienience, IPFT_RDONLY means the value is read-only, IPFT_WRDISABLED
 * means the value can only be written to when IPFilter is loaded but disabled.
 * The obvious implication is if neither of these are set then the value can be
 * changed at any time without harm.
 */
ipftuneable_t lcl_ipf_tuneables[] = {
    /* filtering */
    { { NULL }, "fr_flags",     0,  0xffffffff,
            0,      0 },
    { { NULL }, "fr_active",        0,  0,
            0,      IPFT_RDONLY },
    { { NULL }, "fr_control_forwarding",    0, 1,
            0,      0 },
    { { NULL }, "fr_update_ipid",   0,  1,
            0,      0 },
    { { NULL }, "fr_chksrc",        0,  1,
            0,      0 },
    { { NULL }, "fr_minttl",        0,  1,
            0,      0 },
    { { NULL },     "fr_icmpminfragmtu",    0,  1,
            0,      0 },
    { { NULL },     "fr_pass",      0,  0xffffffff,
            0,      0 },
#if SOLARIS2 >= 10
    { { NULL }, "ipf_loopback",     0,  1,
            0,      IPFT_WRDISABLED },
#endif
    /* state */
    { { NULL }, "fr_tcpidletimeout",    1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_tcpclosewait",  1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_tcplastack",    1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_tcptimeout",    1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_tcpclosed",     1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_tcphalfclosed", 1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_udptimeout",    1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_udpacktimeout", 1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_icmptimeout",   1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_icmpacktimeout",    1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_iptimeout",     1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_statemax",      1,  0x7fffffff,
            0,      0 },
    { { NULL }, "fr_statesize",     1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_state_lock",    0,  1,
            0,      IPFT_RDONLY },
    { { NULL }, "fr_state_maxbucket", 1,    0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_state_maxbucket_reset", 0, 1,
            0, IPFT_WRDISABLED },
    { { NULL }, "ipstate_logging",  0,  1,
            0,  0 },
    { { NULL }, "state_flush_level_hi", 1,  100,
            0,      0 },
    { { NULL }, "state_flush_level_lo", 1,  100,
            0,      0 },
    /* nat */
    { { NULL },     "fr_nat_lock",      0,  1,
            0,      IPFT_RDONLY },
    { { NULL }, "ipf_nattable_sz",  1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "ipf_nattable_max", 1,  0x7fffffff,
            0,  0 },
    { { NULL }, "ipf_natrules_sz",  1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "ipf_rdrrules_sz",  1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "ipf_hostmap_sz",   1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_nat_maxbucket", 1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "fr_nat_maxbucket_reset",   0, 1,
            0,  IPFT_WRDISABLED },
    { { NULL },     "nat_logging",      0,  1,
            0,      0 },
    { { NULL }, "fr_defnatage",     1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_defnatipage",   1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_defnaticmpage", 1,  0x7fffffff,
            0,  IPFT_WRDISABLED },
    { { NULL }, "nat_flush_level_hi",   1,  100,
            0,      0 },
    { { NULL }, "nat_flush_level_lo",   1,  100,
            0,      0 },
    /* frag */
    { { NULL }, "ipfr_size",        1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "fr_ipfrttl",       1,  0x7fffffff,
            0,      IPFT_WRDISABLED },
#ifdef IPFILTER_LOG
    /* log */
    { { NULL }, "ipl_suppress",     0,  1,
            0,      0 },
    { { NULL }, "ipl_buffer_sz",    0,  0,
            0,      IPFT_RDONLY },
    { { NULL }, "ipl_logmax",       0,  0x7fffffff,
            0,      IPFT_WRDISABLED },
    { { NULL }, "ipl_logall",       0,  1,
            0,      0 },
    { { NULL }, "ipl_logsize",      0,  0x80000,
            0,      0 },
#endif
    { { NULL },     NULL,           0,  0 }
};

static ipftuneable_t *
tune_lookup(ipf_stack_t *ifs, char *name)
{
    int i;

    for (i = 0; ifs->ifs_ipf_tuneables[i].ipft_name != NULL; i++) {
    if (strcmp(ifs->ifs_ipf_tuneables[i].ipft_name, name) == 0)
        return (&ifs->ifs_ipf_tuneables[i]);
    }
    return (NULL);
}

#ifdef _KERNEL
extern dev_info_t *ipf_dev_info;
extern int ipf_property_update __P((dev_info_t *, ipf_stack_t *));
#endif

/* -------------------------------------------------------------------- */
/* Function:    ipftuneable_setdefs()                   */
/* Returns:     void                        */
/* Parameters:  ifs - pointer to newly allocated IPF instance       */
/*              assigned to IP instance     */
/*                                  */
/* Function initializes IPF instance variables. Function is invoked */
/* from ipftuneable_alloc(). ipftuneable_alloc() is called only one */
/* time during IP instance lifetime - at the time of IP instance    */
/* creation. Anytime IP instance is being created new private IPF   */
/* instance is allocated and assigned to it. The moment of IP       */
/* instance creation is the right time to initialize those IPF      */
/* variables.                               */
/*                                  */
/* -------------------------------------------------------------------- */
static void ipftuneable_setdefs(ipf_stack_t *ifs)
{
    ifs->ifs_ipfr_size = IPFT_SIZE;
    ifs->ifs_fr_ipfrttl = 120;  /* 60 seconds */

    /* it comes from fr_authinit() in IPF auth */
    ifs->ifs_fr_authsize = FR_NUMAUTH;
    ifs->ifs_fr_defaultauthage = 600;

    /* it comes from fr_stateinit() in IPF state */
    ifs->ifs_fr_tcpidletimeout = IPF_TTLVAL(3600 * 24 * 5); /* five days */
    ifs->ifs_fr_tcpclosewait = IPF_TTLVAL(TCP_MSL);
    ifs->ifs_fr_tcplastack = IPF_TTLVAL(TCP_MSL);
    ifs->ifs_fr_tcptimeout = IPF_TTLVAL(TCP_MSL);
    ifs->ifs_fr_tcpclosed = IPF_TTLVAL(60);
    ifs->ifs_fr_tcphalfclosed = IPF_TTLVAL(2 * 3600);   /* 2 hours */
    ifs->ifs_fr_udptimeout = IPF_TTLVAL(120);
    ifs->ifs_fr_udpacktimeout = IPF_TTLVAL(12);
    ifs->ifs_fr_icmptimeout = IPF_TTLVAL(60);
    ifs->ifs_fr_icmpacktimeout = IPF_TTLVAL(6);
    ifs->ifs_fr_iptimeout = IPF_TTLVAL(60);
    ifs->ifs_fr_statemax = IPSTATE_MAX;
    ifs->ifs_fr_statesize = IPSTATE_SIZE;
    ifs->ifs_fr_state_maxbucket_reset = 1;
    ifs->ifs_state_flush_level_hi = ST_FLUSH_HI;
    ifs->ifs_state_flush_level_lo = ST_FLUSH_LO;

    /* it comes from fr_natinit() in ipnat */
    ifs->ifs_ipf_nattable_sz = NAT_TABLE_SZ;
    ifs->ifs_ipf_nattable_max = NAT_TABLE_MAX;
    ifs->ifs_ipf_natrules_sz = NAT_SIZE;
    ifs->ifs_ipf_rdrrules_sz = RDR_SIZE;
    ifs->ifs_ipf_hostmap_sz = HOSTMAP_SIZE;
    ifs->ifs_fr_nat_maxbucket_reset = 1;
    ifs->ifs_fr_defnatage = DEF_NAT_AGE;
    ifs->ifs_fr_defnatipage = 120;      /* 60 seconds */
    ifs->ifs_fr_defnaticmpage = 6;      /* 3 seconds */
    ifs->ifs_nat_flush_level_hi = NAT_FLUSH_HI;
    ifs->ifs_nat_flush_level_lo = NAT_FLUSH_LO;

#ifdef IPFILTER_LOG
    /* it comes from fr_loginit() in IPF log */
    ifs->ifs_ipl_suppress = 1;
    ifs->ifs_ipl_logmax = IPL_LOGMAX;
    ifs->ifs_ipl_logsize = IPFILTER_LOGSIZE;

    /* from fr_natinit() */
    ifs->ifs_nat_logging = 1;

    /* from fr_stateinit() */
    ifs->ifs_ipstate_logging = 1;
#else
    /* from fr_natinit() */
    ifs->ifs_nat_logging = 0;

    /* from fr_stateinit() */
    ifs->ifs_ipstate_logging = 0;
#endif
    ifs->ifs_ipf_loopback = 0;

}
/*
 * Allocate a per-stack tuneable and copy in the names. Then
 * set it to point to each of the per-stack tunables.
 */
void
ipftuneable_alloc(ipf_stack_t *ifs)
{
    ipftuneable_t *item;

    KMALLOCS(ifs->ifs_ipf_tuneables, ipftuneable_t *,
    sizeof (lcl_ipf_tuneables));
    bcopy(lcl_ipf_tuneables, ifs->ifs_ipf_tuneables,
    sizeof (lcl_ipf_tuneables));

#define TUNE_SET(_ifs, _name, _field)           \
    item = tune_lookup((_ifs), (_name));        \
    if (item != NULL) {                 \
    item->ipft_una.ipftp_int = (unsigned int *)&((_ifs)->_field);   \
    item->ipft_sz = sizeof ((_ifs)->_field);    \
    }

    TUNE_SET(ifs, "fr_flags", ifs_fr_flags);
    TUNE_SET(ifs, "fr_active", ifs_fr_active);
    TUNE_SET(ifs, "fr_control_forwarding", ifs_fr_control_forwarding);
    TUNE_SET(ifs, "fr_update_ipid", ifs_fr_update_ipid);
    TUNE_SET(ifs, "fr_chksrc", ifs_fr_chksrc);
    TUNE_SET(ifs, "fr_minttl", ifs_fr_minttl);
    TUNE_SET(ifs, "fr_icmpminfragmtu", ifs_fr_icmpminfragmtu);
    TUNE_SET(ifs, "fr_pass", ifs_fr_pass);
    TUNE_SET(ifs, "fr_tcpidletimeout", ifs_fr_tcpidletimeout);
    TUNE_SET(ifs, "fr_tcpclosewait", ifs_fr_tcpclosewait);
    TUNE_SET(ifs, "fr_tcplastack", ifs_fr_tcplastack);
    TUNE_SET(ifs, "fr_tcptimeout", ifs_fr_tcptimeout);
    TUNE_SET(ifs, "fr_tcpclosed", ifs_fr_tcpclosed);
    TUNE_SET(ifs, "fr_tcphalfclosed", ifs_fr_tcphalfclosed);
    TUNE_SET(ifs, "fr_udptimeout", ifs_fr_udptimeout);
    TUNE_SET(ifs, "fr_udpacktimeout", ifs_fr_udpacktimeout);
    TUNE_SET(ifs, "fr_icmptimeout", ifs_fr_icmptimeout);
    TUNE_SET(ifs, "fr_icmpacktimeout", ifs_fr_icmpacktimeout);
    TUNE_SET(ifs, "fr_iptimeout", ifs_fr_iptimeout);
    TUNE_SET(ifs, "fr_statemax", ifs_fr_statemax);
    TUNE_SET(ifs, "fr_statesize", ifs_fr_statesize);
    TUNE_SET(ifs, "fr_state_lock", ifs_fr_state_lock);
    TUNE_SET(ifs, "fr_state_maxbucket", ifs_fr_state_maxbucket);
    TUNE_SET(ifs, "fr_state_maxbucket_reset", ifs_fr_state_maxbucket_reset);
    TUNE_SET(ifs, "ipstate_logging", ifs_ipstate_logging);
    TUNE_SET(ifs, "fr_nat_lock", ifs_fr_nat_lock);
    TUNE_SET(ifs, "ipf_nattable_sz", ifs_ipf_nattable_sz);
    TUNE_SET(ifs, "ipf_nattable_max", ifs_ipf_nattable_max);
    TUNE_SET(ifs, "ipf_natrules_sz", ifs_ipf_natrules_sz);
    TUNE_SET(ifs, "ipf_rdrrules_sz", ifs_ipf_rdrrules_sz);
    TUNE_SET(ifs, "ipf_hostmap_sz", ifs_ipf_hostmap_sz);
    TUNE_SET(ifs, "fr_nat_maxbucket", ifs_fr_nat_maxbucket);
    TUNE_SET(ifs, "fr_nat_maxbucket_reset", ifs_fr_nat_maxbucket_reset);
    TUNE_SET(ifs, "nat_logging", ifs_nat_logging);
    TUNE_SET(ifs, "fr_defnatage", ifs_fr_defnatage);
    TUNE_SET(ifs, "fr_defnatipage", ifs_fr_defnatipage);
    TUNE_SET(ifs, "fr_defnaticmpage", ifs_fr_defnaticmpage);
    TUNE_SET(ifs, "nat_flush_level_hi", ifs_nat_flush_level_hi);
    TUNE_SET(ifs, "nat_flush_level_lo", ifs_nat_flush_level_lo);
    TUNE_SET(ifs, "state_flush_level_hi", ifs_state_flush_level_hi);
    TUNE_SET(ifs, "state_flush_level_lo", ifs_state_flush_level_lo);
    TUNE_SET(ifs, "ipfr_size", ifs_ipfr_size);
    TUNE_SET(ifs, "fr_ipfrttl", ifs_fr_ipfrttl);
    TUNE_SET(ifs, "ipf_loopback", ifs_ipf_loopback);
#ifdef IPFILTER_LOG
    TUNE_SET(ifs, "ipl_suppress", ifs_ipl_suppress);
    TUNE_SET(ifs, "ipl_buffer_sz", ifs_ipl_buffer_sz);
    TUNE_SET(ifs, "ipl_logmax", ifs_ipl_logmax);
    TUNE_SET(ifs, "ipl_logall", ifs_ipl_logall);
    TUNE_SET(ifs, "ipl_logsize", ifs_ipl_logsize);
#endif
#undef TUNE_SET

    ipftuneable_setdefs(ifs);

#ifdef _KERNEL
    (void) ipf_property_update(ipf_dev_info, ifs);
#endif
}

void
ipftuneable_free(ipf_stack_t *ifs)
{
    KFREES(ifs->ifs_ipf_tuneables, sizeof (lcl_ipf_tuneables));
    ifs->ifs_ipf_tuneables = NULL;
}

/* ------------------------------------------------------------------------ */
/* Function:    fr_findtunebycookie                                         */
/* Returns:     NULL = search failed, else pointer to tune struct           */
/* Parameters:  cookie(I) - cookie value to search for amongst tuneables    */
/*              next(O)   - pointer to place to store the cookie for the    */
/*                          "next" tuneable, if it is desired.              */
/*                                                                          */
/* This function is used to walk through all of the existing tunables with  */
/* successive calls.  It searches the known tunables for the one which has  */
/* a matching value for "cookie" - ie its address.  When returning a match, */
/* the next one to be found may be returned inside next.                    */
/* ------------------------------------------------------------------------ */
static ipftuneable_t *fr_findtunebycookie(cookie, next, ifs)
void *cookie, **next;
ipf_stack_t * ifs;
{
    ipftuneable_t *ta, **tap;

    for (ta = ifs->ifs_ipf_tuneables; ta->ipft_name != NULL; ta++)
        if (ta == cookie) {
            if (next != NULL) {
                /*
                 * If the next entry in the array has a name
                 * present, then return a pointer to it for
                 * where to go next, else return a pointer to
                 * the dynaminc list as a key to search there
                 * next.  This facilitates a weak linking of
                 * the two "lists" together.
                 */
                if ((ta + 1)->ipft_name != NULL)
                    *next = ta + 1;
                else
                    *next = &ifs->ifs_ipf_tunelist;
            }
            return ta;
        }

    for (tap = &ifs->ifs_ipf_tunelist; (ta = *tap) != NULL; tap = &ta->ipft_next)
        if (tap == cookie) {
            if (next != NULL)
                *next = &ta->ipft_next;
            return ta;
        }

    if (next != NULL)
        *next = NULL;
    return NULL;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_findtunebyname                                           */
/* Returns:     NULL = search failed, else pointer to tune struct           */
/* Parameters:  name(I) - name of the tuneable entry to find.               */
/*                                                                          */
/* Search the static array of tuneables and the list of dynamic tuneables   */
/* for an entry with a matching name.  If we can find one, return a pointer */
/* to the matching structure.                                               */
/* ------------------------------------------------------------------------ */
static ipftuneable_t *fr_findtunebyname(name, ifs)
const char *name;
ipf_stack_t *ifs;
{
    ipftuneable_t *ta;

    for (ta = ifs->ifs_ipf_tuneables; ta->ipft_name != NULL; ta++)
        if (!strcmp(ta->ipft_name, name)) {
            return ta;
        }

    for (ta = ifs->ifs_ipf_tunelist; ta != NULL; ta = ta->ipft_next)
        if (!strcmp(ta->ipft_name, name)) {
            return ta;
        }

    return NULL;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_addipftune                                               */
/* Returns:     int - 0 == success, else failure                            */
/* Parameters:  newtune - pointer to new tune struct to add to tuneables    */
/*                                                                          */
/* Appends the tune structure pointer to by "newtune" to the end of the     */
/* current list of "dynamic" tuneable parameters.  Once added, the owner    */
/* of the object is not expected to ever change "ipft_next".                */
/* ------------------------------------------------------------------------ */
int fr_addipftune(newtune, ifs)
ipftuneable_t *newtune;
ipf_stack_t *ifs;
{
    ipftuneable_t *ta, **tap;

    ta = fr_findtunebyname(newtune->ipft_name, ifs);
    if (ta != NULL)
        return EEXIST;

    for (tap = &ifs->ifs_ipf_tunelist; *tap != NULL; tap = &(*tap)->ipft_next)
        ;

    newtune->ipft_next = NULL;
    *tap = newtune;
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_delipftune                                               */
/* Returns:     int - 0 == success, else failure                            */
/* Parameters:  oldtune - pointer to tune struct to remove from the list of */
/*                        current dynamic tuneables                         */
/*                                                                          */
/* Search for the tune structure, by pointer, in the list of those that are */
/* dynamically added at run time.  If found, adjust the list so that this   */
/* structure is no longer part of it.                                       */
/* ------------------------------------------------------------------------ */
int fr_delipftune(oldtune, ifs)
ipftuneable_t *oldtune;
ipf_stack_t *ifs;
{
    ipftuneable_t *ta, **tap;

    for (tap = &ifs->ifs_ipf_tunelist; (ta = *tap) != NULL; tap = &ta->ipft_next)
        if (ta == oldtune) {
            *tap = oldtune->ipft_next;
            oldtune->ipft_next = NULL;
            return 0;
        }

    return ESRCH;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_ipftune                                                  */
/* Returns:     int - 0 == success, else failure                            */
/* Parameters:  cmd(I)  - ioctl command number                              */
/*              data(I) - pointer to ioctl data structure                   */
/*                                                                          */
/* Implement handling of SIOCIPFGETNEXT, SIOCIPFGET and SIOCIPFSET.  These  */
/* three ioctls provide the means to access and control global variables    */
/* within IPFilter, allowing (for example) timeouts and table sizes to be   */
/* changed without rebooting, reloading or recompiling.  The initialisation */
/* and 'destruction' routines of the various components of ipfilter are all */
/* each responsible for handling their own values being too big.            */
/* ------------------------------------------------------------------------ */
int fr_ipftune(cmd, data, ifs)
ioctlcmd_t cmd;
void *data;
ipf_stack_t *ifs;
{
    ipftuneable_t *ta;
    ipftune_t tu;
    void *cookie;
    int error;

    error = fr_inobj(data, &tu, IPFOBJ_TUNEABLE);
    if (error != 0)
        return error;

    tu.ipft_name[sizeof(tu.ipft_name) - 1] = '\0';
    cookie = tu.ipft_cookie;
    ta = NULL;

    switch (cmd)
    {
    case SIOCIPFGETNEXT :
        /*
         * If cookie is non-NULL, assume it to be a pointer to the last
         * entry we looked at, so find it (if possible) and return a
         * pointer to the next one after it.  The last entry in the
         * the table is a NULL entry, so when we get to it, set cookie
         * to NULL and return that, indicating end of list, erstwhile
         * if we come in with cookie set to NULL, we are starting anew
         * at the front of the list.
         */
        if (cookie != NULL) {
            ta = fr_findtunebycookie(cookie, &tu.ipft_cookie, ifs);
        } else {
            ta = ifs->ifs_ipf_tuneables;
            tu.ipft_cookie = ta + 1;
        }
        if (ta != NULL) {
            /*
             * Entry found, but does the data pointed to by that
             * row fit in what we can return?
             */
            if (ta->ipft_sz > sizeof(tu.ipft_un))
                return EINVAL;

            tu.ipft_vlong = 0;
            if (ta->ipft_sz == sizeof(u_long))
                tu.ipft_vlong = *ta->ipft_plong;
            else if (ta->ipft_sz == sizeof(u_int))
                tu.ipft_vint = *ta->ipft_pint;
            else if (ta->ipft_sz == sizeof(u_short))
                tu.ipft_vshort = *ta->ipft_pshort;
            else if (ta->ipft_sz == sizeof(u_char))
                tu.ipft_vchar = *ta->ipft_pchar;

            tu.ipft_sz = ta->ipft_sz;
            tu.ipft_min = ta->ipft_min;
            tu.ipft_max = ta->ipft_max;
            tu.ipft_flags = ta->ipft_flags;
            bcopy(ta->ipft_name, tu.ipft_name,
                  MIN(sizeof(tu.ipft_name),
                  strlen(ta->ipft_name) + 1));
        }
        error = fr_outobj(data, &tu, IPFOBJ_TUNEABLE);
        break;

    case SIOCIPFGET :
    case SIOCIPFSET :
        /*
         * Search by name or by cookie value for a particular entry
         * in the tuning paramter table.
         */
        error = ESRCH;
        if (cookie != NULL) {
            ta = fr_findtunebycookie(cookie, NULL, ifs);
            if (ta != NULL)
                error = 0;
        } else if (tu.ipft_name[0] != '\0') {
            ta = fr_findtunebyname(tu.ipft_name, ifs);
            if (ta != NULL)
                error = 0;
        }
        if (error != 0)
            break;

        if (cmd == (ioctlcmd_t)SIOCIPFGET) {
            /*
             * Fetch the tuning parameters for a particular value
             */
            tu.ipft_vlong = 0;
            if (ta->ipft_sz == sizeof(u_long))
                tu.ipft_vlong = *ta->ipft_plong;
            else if (ta->ipft_sz == sizeof(u_int))
                tu.ipft_vint = *ta->ipft_pint;
            else if (ta->ipft_sz == sizeof(u_short))
                tu.ipft_vshort = *ta->ipft_pshort;
            else if (ta->ipft_sz == sizeof(u_char))
                tu.ipft_vchar = *ta->ipft_pchar;
            tu.ipft_cookie = ta;
            tu.ipft_sz = ta->ipft_sz;
            tu.ipft_min = ta->ipft_min;
            tu.ipft_max = ta->ipft_max;
            tu.ipft_flags = ta->ipft_flags;
            error = fr_outobj(data, &tu, IPFOBJ_TUNEABLE);

        } else if (cmd == (ioctlcmd_t)SIOCIPFSET) {
            /*
             * Set an internal parameter.  The hard part here is
             * getting the new value safely and correctly out of
             * the kernel (given we only know its size, not type.)
             */
            u_long in;

            if (((ta->ipft_flags & IPFT_WRDISABLED) != 0) &&
                (ifs->ifs_fr_running > 0)) {
                error = EBUSY;
                break;
            }

            in = tu.ipft_vlong;
            if (in < ta->ipft_min || in > ta->ipft_max) {
                error = EINVAL;
                break;
            }

            if (ta->ipft_sz == sizeof(u_long)) {
                tu.ipft_vlong = *ta->ipft_plong;
                *ta->ipft_plong = in;
            } else if (ta->ipft_sz == sizeof(u_int)) {
                tu.ipft_vint = *ta->ipft_pint;
                *ta->ipft_pint = (u_int)(in & 0xffffffff);
            } else if (ta->ipft_sz == sizeof(u_short)) {
                tu.ipft_vshort = *ta->ipft_pshort;
                *ta->ipft_pshort = (u_short)(in & 0xffff);
            } else if (ta->ipft_sz == sizeof(u_char)) {
                tu.ipft_vchar = *ta->ipft_pchar;
                *ta->ipft_pchar = (u_char)(in & 0xff);
            }
            error = fr_outobj(data, &tu, IPFOBJ_TUNEABLE);
        }
        break;

    default :
        error = EINVAL;
        break;
    }

    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_initialise                                               */
/* Returns:     int - 0 == success,  < 0 == failure                         */
/* Parameters:  None.                                                       */
/*                                                                          */
/* Call of the initialise functions for all the various subsystems inside   */
/* of IPFilter.  If any of them should fail, return immeadiately a failure  */
/* BUT do not try to recover from the error here.                           */
/* ------------------------------------------------------------------------ */
int fr_initialise(ifs)
ipf_stack_t *ifs;
{
    int i;

#ifdef IPFILTER_LOG
    i = fr_loginit(ifs);
    if (i < 0)
        return -10 + i;
#endif
    i = fr_natinit(ifs);
    if (i < 0)
        return -20 + i;

    i = fr_stateinit(ifs);
    if (i < 0)
        return -30 + i;

    i = fr_authinit(ifs);
    if (i < 0)
        return -40 + i;

    i = fr_fraginit(ifs);
    if (i < 0)
        return -50 + i;

    i = appr_init(ifs);
    if (i < 0)
        return -60 + i;

#ifdef IPFILTER_SYNC
    i = ipfsync_init(ifs);
    if (i < 0)
        return -70 + i;
#endif
#ifdef IPFILTER_SCAN
    i = ipsc_init(ifs);
    if (i < 0)
        return -80 + i;
#endif
#ifdef IPFILTER_LOOKUP
    i = ip_lookup_init(ifs);
    if (i < 0)
        return -90 + i;
#endif
#ifdef IPFILTER_COMPILED
    ipfrule_add(ifs);
#endif
    return 0;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_deinitialise                                             */
/* Returns:     None.                                                       */
/* Parameters:  None.                                                       */
/*                                                                          */
/* Call all the various subsystem cleanup routines to deallocate memory or  */
/* destroy locks or whatever they've done that they need to now undo.       */
/* The order here IS important as there are some cross references of        */
/* internal data structures.                                                */
/* ------------------------------------------------------------------------ */
void fr_deinitialise(ifs)
ipf_stack_t *ifs;
{
    fr_fragunload(ifs);
    fr_authunload(ifs);
    fr_natunload(ifs);
    fr_stateunload(ifs);
#ifdef IPFILTER_SCAN
    fr_scanunload(ifs);
#endif
    appr_unload(ifs);

#ifdef IPFILTER_COMPILED
    ipfrule_remove(ifs);
#endif

    (void) frflush(IPL_LOGIPF, 0, FR_INQUE|FR_OUTQUE|FR_INACTIVE, ifs);
    (void) frflush(IPL_LOGIPF, 0, FR_INQUE|FR_OUTQUE, ifs);
    (void) frflush(IPL_LOGCOUNT, 0, FR_INQUE|FR_OUTQUE|FR_INACTIVE, ifs);
    (void) frflush(IPL_LOGCOUNT, 0, FR_INQUE|FR_OUTQUE, ifs);

#ifdef IPFILTER_LOOKUP
    ip_lookup_unload(ifs);
#endif

#ifdef IPFILTER_LOG
    fr_logunload(ifs);
#endif
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_zerostats                                                */
/* Returns:     int - 0 = success, else failure                             */
/* Parameters:  data(O) - pointer to pointer for copying data back to       */
/*                                                                          */
/* Copies the current statistics out to userspace and then zero's the       */
/* current ones in the kernel. The lock is only held across the bzero() as  */
/* the copyout may result in paging (ie network activity.)                  */
/* ------------------------------------------------------------------------ */
int fr_zerostats(data, ifs)
caddr_t data;
ipf_stack_t *ifs;
{
    friostat_t fio;
    int error;

    fr_getstat(&fio, ifs);
    error = copyoutptr(&fio, data, sizeof(fio));
    if (error)
        return EFAULT;

    WRITE_ENTER(&ifs->ifs_ipf_mutex);
    bzero((char *)ifs->ifs_frstats, sizeof(*ifs->ifs_frstats) * 2);
    RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

    return 0;
}


#ifdef _KERNEL
/* ------------------------------------------------------------------------ */
/* Function:    fr_resolvedest                                              */
/* Returns:     Nil                                                         */
/* Parameters:  fdp(IO) - pointer to destination information to resolve     */
/*              v(I)    - IP protocol version to match                      */
/*                                                                          */
/* Looks up an interface name in the frdest structure pointed to by fdp and */
/* if a matching name can be found for the particular IP protocol version   */
/* then store the interface pointer in the frdest struct.  If no match is   */
/* found, then set the interface pointer to be -1 as NULL is considered to  */
/* indicate there is no information at all in the structure.                */
/* ------------------------------------------------------------------------ */
void fr_resolvedest(fdp, v, ifs)
frdest_t *fdp;
int v;
ipf_stack_t *ifs;
{
    fdp->fd_ifp = NULL;

    if (*fdp->fd_ifname != '\0') {
        fdp->fd_ifp = GETIFP(fdp->fd_ifname, v, ifs);
        if (fdp->fd_ifp == NULL)
            fdp->fd_ifp = (void *)-1;
    }
}
#endif /* _KERNEL */


/* ------------------------------------------------------------------------ */
/* Function:    fr_resolvenic                                               */
/* Returns:     void* - NULL = wildcard name, -1 = failed to find NIC, else */
/*                      pointer to interface structure for NIC              */
/* Parameters:  name(I) - complete interface name                           */
/*              v(I)    - IP protocol version                               */
/*                                                                          */
/* Look for a network interface structure that firstly has a matching name  */
/* to that passed in and that is also being used for that IP protocol       */
/* version (necessary on some platforms where there are separate listings   */
/* for both IPv4 and IPv6 on the same physical NIC.                         */
/*                                                                          */
/* One might wonder why name gets terminated with a \0 byte in here.  The   */
/* reason is an interface name could get into the kernel structures of ipf  */
/* in any number of ways and so long as they all use the same sized array   */
/* to put the name in, it makes sense to ensure it gets null terminated     */
/* before it is used for its intended purpose - finding its match in the    */
/* kernel's list of configured interfaces.                                  */
/*                                                                          */
/* NOTE: This SHOULD ONLY be used with IPFilter structures that have an     */
/*       array for the name that is LIFNAMSIZ bytes (at least) in length.   */
/* ------------------------------------------------------------------------ */
void *fr_resolvenic(name, v, ifs)
char *name;
int v;
ipf_stack_t *ifs;
{
    void *nic;

    if (name[0] == '\0')
        return NULL;

    if ((name[1] == '\0') && ((name[0] == '-') || (name[0] == '*'))) {
        return NULL;
    }

    name[LIFNAMSIZ - 1] = '\0';

    nic = GETIFP(name, v, ifs);
    if (nic == NULL)
        nic = (void *)-1;
    return nic;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_expiretokens                                            */
/* Returns:     None.                                                       */
/* Parameters:  ifs - ipf stack instance                                    */
/*                                                                          */
/* This function is run every ipf tick to see if there are any tokens that  */
/* have been held for too long and need to be freed up.                     */
/* ------------------------------------------------------------------------ */
void ipf_expiretokens(ifs)
ipf_stack_t *ifs;
{
    ipftoken_t *it;

    WRITE_ENTER(&ifs->ifs_ipf_tokens);
    while ((it = ifs->ifs_ipftokenhead) != NULL) {
        if (it->ipt_die > ifs->ifs_fr_ticks)
            break;

        ipf_freetoken(it, ifs);
    }
    RWLOCK_EXIT(&ifs->ifs_ipf_tokens);
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_deltoken                                                */
/* Returns:     int - 0 = success, else error                               */
/* Parameters:  type(I) - the token type to match                           */
/*              uid(I)  - uid owning the token                              */
/*              ptr(I)  - context pointer for the token                     */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function looks for a a token in the current list that matches up    */
/* the fields (type, uid, ptr).  If none is found, ESRCH is returned, else  */
/* call ipf_freetoken() to remove it from the list.                         */
/* ------------------------------------------------------------------------ */
int ipf_deltoken(type, uid, ptr, ifs)
int type, uid;
void *ptr;
ipf_stack_t *ifs;
{
    ipftoken_t *it;
    int error = ESRCH;

    WRITE_ENTER(&ifs->ifs_ipf_tokens);
    for (it = ifs->ifs_ipftokenhead; it != NULL; it = it->ipt_next)
        if (ptr == it->ipt_ctx && type == it->ipt_type &&
            uid == it->ipt_uid) {
            ipf_freetoken(it, ifs);
            error = 0;
            break;
    }
    RWLOCK_EXIT(&ifs->ifs_ipf_tokens);

    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_unlinktoken                                             */
/* Returns:     None.                                                       */
/* Parameters:  token(I) - pointer to token structure                       */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function unlinks a token structure from the linked list of tokens   */
/* that it belongs to.  The head pointer never needs to be explicitly       */
/* adjusted, but the tail does due to the linked list implementation.       */
/* ------------------------------------------------------------------------ */
static void ipf_unlinktoken(token, ifs)
ipftoken_t *token;
ipf_stack_t *ifs;
{

    if (ifs->ifs_ipftokentail == &token->ipt_next)
        ifs->ifs_ipftokentail = token->ipt_pnext;

    *token->ipt_pnext = token->ipt_next;
    if (token->ipt_next != NULL)
        token->ipt_next->ipt_pnext = token->ipt_pnext;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_findtoken                                               */
/* Returns:     ipftoken_t * - NULL if no memory, else pointer to token     */
/* Parameters:  type(I) - the token type to match                           */
/*              uid(I) - uid owning the token                               */
/*              ptr(I) - context pointer for the token                      */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function looks for a live token in the list of current tokens that  */
/* matches the tuple (type, uid, ptr).  If one cannot be found then one is  */
/* allocated.  If one is found then it is moved to the top of the list of   */
/* currently active tokens.                                                 */
/*                                                                          */
/* NOTE: It is by design that this function returns holding a read lock on  */
/*       ipf_tokens.  Callers must make sure they release it!               */
/* ------------------------------------------------------------------------ */
ipftoken_t *ipf_findtoken(type, uid, ptr, ifs)
int type, uid;
void *ptr;
ipf_stack_t *ifs;
{
    ipftoken_t *it, *new;

    KMALLOC(new, ipftoken_t *);

    WRITE_ENTER(&ifs->ifs_ipf_tokens);
    for (it = ifs->ifs_ipftokenhead; it != NULL; it = it->ipt_next) {
        if (it->ipt_alive == 0)
            continue;
        if (ptr == it->ipt_ctx && type == it->ipt_type &&
            uid == it->ipt_uid)
            break;
    }

    if (it == NULL) {
        it = new;
        new = NULL;
        if (it == NULL)
            return NULL;
        it->ipt_data = NULL;
        it->ipt_ctx = ptr;
        it->ipt_uid = uid;
        it->ipt_type = type;
        it->ipt_next = NULL;
        it->ipt_alive = 1;
    } else {
        if (new != NULL) {
            KFREE(new);
            new = NULL;
        }

        ipf_unlinktoken(it, ifs);
    }
    it->ipt_pnext = ifs->ifs_ipftokentail;
    *ifs->ifs_ipftokentail = it;
    ifs->ifs_ipftokentail = &it->ipt_next;
    it->ipt_next = NULL;

    it->ipt_die = ifs->ifs_fr_ticks + 2;

    MUTEX_DOWNGRADE(&ifs->ifs_ipf_tokens);

    return it;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_freetoken                                               */
/* Returns:     None.                                                       */
/* Parameters:  token(I) - pointer to token structure                       */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function unlinks a token from the linked list and on the path to    */
/* free'ing the data, it calls the dereference function that is associated  */
/* with the type of data pointed to by the token as it is considered to     */
/* hold a reference to it.                                                  */
/* ------------------------------------------------------------------------ */
void ipf_freetoken(token, ifs)
ipftoken_t *token;
ipf_stack_t *ifs;
{
    void *data, **datap;

    ipf_unlinktoken(token, ifs);

    data = token->ipt_data;
    datap = &data;

    if ((data != NULL) && (data != (void *)-1)) {
        switch (token->ipt_type)
        {
        case IPFGENITER_IPF :
            (void)fr_derefrule((frentry_t **)datap, ifs);
            break;
        case IPFGENITER_IPNAT :
            WRITE_ENTER(&ifs->ifs_ipf_nat);
            fr_ipnatderef((ipnat_t **)datap, ifs);
            RWLOCK_EXIT(&ifs->ifs_ipf_nat);
            break;
        case IPFGENITER_NAT :
            fr_natderef((nat_t **)datap, ifs);
            break;
        case IPFGENITER_STATE :
            fr_statederef((ipstate_t **)datap, ifs);
            break;
        case IPFGENITER_FRAG :
            fr_fragderef((ipfr_t **)datap, &ifs->ifs_ipf_frag, ifs);
            break;
        case IPFGENITER_NATFRAG :
            fr_fragderef((ipfr_t **)datap,
                     &ifs->ifs_ipf_natfrag, ifs);
            break;
        case IPFGENITER_HOSTMAP :
            WRITE_ENTER(&ifs->ifs_ipf_nat);
            fr_hostmapdel((hostmap_t **)datap);
            RWLOCK_EXIT(&ifs->ifs_ipf_nat);
            break;
        default :
            (void) ip_lookup_iterderef(token->ipt_type, data, ifs);
            break;
        }
    }

    KFREE(token);
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_getnextrule                                             */
/* Returns:     int - 0 = success, else error                               */
/* Parameters:  t(I)   - pointer to destination information to resolve      */
/*              ptr(I) - pointer to ipfobj_t to copyin from user space      */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function's first job is to bring in the ipfruleiter_t structure via */
/* the ipfobj_t structure to determine what should be the next rule to      */
/* return. Once the ipfruleiter_t has been brought in, it then tries to     */
/* find the 'next rule'.  This may include searching rule group lists or    */
/* just be as simple as looking at the 'next' field in the rule structure.  */
/* When we have found the rule to return, increase its reference count and  */
/* if we used an existing rule to get here, decrease its reference count.   */
/* ------------------------------------------------------------------------ */
int ipf_getnextrule(t, ptr, ifs)
ipftoken_t *t;
void *ptr;
ipf_stack_t *ifs;
{
    frentry_t *fr, *next, zero;
    int error, out, count;
    ipfruleiter_t it;
    frgroup_t *fg;
    char *dst;

    if (t == NULL || ptr == NULL)
        return EFAULT;
    error = fr_inobj(ptr, &it, IPFOBJ_IPFITER);
    if (error != 0)
        return error;
    if ((it.iri_ver != AF_INET) && (it.iri_ver != AF_INET6))
        return EINVAL;
    if ((it.iri_inout < 0) || (it.iri_inout > 3))
        return EINVAL;
    if (it.iri_nrules == 0)
        return EINVAL;
    if ((it.iri_active != 0) && (it.iri_active != 1))
        return EINVAL;
    if (it.iri_rule == NULL)
        return EFAULT;

    /*
     * Use bitmask on it.iri_inout to determine direction.
     * F_OUT (1) and F_ACOUT (3) mask to out = 1, while
     * F_IN (0) and F_ACIN (2) mask to out = 0.
     */
    out = it.iri_inout & F_OUT;
    READ_ENTER(&ifs->ifs_ipf_mutex);

    /*
     * Retrieve "previous" entry from token and find the next entry.
     */
    fr = t->ipt_data;
    if (fr == NULL) {
        if (*it.iri_group == '\0') {
            /*
             * Use bitmask again to determine accounting or not.
             * F_ACIN will mask to accounting cases F_ACIN (2)
             * or F_ACOUT (3), but not F_IN or F_OUT.
             */
            if ((it.iri_inout & F_ACIN) != 0) {
                if (it.iri_ver == AF_INET)
                    next = ifs->ifs_ipacct
                        [out][it.iri_active];
                else
                    next = ifs->ifs_ipacct6
                        [out][it.iri_active];
            } else {
                if (it.iri_ver == AF_INET)
                    next = ifs->ifs_ipfilter
                        [out][it.iri_active];
                else
                    next = ifs->ifs_ipfilter6
                        [out][it.iri_active];
            }
        } else {
            fg = fr_findgroup(it.iri_group, IPL_LOGIPF,
                      it.iri_active, NULL, ifs);
            if (fg != NULL)
                next = fg->fg_start;
            else
                next = NULL;
        }
    } else {
        next = fr->fr_next;
    }

    dst = (char *)it.iri_rule;
    /*
     * The ipfruleiter may ask for more than 1 rule at a time to be
     * copied out, so long as that many exist in the list to start with!
     */
    for (count = it.iri_nrules; count > 0; count--) {
        /*
         * If we found an entry, add reference to it and update token.
         * Otherwise, zero out data to be returned and NULL out token.
         */
        if (next != NULL) {
            MUTEX_ENTER(&next->fr_lock);
            next->fr_ref++;
            MUTEX_EXIT(&next->fr_lock);
            t->ipt_data = next;
        } else {
            bzero(&zero, sizeof(zero));
            next = &zero;
            t->ipt_data = NULL;
        }

        /*
         * Now that we have ref, it's save to give up lock.
         */
        RWLOCK_EXIT(&ifs->ifs_ipf_mutex);

        /*
         * Copy out data and clean up references and token as needed.
         */
        error = COPYOUT(next, dst, sizeof(*next));
        if (error != 0)
            error = EFAULT;
        if (t->ipt_data == NULL) {
            ipf_freetoken(t, ifs);
            break;
        } else {
            if (fr != NULL)
                (void) fr_derefrule(&fr, ifs);
            if (next->fr_data != NULL) {
                dst += sizeof(*next);
                error = COPYOUT(next->fr_data, dst,
                        next->fr_dsize);
                if (error != 0)
                    error = EFAULT;
                else
                    dst += next->fr_dsize;
            }
            if (next->fr_next == NULL) {
                ipf_freetoken(t, ifs);
                break;
            }
        }

        if ((count == 1) || (error != 0))
            break;

        READ_ENTER(&ifs->ifs_ipf_mutex);
        fr = next;
        next = fr->fr_next;
    }

    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    fr_frruleiter                                               */
/* Returns:     int - 0 = success, else error                               */
/* Parameters:  data(I) - the token type to match                           */
/*              uid(I) - uid owning the token                               */
/*              ptr(I) - context pointer for the token                      */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function serves as a stepping stone between fr_ipf_ioctl and        */
/* ipf_getnextrule.  It's role is to find the right token in the kernel for */
/* the process doing the ioctl and use that to ask for the next rule.       */
/* ------------------------------------------------------------------------ */
int ipf_frruleiter(data, uid, ctx, ifs)
void *data, *ctx;
int uid;
ipf_stack_t *ifs;
{
    ipftoken_t *token;
    int error;

    token = ipf_findtoken(IPFGENITER_IPF, uid, ctx, ifs);
    if (token != NULL)
        error = ipf_getnextrule(token, data, ifs);
    else
        error = EFAULT;
    RWLOCK_EXIT(&ifs->ifs_ipf_tokens);

    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_geniter                                                 */
/* Returns:     int - 0 = success, else error                               */
/* Parameters:  token(I) - pointer to ipftoken structure                    */
/*              itp(I) - pointer to ipfgeniter structure                    */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* Generic iterator called from ipf_genericiter.  Currently only used for   */
/* walking through list of fragments.                                       */
/* ------------------------------------------------------------------------ */
int ipf_geniter(token, itp, ifs)
ipftoken_t *token;
ipfgeniter_t *itp;
ipf_stack_t *ifs;
{
    int error;

    switch (itp->igi_type)
    {
    case IPFGENITER_FRAG :
        error = fr_nextfrag(token, itp, &ifs->ifs_ipfr_list,
                    &ifs->ifs_ipfr_tail, &ifs->ifs_ipf_frag,
                    ifs);
        break;
    default :
        error = EINVAL;
        break;
    }

    return error;
}


/* ------------------------------------------------------------------------ */
/* Function:    ipf_genericiter                                             */
/* Returns:     int - 0 = success, else error                               */
/* Parameters:  data(I) - the token type to match                           */
/*              uid(I) - uid owning the token                               */
/*              ptr(I) - context pointer for the token                      */
/*              ifs - ipf stack instance                                    */
/*                                                                          */
/* This function serves as a stepping stone between fr_ipf_ioctl and        */
/* ipf_geniter when handling SIOCGENITER.  It's role is to find the right   */
/* token in the kernel for the process using the ioctl, and to use that     */
/* token when calling ipf_geniter.                                          */
/* ------------------------------------------------------------------------ */
int ipf_genericiter(data, uid, ctx, ifs)
void *data, *ctx;
int uid;
ipf_stack_t *ifs;
{
    ipftoken_t *token;
    ipfgeniter_t iter;
    int error;

    error = fr_inobj(data, &iter, IPFOBJ_GENITER);
    if (error != 0)
        return error;

    token = ipf_findtoken(iter.igi_type, uid, ctx, ifs);
    if (token != NULL) {
        token->ipt_subtype = iter.igi_type;
        error = ipf_geniter(token, &iter, ifs);
    } else
        error = EFAULT;
    RWLOCK_EXIT(&ifs->ifs_ipf_tokens);

    return error;
}


/* --------------------------------------------------------------------- */
/* Function:    ipf_earlydrop                                            */
/* Returns:     number of dropped/removed entries from the queue         */
/* Parameters:  flushtype - which table we're cleaning (NAT or State)    */
/*              ifq - pointer to queue with entries to be deleted    */
/*              idletime - entry must be idle this long to be deleted    */
/*              ifs     - ipf stack instance                             */
/*                                                                       */
/* Function is invoked from state/NAT flush routines to remove entries   */
/* from specified timeout queue, based on how long they've sat idle,     */
/* without waiting for it to happen on its own.                          */
/* --------------------------------------------------------------------- */
int ipf_earlydrop(flushtype, ifq, idletime, ifs)
int flushtype;
ipftq_t *ifq;
int idletime;
ipf_stack_t *ifs;
{
        ipftqent_t *tqe, *tqn;
        unsigned int dropped;
        int droptick;
    void *ent;

        if (ifq == NULL)
                return (0);

        dropped = 0;

        /*
         * Determine the tick representing the idle time we're interested
         * in.  If an entry exists in the queue, and it was touched before
         * that tick, then it's been idle longer than idletime, so it should
     * be deleted.
         */
        droptick = ifs->ifs_fr_ticks - idletime;
        tqn = ifq->ifq_head;
        while ((tqe = tqn) != NULL && tqe->tqe_touched < droptick) {
                tqn = tqe->tqe_next;
        ent = tqe->tqe_parent;
        switch (flushtype)
        {
        case NAT_FLUSH:
            if (nat_delete((nat_t *)ent, NL_FLUSH, ifs) == 0)
                dropped++;
            break;
        case STATE_FLUSH:
            if (fr_delstate((ipstate_t *)ent, ISL_FLUSH, ifs) == 0)
                dropped++;
            break;
        default:
            return (0);
        }
        }
        return (dropped);
}


/* --------------------------------------------------------------------- */
/* Function:    ipf_flushclosing                                         */
/* Returns:     int - number of entries deleted                          */
/* Parameters:  flushtype - which table we're cleaning (NAT or State)    */
/*              stateval - TCP state at which to start removing entries  */
/*              ipfqs - pointer to timeout queues                        */
/*              userqs - pointer to user defined queues                  */
/*              ifs  - ipf stack instance                                */
/*                                                                       */
/* Remove state/NAT table entries for TCP connections which are in the   */
/* process of closing, and have at least reached the state specified by  */
/* the 'stateval' parameter.                                             */
/* --------------------------------------------------------------------- */
int ipf_flushclosing(flushtype, stateval, ipfqs, userqs, ifs)
int flushtype, stateval;
ipftq_t *ipfqs, *userqs;
ipf_stack_t *ifs;
{
    ipftq_t *ifq, *ifqn;
        ipftqent_t *tqe, *tqn;
        int dropped;
    void *ent;
    nat_t *nat;
    ipstate_t *is;

        dropped = 0;

        /*
         * Start by deleting any entries in specific timeout queues.
         */
    ifqn = &ipfqs[stateval];
        while ((ifq = ifqn) != NULL) {
                ifqn = ifq->ifq_next;
                dropped += ipf_earlydrop(flushtype, ifq, (int)0, ifs);
        }

        /*
         * Next, look through user defined queues for closing entries.
         */
    ifqn = userqs;
        while ((ifq = ifqn) != NULL) {
                ifqn = ifq->ifq_next;
                tqn = ifq->ifq_head;
                while ((tqe = tqn) != NULL) {
                        tqn = tqe->tqe_next;
            ent = tqe->tqe_parent;
            switch (flushtype)
            {
            case NAT_FLUSH:
                nat = (nat_t *)ent;
                if ((nat->nat_p == IPPROTO_TCP) &&
                    (nat->nat_tcpstate[0] >= stateval) &&
                    (nat->nat_tcpstate[1] >= stateval) &&
                    (nat_delete(nat, NL_EXPIRE, ifs) == 0))
                    dropped++;
                break;
            case STATE_FLUSH:
                is = (ipstate_t *)ent;
                if ((is->is_p == IPPROTO_TCP) &&
                    (is->is_state[0] >= stateval) &&
                    (is->is_state[1] >= stateval) &&
                    (fr_delstate(is, ISL_EXPIRE, ifs) == 0))
                    dropped++;
                break;
            default:
                return (0);
            }
                }
        }
        return (dropped);
}


/* --------------------------------------------------------------------- */
/* Function:    ipf_extraflush                                           */
/* Returns:     int - number of entries flushed (0 = none)               */
/* Parameters:  flushtype - which table we're cleaning (NAT or State)    */
/*              ipfqs - pointer to 'established' timeout queue           */
/*              userqs - pointer to user defined queues                  */
/*              ifs  - ipf stack instance                                */
/*                                                                       */
/* This function gets called when either NAT or state tables fill up.    */
/* We need to try a bit harder to free up some space.  The function will */
/* flush entries for TCP connections which have been idle a long time.   */
/*                                                                       */
/* Currently, the idle time is checked using values from ideltime_tab[]  */
/* --------------------------------------------------------------------- */
int ipf_extraflush(flushtype, ipfqs, userqs, ifs)
int flushtype;
ipftq_t *ipfqs, *userqs;
ipf_stack_t *ifs;
{
    ipftq_t *ifq, *ifqn;
    int idletime, removed, idle_idx;

    removed = 0;

    /*
     * Determine initial threshold for minimum idle time based on
     * how long ipfilter has been running.  Ipfilter needs to have
     * been up as long as the smallest interval to continue on.
     *
     * Minimum idle times stored in idletime_tab and indexed by
     * idle_idx.  Start at upper end of array and work backwards.
     *
     * Once the index is found, set the initial idle time to the
     * first interval before the current ipfilter run time.
     */
    if (ifs->ifs_fr_ticks < idletime_tab[0])
        return (0);
    idle_idx = (sizeof (idletime_tab) / sizeof (int)) - 1;
    if (ifs->ifs_fr_ticks > idletime_tab[idle_idx]) {
        idletime = idletime_tab[idle_idx];
    } else {
        while ((idle_idx > 0) &&
            (ifs->ifs_fr_ticks < idletime_tab[idle_idx]))
            idle_idx--;

        idletime = (ifs->ifs_fr_ticks /
                idletime_tab[idle_idx]) *
                idletime_tab[idle_idx];
    }

    while (idle_idx >= 0) {
        /*
         * Check to see if we need to delete more entries.
         * If we do, start with appropriate timeout queue.
         */
        if (flushtype == NAT_FLUSH) {
            if (NAT_TAB_WATER_LEVEL(ifs) <=
                ifs->ifs_nat_flush_level_lo)
                break;
        } else if (flushtype == STATE_FLUSH) {
            if (ST_TAB_WATER_LEVEL(ifs) <=
                ifs->ifs_state_flush_level_lo)
                break;
        } else {
            break;
        }

        removed += ipf_earlydrop(flushtype, ipfqs, idletime, ifs);

        /*
         * Next, check the user defined queues.  But first, make
         * certain that timeout queue deletions didn't do enough.
         */
        if (flushtype == NAT_FLUSH) {
            if (NAT_TAB_WATER_LEVEL(ifs) <=
                ifs->ifs_nat_flush_level_lo)
                break;
        } else {
            if (ST_TAB_WATER_LEVEL(ifs) <=
                ifs->ifs_state_flush_level_lo)
                break;
        }
        ifqn = userqs;
        while ((ifq = ifqn) != NULL) {
            ifqn = ifq->ifq_next;
            removed += ipf_earlydrop(flushtype, ifq, idletime, ifs);
        }

        /*
         * Adjust the granularity of idle time.
         *
         * If we reach an interval boundary, we need to
         * either adjust the idle time accordingly or exit
         * the loop altogether (if this is very last check).
         */
        idletime -= idletime_tab[idle_idx];
        if (idletime < idletime_tab[idle_idx]) {
            if (idle_idx != 0) {
                idletime = idletime_tab[idle_idx] -
                idletime_tab[idle_idx - 1];
                idle_idx--;
            } else {
                break;
            }
        }
    }

    return (removed);
}