/* * Copyright (C) 1993-2001, 2003 by Darren Reed. * * See the IPFILTER.LICENCE file for details on licencing. * * Copyright 2007 Sun Microsystems, Inc. All rights reserved. * Use is subject to license terms. */ /* #pragma ident "@(#)solaris.c 1.12 6/5/96 (C) 1995 Darren Reed"*/ #pragma ident "@(#)$Id: solaris.c,v 2.73.2.6 2005/07/13 21:40:47 darrenr Exp $" #pragma ident "%Z%%M% %I% %E% SMI" #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #if SOLARIS2 >= 6 # include #endif #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include "netinet/ip_compat.h" #include "netinet/ipl.h" #include "netinet/ip_fil.h" #include "netinet/ip_nat.h" #include "netinet/ip_frag.h" #include "netinet/ip_auth.h" #include "netinet/ip_state.h" #include "netinet/ipf_stack.h" extern int iplwrite __P((dev_t, struct uio *, cred_t *)); static int ipf_getinfo __P((dev_info_t *, ddi_info_cmd_t, void *, void **)); #if SOLARIS2 < 10 static int ipf_identify __P((dev_info_t *)); #endif static int ipf_attach __P((dev_info_t *, ddi_attach_cmd_t)); static int ipf_detach __P((dev_info_t *, ddi_detach_cmd_t)); static int ipf_property_g_update __P((dev_info_t *)); static char *ipf_devfiles[] = { IPL_NAME, IPNAT_NAME, IPSTATE_NAME, IPAUTH_NAME, IPSYNC_NAME, IPSCAN_NAME, IPLOOKUP_NAME, NULL }; static struct cb_ops ipf_cb_ops = { iplopen, iplclose, nodev, /* strategy */ nodev, /* print */ nodev, /* dump */ iplread, iplwrite, /* write */ iplioctl, /* ioctl */ nodev, /* devmap */ nodev, /* mmap */ nodev, /* segmap */ nochpoll, /* poll */ ddi_prop_op, NULL, D_MTSAFE, #if SOLARIS2 > 4 CB_REV, nodev, /* aread */ nodev, /* awrite */ #endif }; static struct dev_ops ipf_ops = { DEVO_REV, 0, ipf_getinfo, #if SOLARIS2 >= 10 nulldev, #else ipf_identify, #endif nulldev, ipf_attach, ipf_detach, nodev, /* reset */ &ipf_cb_ops, (struct bus_ops *)0 }; extern struct mod_ops mod_driverops; static struct modldrv iplmod = { &mod_driverops, IPL_VERSION, &ipf_ops }; static struct modlinkage modlink1 = { MODREV_1, &iplmod, NULL }; #if SOLARIS2 >= 6 static size_t hdrsizes[57][2] = { { 0, 0 }, { IFT_OTHER, 0 }, { IFT_1822, 0 }, { IFT_HDH1822, 0 }, { IFT_X25DDN, 0 }, { IFT_X25, 0 }, { IFT_ETHER, 14 }, { IFT_ISO88023, 0 }, { IFT_ISO88024, 0 }, { IFT_ISO88025, 0 }, { IFT_ISO88026, 0 }, { IFT_STARLAN, 0 }, { IFT_P10, 0 }, { IFT_P80, 0 }, { IFT_HY, 0 }, { IFT_FDDI, 24 }, { IFT_LAPB, 0 }, { IFT_SDLC, 0 }, { IFT_T1, 0 }, { IFT_CEPT, 0 }, { IFT_ISDNBASIC, 0 }, { IFT_ISDNPRIMARY, 0 }, { IFT_PTPSERIAL, 0 }, { IFT_PPP, 0 }, { IFT_LOOP, 0 }, { IFT_EON, 0 }, { IFT_XETHER, 0 }, { IFT_NSIP, 0 }, { IFT_SLIP, 0 }, { IFT_ULTRA, 0 }, { IFT_DS3, 0 }, { IFT_SIP, 0 }, { IFT_FRELAY, 0 }, { IFT_RS232, 0 }, { IFT_PARA, 0 }, { IFT_ARCNET, 0 }, { IFT_ARCNETPLUS, 0 }, { IFT_ATM, 0 }, { IFT_MIOX25, 0 }, { IFT_SONET, 0 }, { IFT_X25PLE, 0 }, { IFT_ISO88022LLC, 0 }, { IFT_LOCALTALK, 0 }, { IFT_SMDSDXI, 0 }, { IFT_FRELAYDCE, 0 }, { IFT_V35, 0 }, { IFT_HSSI, 0 }, { IFT_HIPPI, 0 }, { IFT_MODEM, 0 }, { IFT_AAL5, 0 }, { IFT_SONETPATH, 0 }, { IFT_SONETVT, 0 }, { IFT_SMDSICIP, 0 }, { IFT_PROPVIRTUAL, 0 }, { IFT_PROPMUX, 0 }, }; #endif /* SOLARIS2 >= 6 */ dev_info_t *ipf_dev_info = NULL; static const filter_kstats_t ipf_kstat_tmp = { { "pass", KSTAT_DATA_ULONG }, { "block", KSTAT_DATA_ULONG }, { "nomatch", KSTAT_DATA_ULONG }, { "short", KSTAT_DATA_ULONG }, { "pass, logged", KSTAT_DATA_ULONG }, { "block, logged", KSTAT_DATA_ULONG }, { "nomatch, logged", KSTAT_DATA_ULONG }, { "logged", KSTAT_DATA_ULONG }, { "skip", KSTAT_DATA_ULONG }, { "return sent", KSTAT_DATA_ULONG }, { "acct", KSTAT_DATA_ULONG }, { "bad frag state alloc", KSTAT_DATA_ULONG }, { "new frag state kept", KSTAT_DATA_ULONG }, { "new frag state compl. pkt", KSTAT_DATA_ULONG }, { "bad pkt state alloc", KSTAT_DATA_ULONG }, { "new pkt kept state", KSTAT_DATA_ULONG }, { "cachehit", KSTAT_DATA_ULONG }, { "tcp cksum bad", KSTAT_DATA_ULONG }, {{ "pullup ok", KSTAT_DATA_ULONG }, { "pullup nok", KSTAT_DATA_ULONG }}, { "src != route", KSTAT_DATA_ULONG }, { "ttl invalid", KSTAT_DATA_ULONG }, { "bad ip pkt", KSTAT_DATA_ULONG }, { "ipv6 pkt", KSTAT_DATA_ULONG }, { "dropped:pps ceiling", KSTAT_DATA_ULONG }, { "ip upd. fail", KSTAT_DATA_ULONG } }; static int ipf_kstat_update(kstat_t *ksp, int rwflag); static void ipf_kstat_init(ipf_stack_t *ifs, netstackid_t stackid) { int i; for (i = 0; i < 2; i++) { ifs->ifs_kstatp[i] = kstat_create_netstack("ipf", 0, (i==0)?"inbound":"outbound", "net", KSTAT_TYPE_NAMED, sizeof (filter_kstats_t) / sizeof (kstat_named_t), 0, stackid); if (ifs->ifs_kstatp[i] != NULL) { bcopy(&ipf_kstat_tmp, ifs->ifs_kstatp[i]->ks_data, sizeof (filter_kstats_t)); ifs->ifs_kstatp[i]->ks_update = ipf_kstat_update; ifs->ifs_kstatp[i]->ks_private = &ifs->ifs_frstats[i]; kstat_install(ifs->ifs_kstatp[i]); } } #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: ipf_kstat_init() installed 0x%x, 0x%x", ifs->ifs_kstatp[0], ifs->ifs_kstatp[1]); #endif } static void ipf_kstat_fini(ipf_stack_t *ifs, netstackid_t stackid) { int i; for (i = 0; i < 2; i++) { if (ifs->ifs_kstatp[i] != NULL) { kstat_delete_netstack(ifs->ifs_kstatp[i], stackid); ifs->ifs_kstatp[i] = NULL; } } } static int ipf_kstat_update(kstat_t *ksp, int rwflag) { filter_kstats_t *fkp; filterstats_t *fsp; if (ksp == NULL || ksp->ks_data == NULL) return (EIO); if (rwflag == KSTAT_WRITE) return (EACCES); fkp = ksp->ks_data; fsp = ksp->ks_private; fkp->fks_pass.value.ul = fsp->fr_pass; fkp->fks_block.value.ul = fsp->fr_block; fkp->fks_nom.value.ul = fsp->fr_nom; fkp->fks_short.value.ul = fsp->fr_short; fkp->fks_ppkl.value.ul = fsp->fr_ppkl; fkp->fks_bpkl.value.ul = fsp->fr_bpkl; fkp->fks_npkl.value.ul = fsp->fr_npkl; fkp->fks_pkl.value.ul = fsp->fr_pkl; fkp->fks_skip.value.ul = fsp->fr_skip; fkp->fks_ret.value.ul = fsp->fr_ret; fkp->fks_acct.value.ul = fsp->fr_acct; fkp->fks_bnfr.value.ul = fsp->fr_bnfr; fkp->fks_nfr.value.ul = fsp->fr_nfr; fkp->fks_cfr.value.ul = fsp->fr_cfr; fkp->fks_bads.value.ul = fsp->fr_bads; fkp->fks_ads.value.ul = fsp->fr_ads; fkp->fks_chit.value.ul = fsp->fr_chit; fkp->fks_tcpbad.value.ul = fsp->fr_tcpbad; fkp->fks_pull[0].value.ul = fsp->fr_pull[0]; fkp->fks_pull[1].value.ul = fsp->fr_pull[1]; fkp->fks_badsrc.value.ul = fsp->fr_badsrc; fkp->fks_badttl.value.ul = fsp->fr_badttl; fkp->fks_bad.value.ul = fsp->fr_bad; fkp->fks_ipv6.value.ul = fsp->fr_ipv6; fkp->fks_ppshit.value.ul = fsp->fr_ppshit; fkp->fks_ipud.value.ul = fsp->fr_ipud; return (0); } int _init() { int ipfinst; ipfinst = mod_install(&modlink1); #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: _init() = %d", ipfinst); #endif return ipfinst; } int _fini(void) { int ipfinst; ipfinst = mod_remove(&modlink1); #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: _fini() = %d", ipfinst); #endif return ipfinst; } int _info(modinfop) struct modinfo *modinfop; { int ipfinst; ipfinst = mod_info(&modlink1, modinfop); #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: _info(%x) = %x", modinfop, ipfinst); #endif return ipfinst; } #if SOLARIS2 < 10 static int ipf_identify(dip) dev_info_t *dip; { # ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: ipf_identify(%x)", dip); # endif if (strcmp(ddi_get_name(dip), "ipf") == 0) return (DDI_IDENTIFIED); return (DDI_NOT_IDENTIFIED); } #endif /* * Initialize things for IPF for each stack instance */ static void * ipf_stack_init(netstackid_t stackid, netstack_t *ns) { ipf_stack_t *ifs; #ifdef NS_DEBUG (void) printf("ipf_stack_init(%d)\n", stackid); #endif KMALLOCS(ifs, ipf_stack_t *, sizeof (*ifs)); bzero(ifs, sizeof (*ifs)); ifs->ifs_netstack = ns; ifs->ifs_hook4_physical_in = B_FALSE; ifs->ifs_hook4_physical_out = B_FALSE; ifs->ifs_hook4_nic_events = B_FALSE; ifs->ifs_hook4_loopback_in = B_FALSE; ifs->ifs_hook4_loopback_out = B_FALSE; ifs->ifs_hook6_physical_in = B_FALSE; ifs->ifs_hook6_physical_out = B_FALSE; ifs->ifs_hook6_nic_events = B_FALSE; ifs->ifs_hook6_loopback_in = B_FALSE; ifs->ifs_hook6_loopback_out = B_FALSE; /* * Initialize mutex's */ RWLOCK_INIT(&ifs->ifs_ipf_global, "ipf filter load/unload mutex"); RWLOCK_INIT(&ifs->ifs_ipf_mutex, "ipf filter rwlock"); #ifdef KERNEL ipf_kstat_init(ifs, stackid); #endif /* * Lock people out while we set things up. */ WRITE_ENTER(&ifs->ifs_ipf_global); ipftuneable_alloc(ifs); RWLOCK_EXIT(&ifs->ifs_ipf_global); /* Limit to global stack */ if (stackid == GLOBAL_NETSTACKID) cmn_err(CE_CONT, "!%s, running.\n", ipfilter_version); return (ifs); } static int ipf_detach_check_zone(ipf_stack_t *ifs) { /* * Make sure we're the only one's modifying things. With * this lock others should just fall out of the loop. */ READ_ENTER(&ifs->ifs_ipf_global); if (ifs->ifs_fr_running == 1) { RWLOCK_EXIT(&ifs->ifs_ipf_global); return (-1); } /* * Make sure there is no active filter rule. */ if (ifs->ifs_ipfilter[0][ifs->ifs_fr_active] || ifs->ifs_ipfilter[1][ifs->ifs_fr_active] || ifs->ifs_ipfilter6[0][ifs->ifs_fr_active] || ifs->ifs_ipfilter6[1][ifs->ifs_fr_active]) { RWLOCK_EXIT(&ifs->ifs_ipf_global); return (-1); } RWLOCK_EXIT(&ifs->ifs_ipf_global); return (0); } static int ipf_detach_check_all() { netstack_handle_t nh; netstack_t *ns; int ret; netstack_next_init(&nh); while ((ns = netstack_next(&nh)) != NULL) { ret = ipf_detach_check_zone(ns->netstack_ipf); netstack_rele(ns); if (ret != 0) { netstack_next_fini(&nh); return (-1); } } netstack_next_fini(&nh); return (0); } /* * Destroy things for ipf for one stack. */ /* ARGSUSED */ static void ipf_stack_fini(netstackid_t stackid, void *arg) { ipf_stack_t *ifs = (ipf_stack_t *)arg; #ifdef NS_DEBUG (void) printf("ipf_stack_destroy(%p, stackid %d)\n", (void *)ifs, stackid); #endif /* * Make sure we're the only one's modifying things. With * this lock others should just fall out of the loop. */ WRITE_ENTER(&ifs->ifs_ipf_global); if (ifs->ifs_fr_running == -2) { RWLOCK_EXIT(&ifs->ifs_ipf_global); return; } ifs->ifs_fr_running = -2; RWLOCK_EXIT(&ifs->ifs_ipf_global); #ifdef KERNEL ipf_kstat_fini(ifs, stackid); #endif if (ifs->ifs_fr_timer_id != 0) { (void) untimeout(ifs->ifs_fr_timer_id); ifs->ifs_fr_timer_id = 0; } WRITE_ENTER(&ifs->ifs_ipf_global); if (ipldetach(ifs) != 0) { printf("ipf_stack_fini: ipldetach failed\n"); } ipftuneable_free(ifs); RWLOCK_EXIT(&ifs->ifs_ipf_global); RW_DESTROY(&ifs->ifs_ipf_mutex); RW_DESTROY(&ifs->ifs_ipf_global); KFREE(ifs); } static int ipf_attach(dip, cmd) dev_info_t *dip; ddi_attach_cmd_t cmd; { char *s; int i; int instance; #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: ipf_attach(%x,%x)", dip, cmd); #endif switch (cmd) { case DDI_ATTACH: instance = ddi_get_instance(dip); /* Only one instance of ipf (instance 0) can be attached. */ if (instance > 0) return DDI_FAILURE; #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: attach ipf instance %d", instance); #endif (void) ipf_property_g_update(dip); for (i = 0; ((s = ipf_devfiles[i]) != NULL); i++) { s = strrchr(s, '/'); if (s == NULL) continue; s++; if (ddi_create_minor_node(dip, s, S_IFCHR, i, DDI_PSEUDO, 0) == DDI_FAILURE) { ddi_remove_minor_node(dip, NULL); goto attach_failed; } } ipf_dev_info = dip; netstack_register(NS_IPF, ipf_stack_init, NULL, ipf_stack_fini); return DDI_SUCCESS; /* NOTREACHED */ default: break; } attach_failed: ddi_prop_remove_all(dip); return DDI_FAILURE; } static int ipf_detach(dip, cmd) dev_info_t *dip; ddi_detach_cmd_t cmd; { int i; #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: ipf_detach(%x,%x)", dip, cmd); #endif switch (cmd) { case DDI_DETACH: if (ipf_detach_check_all() != 0) return DDI_FAILURE; /* Undo what we did in ipf_attach, freeing resources * and removing things we installed. The system * framework guarantees we are not active with this devinfo * node in any other entry points at this time. */ ddi_prop_remove_all(dip); i = ddi_get_instance(dip); ddi_remove_minor_node(dip, NULL); if (i > 0) { cmn_err(CE_CONT, "IP Filter: still attached (%d)\n", i); return DDI_FAILURE; } netstack_unregister(NS_IPF); return DDI_SUCCESS; /* NOTREACHED */ default: break; } cmn_err(CE_NOTE, "IP Filter: failed to detach\n"); return DDI_FAILURE; } /*ARGSUSED*/ static int ipf_getinfo(dip, infocmd, arg, result) dev_info_t *dip; ddi_info_cmd_t infocmd; void *arg, **result; { int error; error = DDI_FAILURE; #ifdef IPFDEBUG cmn_err(CE_NOTE, "IP Filter: ipf_getinfo(%x,%x,%x)", dip, infocmd, arg); #endif switch (infocmd) { case DDI_INFO_DEVT2DEVINFO: *result = ipf_dev_info; error = DDI_SUCCESS; break; case DDI_INFO_DEVT2INSTANCE: *result = (void *)0; error = DDI_SUCCESS; break; default: break; } return (error); } /* * Fetch configuration file values that have been entered into the ipf.conf * driver file. */ static int ipf_property_g_update(dip) dev_info_t *dip; { #ifdef DDI_NO_AUTODETACH if (ddi_prop_update_int(DDI_DEV_T_NONE, dip, DDI_NO_AUTODETACH, 1) != DDI_PROP_SUCCESS) { cmn_err(CE_WARN, "!updating DDI_NO_AUTODETACH failed"); return DDI_FAILURE; } #else if (ddi_prop_update_int(DDI_DEV_T_NONE, dip, "ddi-no-autodetach", 1) != DDI_PROP_SUCCESS) { cmn_err(CE_WARN, "!updating ddi-no-autodetach failed"); return DDI_FAILURE; } #endif return DDI_SUCCESS; } int ipf_property_update(dip, ifs) dev_info_t *dip; ipf_stack_t *ifs; { ipftuneable_t *ipft; int64_t *i64p; char *name; u_int one; int *i32p; int err; for (ipft = ifs->ifs_ipf_tuneables; (name = ipft->ipft_name) != NULL; ipft++) { one = 1; switch (ipft->ipft_sz) { case 4 : i32p = NULL; err = ddi_prop_lookup_int_array(DDI_DEV_T_ANY, dip, 0, name, &i32p, &one); if (err == DDI_PROP_NOT_FOUND) continue; #ifdef IPFDEBUG cmn_err(CE_CONT, "IP Filter: lookup_int(%s) = %d\n", name, err); #endif if (err != DDI_PROP_SUCCESS) return err; if (*i32p >= ipft->ipft_min && *i32p <= ipft->ipft_max) *ipft->ipft_pint = *i32p; else err = DDI_PROP_CANNOT_DECODE; ddi_prop_free(i32p); break; #if SOLARIS2 > 8 case 8 : i64p = NULL; err = ddi_prop_lookup_int64_array(DDI_DEV_T_ANY, dip, 0, name, &i64p, &one); if (err == DDI_PROP_NOT_FOUND) continue; # ifdef IPFDEBUG cmn_err(CE_CONT, "IP Filter: lookup_int64(%s) = %d\n", name, err); # endif if (err != DDI_PROP_SUCCESS) return err; if (*i64p >= ipft->ipft_min && *i64p <= ipft->ipft_max) *ipft->ipft_pint = *i64p; else err = DDI_PROP_CANNOT_DECODE; ddi_prop_free(i64p); break; #endif default : break; } if (err != DDI_SUCCESS) break; } return err; }