17c478bd9Sstevel@tonic-gate /*
27c478bd9Sstevel@tonic-gate * CDDL HEADER START
37c478bd9Sstevel@tonic-gate *
47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the
57c478bd9Sstevel@tonic-gate * Common Development and Distribution License, Version 1.0 only
67c478bd9Sstevel@tonic-gate * (the "License"). You may not use this file except in compliance
77c478bd9Sstevel@tonic-gate * with the License.
87c478bd9Sstevel@tonic-gate *
97c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
107c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing.
117c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions
127c478bd9Sstevel@tonic-gate * and limitations under the License.
137c478bd9Sstevel@tonic-gate *
147c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each
157c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
167c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the
177c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying
187c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner]
197c478bd9Sstevel@tonic-gate *
207c478bd9Sstevel@tonic-gate * CDDL HEADER END
217c478bd9Sstevel@tonic-gate */
227c478bd9Sstevel@tonic-gate /*
231d8c4025Svi117747 * Copyright 2005 Sun Microsystems, Inc. All rights reserved.
247c478bd9Sstevel@tonic-gate * Use is subject to license terms.
257c478bd9Sstevel@tonic-gate */
267c478bd9Sstevel@tonic-gate
277c478bd9Sstevel@tonic-gate #include <sys/types.h>
287c478bd9Sstevel@tonic-gate #include <sys/atomic.h>
291d8c4025Svi117747 #include <sys/pattr.h>
307c478bd9Sstevel@tonic-gate #include <netinet/in.h>
317c478bd9Sstevel@tonic-gate #include <netinet/ip6.h>
327c478bd9Sstevel@tonic-gate #include <inet/common.h>
337c478bd9Sstevel@tonic-gate #include <inet/ip.h>
347c478bd9Sstevel@tonic-gate #include <inet/ip6.h>
357c478bd9Sstevel@tonic-gate #include <ipp/dscpmk/dscpmk_impl.h>
367c478bd9Sstevel@tonic-gate
377c478bd9Sstevel@tonic-gate /* Module to mark the ToS/DS field for a given packet */
387c478bd9Sstevel@tonic-gate
/*
 * Debug verbosity for this module; starts out at zero.
 * NOTE(review): presumably read by the dscpmk0dbg()/dscpmk2dbg() macros
 * used in dscpmk_process() -- confirm in dscpmk_impl.h.
 */
int dscpmk_debug = 0;
417c478bd9Sstevel@tonic-gate
427c478bd9Sstevel@tonic-gate /*
437c478bd9Sstevel@tonic-gate * Given a packet, this routine marks the ToS or DSCP for IPv4 and IPv6 resp.
447c478bd9Sstevel@tonic-gate * using the configured dscp_map.
457c478bd9Sstevel@tonic-gate * Note that this module does not change the ECN bits.
467c478bd9Sstevel@tonic-gate */
477c478bd9Sstevel@tonic-gate int
dscpmk_process(mblk_t ** mpp,dscpmk_data_t * dscpmk_data,ip_proc_t proc)487c478bd9Sstevel@tonic-gate dscpmk_process(mblk_t **mpp, dscpmk_data_t *dscpmk_data, ip_proc_t proc)
497c478bd9Sstevel@tonic-gate {
507c478bd9Sstevel@tonic-gate ipha_t *ipha;
517c478bd9Sstevel@tonic-gate ip6_t *ip6_hdr;
527c478bd9Sstevel@tonic-gate boolean_t is_v4;
537c478bd9Sstevel@tonic-gate uint8_t dscp, new_dscp;
547c478bd9Sstevel@tonic-gate mblk_t *mp;
557c478bd9Sstevel@tonic-gate
567c478bd9Sstevel@tonic-gate ASSERT((mpp != NULL) && (*mpp != NULL));
577c478bd9Sstevel@tonic-gate mp = *mpp;
587c478bd9Sstevel@tonic-gate
597c478bd9Sstevel@tonic-gate /*
607c478bd9Sstevel@tonic-gate * The action module will receive an M_DATA or an M_CTL followed
617c478bd9Sstevel@tonic-gate * by an M_DATA. In the latter case skip the M_CTL.
627c478bd9Sstevel@tonic-gate */
637c478bd9Sstevel@tonic-gate if (mp->b_datap->db_type != M_DATA) {
647c478bd9Sstevel@tonic-gate if ((mp->b_cont != NULL) &&
657c478bd9Sstevel@tonic-gate (mp->b_cont->b_datap->db_type == M_DATA)) {
667c478bd9Sstevel@tonic-gate mp = mp->b_cont;
677c478bd9Sstevel@tonic-gate } else {
687c478bd9Sstevel@tonic-gate dscpmk0dbg(("dscpmk_process: no data\n"));
69*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->epackets);
707c478bd9Sstevel@tonic-gate return (EINVAL);
717c478bd9Sstevel@tonic-gate }
727c478bd9Sstevel@tonic-gate }
737c478bd9Sstevel@tonic-gate
747c478bd9Sstevel@tonic-gate /* Pull-up needed? */
757c478bd9Sstevel@tonic-gate if ((mp->b_wptr - mp->b_rptr) < IP_SIMPLE_HDR_LENGTH) {
767c478bd9Sstevel@tonic-gate if (!pullupmsg(mp, IP_SIMPLE_HDR_LENGTH)) {
777c478bd9Sstevel@tonic-gate dscpmk0dbg(("dscpmk_process: pullup failed\n"));
78*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->epackets);
797c478bd9Sstevel@tonic-gate return (EINVAL);
807c478bd9Sstevel@tonic-gate }
817c478bd9Sstevel@tonic-gate }
827c478bd9Sstevel@tonic-gate ipha = (ipha_t *)mp->b_rptr;
837c478bd9Sstevel@tonic-gate
847c478bd9Sstevel@tonic-gate /* Update global stats */
85*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->npackets);
867c478bd9Sstevel@tonic-gate
877c478bd9Sstevel@tonic-gate /*
887c478bd9Sstevel@tonic-gate * This should only be called for outgoing packets. For inbound packets
897c478bd9Sstevel@tonic-gate * proceed with the next action.
907c478bd9Sstevel@tonic-gate */
917c478bd9Sstevel@tonic-gate if ((proc == IPP_LOCAL_IN) || (proc == IPP_FWD_IN)) {
927c478bd9Sstevel@tonic-gate dscpmk2dbg(("dscpmk_process: cannot mark incoming packets\n"));
93*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->ipackets);
947c478bd9Sstevel@tonic-gate return (0);
957c478bd9Sstevel@tonic-gate }
967c478bd9Sstevel@tonic-gate
977c478bd9Sstevel@tonic-gate /* Figure out the ToS or the Traffic Class from the message */
987c478bd9Sstevel@tonic-gate if (IPH_HDR_VERSION(ipha) == IPV4_VERSION) {
997c478bd9Sstevel@tonic-gate dscp = ipha->ipha_type_of_service;
1007c478bd9Sstevel@tonic-gate is_v4 = B_TRUE;
1017c478bd9Sstevel@tonic-gate } else {
1027c478bd9Sstevel@tonic-gate ip6_hdr = (ip6_t *)mp->b_rptr;
1037c478bd9Sstevel@tonic-gate dscp = __IPV6_TCLASS_FROM_FLOW(ip6_hdr->ip6_vcf);
1047c478bd9Sstevel@tonic-gate is_v4 = B_FALSE;
1057c478bd9Sstevel@tonic-gate }
1067c478bd9Sstevel@tonic-gate
1077c478bd9Sstevel@tonic-gate /*
1087c478bd9Sstevel@tonic-gate * Select the new dscp from the dscp_map after ignoring the
1097c478bd9Sstevel@tonic-gate * ECN/CU from dscp (hence dscp >> 2). new_dscp will be the
1107c478bd9Sstevel@tonic-gate * 6-bit DSCP value.
1117c478bd9Sstevel@tonic-gate */
1127c478bd9Sstevel@tonic-gate new_dscp = dscpmk_data->dscp_map[dscp >> 2];
1137c478bd9Sstevel@tonic-gate
1147c478bd9Sstevel@tonic-gate /* Update stats for this new_dscp */
115*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->dscp_stats[new_dscp].npackets);
1167c478bd9Sstevel@tonic-gate
1177c478bd9Sstevel@tonic-gate /*
1187c478bd9Sstevel@tonic-gate * if new_dscp is same as the original, update stats and
1197c478bd9Sstevel@tonic-gate * return.
1207c478bd9Sstevel@tonic-gate */
1217c478bd9Sstevel@tonic-gate if (new_dscp == (dscp >> 2)) {
122*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->unchanged);
1237c478bd9Sstevel@tonic-gate return (0);
1247c478bd9Sstevel@tonic-gate }
1257c478bd9Sstevel@tonic-gate
1267c478bd9Sstevel@tonic-gate /* Get back the ECN/CU value from the original dscp */
1277c478bd9Sstevel@tonic-gate new_dscp = (new_dscp << 2) | (dscp & 0x3);
1287c478bd9Sstevel@tonic-gate
129*1a5e258fSJosef 'Jeff' Sipek atomic_inc_64(&dscpmk_data->changed);
1307c478bd9Sstevel@tonic-gate /*
1317c478bd9Sstevel@tonic-gate * IPv4 : ToS structure -- RFC 791
1327c478bd9Sstevel@tonic-gate *
1337c478bd9Sstevel@tonic-gate * 0 1 2 3 4 5 6 7
1347c478bd9Sstevel@tonic-gate * +---+---+---+---+---+---+---+---+
1357c478bd9Sstevel@tonic-gate * | IP Precd | D | T | R | 0 | 0 |
1367c478bd9Sstevel@tonic-gate * | | | | | | |
1377c478bd9Sstevel@tonic-gate * +---+---+---+---+---+---+---+---+
1387c478bd9Sstevel@tonic-gate *
1397c478bd9Sstevel@tonic-gate * For Backward Compatability the diff serv DSCP will be mapped
1407c478bd9Sstevel@tonic-gate * to the 3-bits Precedence field. DTR is not supported. Thus,
1417c478bd9Sstevel@tonic-gate * the following Class Seletor CodePoints are reserved from this
1427c478bd9Sstevel@tonic-gate * purpose : xxx000; where x is 0 or 1 (note the last 2 bits are
1437c478bd9Sstevel@tonic-gate * 00) -- see RFC 2474.
1447c478bd9Sstevel@tonic-gate */
1457c478bd9Sstevel@tonic-gate
1467c478bd9Sstevel@tonic-gate if (is_v4) {
1477c478bd9Sstevel@tonic-gate ipha->ipha_type_of_service = new_dscp;
1481d8c4025Svi117747 /*
1491d8c4025Svi117747 * If the hardware supports checksumming, we don't need
1501d8c4025Svi117747 * to do anything.
1511d8c4025Svi117747 */
1521d8c4025Svi117747 if (!(mp->b_datap->db_struioun.cksum.flags &
1531d8c4025Svi117747 HCK_IPV4_HDRCKSUM)) {
1547c478bd9Sstevel@tonic-gate ipha->ipha_hdr_checksum = 0;
1557c478bd9Sstevel@tonic-gate ipha->ipha_hdr_checksum = ip_csum_hdr(ipha);
1567c478bd9Sstevel@tonic-gate }
1571d8c4025Svi117747 } else {
1587c478bd9Sstevel@tonic-gate
1597c478bd9Sstevel@tonic-gate /*
1607c478bd9Sstevel@tonic-gate * IPv6 : DSCP field structure is as given -- RFC 2474
1617c478bd9Sstevel@tonic-gate *
1627c478bd9Sstevel@tonic-gate * 0 1 2 3 4 5 6 7
1637c478bd9Sstevel@tonic-gate * +---+---+---+---+---+---+---+---+
1647c478bd9Sstevel@tonic-gate * | DSCP | CU |
1657c478bd9Sstevel@tonic-gate * | | |
1667c478bd9Sstevel@tonic-gate * +---+---+---+---+---+---+---+---+
1677c478bd9Sstevel@tonic-gate *
1687c478bd9Sstevel@tonic-gate * CU -- Currently Unused
1691d8c4025Svi117747 *
1707c478bd9Sstevel@tonic-gate * the 32 bit vcf consists of version (4 bits), Traffic class (8 bits)
1717c478bd9Sstevel@tonic-gate * and flow id (20 bits). Need to take care of Big/Little-Endianess.
1727c478bd9Sstevel@tonic-gate */
1737c478bd9Sstevel@tonic-gate #ifdef _BIG_ENDIAN
1747c478bd9Sstevel@tonic-gate ip6_hdr->ip6_vcf = (ip6_hdr->ip6_vcf & TCLASS_MASK) |
1757c478bd9Sstevel@tonic-gate (new_dscp << 20);
1767c478bd9Sstevel@tonic-gate #else
1777c478bd9Sstevel@tonic-gate ip6_hdr->ip6_vcf = (ip6_hdr->ip6_vcf & TCLASS_MASK) |
1787c478bd9Sstevel@tonic-gate ((new_dscp >> 4) | ((new_dscp << 12) & 0xF000));
1797c478bd9Sstevel@tonic-gate #endif
1807c478bd9Sstevel@tonic-gate }
1817c478bd9Sstevel@tonic-gate
1827c478bd9Sstevel@tonic-gate return (0);
1837c478bd9Sstevel@tonic-gate }
184