xref: /freebsd/sys/kern/uipc_mbuf.c (revision 94985f742b83ff093b4f3ce39b5d7749872807b5)
19454b2d8SWarner Losh /*-
2df8bae1dSRodney W. Grimes  * Copyright (c) 1982, 1986, 1988, 1991, 1993
3df8bae1dSRodney W. Grimes  *	The Regents of the University of California.  All rights reserved.
4df8bae1dSRodney W. Grimes  *
5df8bae1dSRodney W. Grimes  * Redistribution and use in source and binary forms, with or without
6df8bae1dSRodney W. Grimes  * modification, are permitted provided that the following conditions
7df8bae1dSRodney W. Grimes  * are met:
8df8bae1dSRodney W. Grimes  * 1. Redistributions of source code must retain the above copyright
9df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer.
10df8bae1dSRodney W. Grimes  * 2. Redistributions in binary form must reproduce the above copyright
11df8bae1dSRodney W. Grimes  *    notice, this list of conditions and the following disclaimer in the
12df8bae1dSRodney W. Grimes  *    documentation and/or other materials provided with the distribution.
13df8bae1dSRodney W. Grimes  * 4. Neither the name of the University nor the names of its contributors
14df8bae1dSRodney W. Grimes  *    may be used to endorse or promote products derived from this software
15df8bae1dSRodney W. Grimes  *    without specific prior written permission.
16df8bae1dSRodney W. Grimes  *
17df8bae1dSRodney W. Grimes  * THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS ``AS IS'' AND
18df8bae1dSRodney W. Grimes  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
19df8bae1dSRodney W. Grimes  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
20df8bae1dSRodney W. Grimes  * ARE DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE
21df8bae1dSRodney W. Grimes  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
22df8bae1dSRodney W. Grimes  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
23df8bae1dSRodney W. Grimes  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
24df8bae1dSRodney W. Grimes  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
25df8bae1dSRodney W. Grimes  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
26df8bae1dSRodney W. Grimes  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
27df8bae1dSRodney W. Grimes  * SUCH DAMAGE.
28df8bae1dSRodney W. Grimes  *
29df8bae1dSRodney W. Grimes  *	@(#)uipc_mbuf.c	8.2 (Berkeley) 1/4/94
30df8bae1dSRodney W. Grimes  */
31df8bae1dSRodney W. Grimes 
32677b542eSDavid E. O'Brien #include <sys/cdefs.h>
33677b542eSDavid E. O'Brien __FBSDID("$FreeBSD$");
34677b542eSDavid E. O'Brien 
35240ef842SDavid E. O'Brien #include "opt_param.h"
36352d050eSMike Silbersack #include "opt_mbuf_stress_test.h"
376eeac1d9SJulian Elischer #include "opt_mbuf_profiling.h"
38e32a5b94SRobert Watson 
39df8bae1dSRodney W. Grimes #include <sys/param.h>
40df8bae1dSRodney W. Grimes #include <sys/systm.h>
41fb919e4dSMark Murray #include <sys/kernel.h>
42beb699c7SMike Silbersack #include <sys/limits.h>
43fb919e4dSMark Murray #include <sys/lock.h>
44f9d0d524SRobert Watson #include <sys/malloc.h>
45df8bae1dSRodney W. Grimes #include <sys/mbuf.h>
46639acc13SGarrett Wollman #include <sys/sysctl.h>
47df8bae1dSRodney W. Grimes #include <sys/domain.h>
48df8bae1dSRodney W. Grimes #include <sys/protosw.h>
49beb699c7SMike Silbersack #include <sys/uio.h>
50fb919e4dSMark Murray 
/*
 * Header-size limits.  Each one is published read-only under kern.ipc by
 * the sysctl declarations that follow in this file.
 */
int	max_linkhdr;		/* size of largest link layer header */
int	max_protohdr;		/* size of largest protocol layer header */
int	max_hdr;		/* size of largest link plus protocol header */
int	max_datalen;		/* minimum space left in mbuf after max_hdr */
#ifdef MBUF_STRESS_TEST
/*
 * Counters that exist only in MBUF_STRESS_TEST kernels.
 * NOTE(review): presumably maintained by m_defrag(), which is outside this
 * part of the file -- confirm there before relying on their meaning.
 */
int	m_defragpackets;
int	m_defragbytes;
int	m_defraguseless;
int	m_defragfailure;
int	m_defragrandomfailures;
#endif
627d032714SBosko Milekic 
637d032714SBosko Milekic /*
647d032714SBosko Milekic  * sysctl(8) exported objects
657d032714SBosko Milekic  */
6680444f88SAndre Oppermann SYSCTL_INT(_kern_ipc, KIPC_MAX_LINKHDR, max_linkhdr, CTLFLAG_RD,
6780444f88SAndre Oppermann 	   &max_linkhdr, 0, "Size of largest link layer header");
6880444f88SAndre Oppermann SYSCTL_INT(_kern_ipc, KIPC_MAX_PROTOHDR, max_protohdr, CTLFLAG_RD,
6980444f88SAndre Oppermann 	   &max_protohdr, 0, "Size of largest protocol layer header");
7080444f88SAndre Oppermann SYSCTL_INT(_kern_ipc, KIPC_MAX_HDR, max_hdr, CTLFLAG_RD,
7180444f88SAndre Oppermann 	   &max_hdr, 0, "Size of largest link plus protocol header");
7280444f88SAndre Oppermann SYSCTL_INT(_kern_ipc, KIPC_MAX_DATALEN, max_datalen, CTLFLAG_RD,
7380444f88SAndre Oppermann 	   &max_datalen, 0, "Minimum space left in mbuf after max_hdr");
7451710a45SMike Silbersack #ifdef MBUF_STRESS_TEST
7555e9f80dSMike Silbersack SYSCTL_INT(_kern_ipc, OID_AUTO, m_defragpackets, CTLFLAG_RD,
7655e9f80dSMike Silbersack 	   &m_defragpackets, 0, "");
7755e9f80dSMike Silbersack SYSCTL_INT(_kern_ipc, OID_AUTO, m_defragbytes, CTLFLAG_RD,
7855e9f80dSMike Silbersack 	   &m_defragbytes, 0, "");
7955e9f80dSMike Silbersack SYSCTL_INT(_kern_ipc, OID_AUTO, m_defraguseless, CTLFLAG_RD,
8055e9f80dSMike Silbersack 	   &m_defraguseless, 0, "");
8155e9f80dSMike Silbersack SYSCTL_INT(_kern_ipc, OID_AUTO, m_defragfailure, CTLFLAG_RD,
8255e9f80dSMike Silbersack 	   &m_defragfailure, 0, "");
83352d050eSMike Silbersack SYSCTL_INT(_kern_ipc, OID_AUTO, m_defragrandomfailures, CTLFLAG_RW,
84352d050eSMike Silbersack 	   &m_defragrandomfailures, 0, "");
85352d050eSMike Silbersack #endif
86df8bae1dSRodney W. Grimes 
87df8bae1dSRodney W. Grimes /*
88f729ede6SAndre Oppermann  * Ensure the correct size of various mbuf parameters.  It could be off due
89f729ede6SAndre Oppermann  * to compiler-induced padding and alignment artifacts.
90f729ede6SAndre Oppermann  */
91f729ede6SAndre Oppermann CTASSERT(sizeof(struct mbuf) == MSIZE);
92f729ede6SAndre Oppermann CTASSERT(MSIZE - offsetof(struct mbuf, m_dat) == MLEN);
93f729ede6SAndre Oppermann CTASSERT(MSIZE - offsetof(struct mbuf, m_pktdat) == MHLEN);
94f729ede6SAndre Oppermann 
95f729ede6SAndre Oppermann /*
9629110f87SGleb Smirnoff  * m_get2() allocates minimum mbuf that would fit "size" argument.
9729110f87SGleb Smirnoff  */
9829110f87SGleb Smirnoff struct mbuf *
9941a7572bSGleb Smirnoff m_get2(int size, int how, short type, int flags)
10029110f87SGleb Smirnoff {
10129110f87SGleb Smirnoff 	struct mb_args args;
10229110f87SGleb Smirnoff 	struct mbuf *m, *n;
10329110f87SGleb Smirnoff 
10429110f87SGleb Smirnoff 	args.flags = flags;
10529110f87SGleb Smirnoff 	args.type = type;
10629110f87SGleb Smirnoff 
10729110f87SGleb Smirnoff 	if (size <= MHLEN || (size <= MLEN && (flags & M_PKTHDR) == 0))
10829110f87SGleb Smirnoff 		return (uma_zalloc_arg(zone_mbuf, &args, how));
10929110f87SGleb Smirnoff 	if (size <= MCLBYTES)
11029110f87SGleb Smirnoff 		return (uma_zalloc_arg(zone_pack, &args, how));
1113112ae76SGleb Smirnoff 
1123112ae76SGleb Smirnoff 	if (size > MJUMPAGESIZE)
11329110f87SGleb Smirnoff 		return (NULL);
11429110f87SGleb Smirnoff 
11529110f87SGleb Smirnoff 	m = uma_zalloc_arg(zone_mbuf, &args, how);
11629110f87SGleb Smirnoff 	if (m == NULL)
11729110f87SGleb Smirnoff 		return (NULL);
11829110f87SGleb Smirnoff 
1193112ae76SGleb Smirnoff 	n = uma_zalloc_arg(zone_jumbop, m, how);
12029110f87SGleb Smirnoff 	if (n == NULL) {
12129110f87SGleb Smirnoff 		uma_zfree(zone_mbuf, m);
12229110f87SGleb Smirnoff 		return (NULL);
12329110f87SGleb Smirnoff 	}
12429110f87SGleb Smirnoff 
12529110f87SGleb Smirnoff 	return (m);
12629110f87SGleb Smirnoff }
12729110f87SGleb Smirnoff 
12829110f87SGleb Smirnoff /*
12929110f87SGleb Smirnoff  * m_getjcl() returns an mbuf with a cluster of the specified size attached.
13029110f87SGleb Smirnoff  * For size it takes MCLBYTES, MJUMPAGESIZE, MJUM9BYTES, MJUM16BYTES.
13129110f87SGleb Smirnoff  */
13229110f87SGleb Smirnoff struct mbuf *
13329110f87SGleb Smirnoff m_getjcl(int how, short type, int flags, int size)
13429110f87SGleb Smirnoff {
13529110f87SGleb Smirnoff 	struct mb_args args;
13629110f87SGleb Smirnoff 	struct mbuf *m, *n;
13729110f87SGleb Smirnoff 	uma_zone_t zone;
13829110f87SGleb Smirnoff 
13929110f87SGleb Smirnoff 	if (size == MCLBYTES)
14029110f87SGleb Smirnoff 		return m_getcl(how, type, flags);
14129110f87SGleb Smirnoff 
14229110f87SGleb Smirnoff 	args.flags = flags;
14329110f87SGleb Smirnoff 	args.type = type;
14429110f87SGleb Smirnoff 
14529110f87SGleb Smirnoff 	m = uma_zalloc_arg(zone_mbuf, &args, how);
14629110f87SGleb Smirnoff 	if (m == NULL)
14729110f87SGleb Smirnoff 		return (NULL);
14829110f87SGleb Smirnoff 
14929110f87SGleb Smirnoff 	zone = m_getzone(size);
15029110f87SGleb Smirnoff 	n = uma_zalloc_arg(zone, m, how);
15129110f87SGleb Smirnoff 	if (n == NULL) {
15229110f87SGleb Smirnoff 		uma_zfree(zone_mbuf, m);
15329110f87SGleb Smirnoff 		return (NULL);
15429110f87SGleb Smirnoff 	}
15529110f87SGleb Smirnoff 	return (m);
15629110f87SGleb Smirnoff }
15729110f87SGleb Smirnoff 
15829110f87SGleb Smirnoff /*
159099a0e58SBosko Milekic  * Allocate a given length worth of mbufs and/or clusters (whatever fits
160099a0e58SBosko Milekic  * best) and return a pointer to the top of the allocated chain.  If an
161099a0e58SBosko Milekic  * existing mbuf chain is provided, then we will append the new chain
162099a0e58SBosko Milekic  * to the existing one but still return the top of the newly allocated
163099a0e58SBosko Milekic  * chain.
164099a0e58SBosko Milekic  */
165099a0e58SBosko Milekic struct mbuf *
1665e20f43dSAndre Oppermann m_getm2(struct mbuf *m, int len, int how, short type, int flags)
167099a0e58SBosko Milekic {
1685e20f43dSAndre Oppermann 	struct mbuf *mb, *nm = NULL, *mtail = NULL;
169099a0e58SBosko Milekic 
1705e20f43dSAndre Oppermann 	KASSERT(len >= 0, ("%s: len is < 0", __func__));
171099a0e58SBosko Milekic 
1725e20f43dSAndre Oppermann 	/* Validate flags. */
1735e20f43dSAndre Oppermann 	flags &= (M_PKTHDR | M_EOR);
1745e20f43dSAndre Oppermann 
1755e20f43dSAndre Oppermann 	/* Packet header mbuf must be first in chain. */
1765e20f43dSAndre Oppermann 	if ((flags & M_PKTHDR) && m != NULL)
1775e20f43dSAndre Oppermann 		flags &= ~M_PKTHDR;
1785e20f43dSAndre Oppermann 
1795e20f43dSAndre Oppermann 	/* Loop and append maximum sized mbufs to the chain tail. */
1805e20f43dSAndre Oppermann 	while (len > 0) {
1815e20f43dSAndre Oppermann 		if (len > MCLBYTES)
1825e20f43dSAndre Oppermann 			mb = m_getjcl(how, type, (flags & M_PKTHDR),
1835e20f43dSAndre Oppermann 			    MJUMPAGESIZE);
1845e20f43dSAndre Oppermann 		else if (len >= MINCLSIZE)
1855e20f43dSAndre Oppermann 			mb = m_getcl(how, type, (flags & M_PKTHDR));
1865e20f43dSAndre Oppermann 		else if (flags & M_PKTHDR)
1875e20f43dSAndre Oppermann 			mb = m_gethdr(how, type);
188099a0e58SBosko Milekic 		else
1895e20f43dSAndre Oppermann 			mb = m_get(how, type);
190099a0e58SBosko Milekic 
1915e20f43dSAndre Oppermann 		/* Fail the whole operation if one mbuf can't be allocated. */
1925e20f43dSAndre Oppermann 		if (mb == NULL) {
1935e20f43dSAndre Oppermann 			if (nm != NULL)
1945e20f43dSAndre Oppermann 				m_freem(nm);
1955e20f43dSAndre Oppermann 			return (NULL);
196099a0e58SBosko Milekic 		}
197099a0e58SBosko Milekic 
1985e20f43dSAndre Oppermann 		/* Book keeping. */
1995e20f43dSAndre Oppermann 		len -= (mb->m_flags & M_EXT) ? mb->m_ext.ext_size :
2005e20f43dSAndre Oppermann 			((mb->m_flags & M_PKTHDR) ? MHLEN : MLEN);
201099a0e58SBosko Milekic 		if (mtail != NULL)
2025e20f43dSAndre Oppermann 			mtail->m_next = mb;
2035e20f43dSAndre Oppermann 		else
2045e20f43dSAndre Oppermann 			nm = mb;
2055e20f43dSAndre Oppermann 		mtail = mb;
2065e20f43dSAndre Oppermann 		flags &= ~M_PKTHDR;	/* Only valid on the first mbuf. */
2075e20f43dSAndre Oppermann 	}
2085e20f43dSAndre Oppermann 	if (flags & M_EOR)
2095e20f43dSAndre Oppermann 		mtail->m_flags |= M_EOR;  /* Only valid on the last mbuf. */
2105e20f43dSAndre Oppermann 
2115e20f43dSAndre Oppermann 	/* If mbuf was supplied, append new chain to the end of it. */
2125e20f43dSAndre Oppermann 	if (m != NULL) {
2135e20f43dSAndre Oppermann 		for (mtail = m; mtail->m_next != NULL; mtail = mtail->m_next)
2145e20f43dSAndre Oppermann 			;
2155e20f43dSAndre Oppermann 		mtail->m_next = nm;
2165e20f43dSAndre Oppermann 		mtail->m_flags &= ~M_EOR;
2175e20f43dSAndre Oppermann 	} else
2185e20f43dSAndre Oppermann 		m = nm;
2195e20f43dSAndre Oppermann 
2205e20f43dSAndre Oppermann 	return (m);
221099a0e58SBosko Milekic }
222099a0e58SBosko Milekic 
223099a0e58SBosko Milekic /*
224099a0e58SBosko Milekic  * Free an entire chain of mbufs and associated external buffers, if
225099a0e58SBosko Milekic  * applicable.
226099a0e58SBosko Milekic  */
227099a0e58SBosko Milekic void
228099a0e58SBosko Milekic m_freem(struct mbuf *mb)
229099a0e58SBosko Milekic {
230099a0e58SBosko Milekic 
231099a0e58SBosko Milekic 	while (mb != NULL)
232099a0e58SBosko Milekic 		mb = m_free(mb);
233099a0e58SBosko Milekic }
234099a0e58SBosko Milekic 
2351a996ed1SEdward Tomasz Napierala /*-
236099a0e58SBosko Milekic  * Configure a provided mbuf to refer to the provided external storage
237099a0e58SBosko Milekic  * buffer and setup a reference count for said buffer.  If the setting
238099a0e58SBosko Milekic  * up of the reference count fails, the M_EXT bit will not be set.  If
239099a0e58SBosko Milekic  * successfull, the M_EXT bit is set in the mbuf's flags.
240099a0e58SBosko Milekic  *
241099a0e58SBosko Milekic  * Arguments:
242099a0e58SBosko Milekic  *    mb     The existing mbuf to which to attach the provided buffer.
243099a0e58SBosko Milekic  *    buf    The address of the provided external storage buffer.
244099a0e58SBosko Milekic  *    size   The size of the provided buffer.
245099a0e58SBosko Milekic  *    freef  A pointer to a routine that is responsible for freeing the
246099a0e58SBosko Milekic  *           provided external storage buffer.
247099a0e58SBosko Milekic  *    args   A pointer to an argument structure (of any type) to be passed
248099a0e58SBosko Milekic  *           to the provided freef routine (may be NULL).
249099a0e58SBosko Milekic  *    flags  Any other flags to be passed to the provided mbuf.
250099a0e58SBosko Milekic  *    type   The type that the external storage buffer should be
251099a0e58SBosko Milekic  *           labeled with.
252099a0e58SBosko Milekic  *
253099a0e58SBosko Milekic  * Returns:
254099a0e58SBosko Milekic  *    Nothing.
255099a0e58SBosko Milekic  */
2568c629bdfSGleb Smirnoff int
257099a0e58SBosko Milekic m_extadd(struct mbuf *mb, caddr_t buf, u_int size,
258bb25e5abSAndre Oppermann     int (*freef)(struct mbuf *, void *, void *), void *arg1, void *arg2,
2599a736876SAndre Oppermann     int flags, int type, int wait)
260099a0e58SBosko Milekic {
26156a4e45aSAndre Oppermann 	KASSERT(type != EXT_CLUSTER, ("%s: EXT_CLUSTER not allowed", __func__));
262099a0e58SBosko Milekic 
26356a4e45aSAndre Oppermann 	if (type != EXT_EXTREF)
2648c629bdfSGleb Smirnoff 		mb->m_ext.ref_cnt = uma_zalloc(zone_ext_refcnt, wait);
2658c629bdfSGleb Smirnoff 
2668c629bdfSGleb Smirnoff 	if (mb->m_ext.ref_cnt == NULL)
2678c629bdfSGleb Smirnoff 		return (ENOMEM);
2688c629bdfSGleb Smirnoff 
269099a0e58SBosko Milekic 	*(mb->m_ext.ref_cnt) = 1;
270099a0e58SBosko Milekic 	mb->m_flags |= (M_EXT | flags);
271099a0e58SBosko Milekic 	mb->m_ext.ext_buf = buf;
272099a0e58SBosko Milekic 	mb->m_data = mb->m_ext.ext_buf;
273099a0e58SBosko Milekic 	mb->m_ext.ext_size = size;
274099a0e58SBosko Milekic 	mb->m_ext.ext_free = freef;
275cf827063SPoul-Henning Kamp 	mb->m_ext.ext_arg1 = arg1;
276cf827063SPoul-Henning Kamp 	mb->m_ext.ext_arg2 = arg2;
277099a0e58SBosko Milekic 	mb->m_ext.ext_type = type;
278894734cbSAndre Oppermann 	mb->m_ext.ext_flags = 0;
2798c629bdfSGleb Smirnoff 
2808c629bdfSGleb Smirnoff 	return (0);
281099a0e58SBosko Milekic }
282099a0e58SBosko Milekic 
283099a0e58SBosko Milekic /*
284099a0e58SBosko Milekic  * Non-directly-exported function to clean up after mbufs with M_EXT
28556a4e45aSAndre Oppermann  * storage attached to them if the reference count hits 1.
286099a0e58SBosko Milekic  */
287099a0e58SBosko Milekic void
288099a0e58SBosko Milekic mb_free_ext(struct mbuf *m)
289099a0e58SBosko Milekic {
2901227f20dSAndre Oppermann 	int skipmbuf;
291457869b9SKip Macy 
29256a4e45aSAndre Oppermann 	KASSERT((m->m_flags & M_EXT) == M_EXT, ("%s: M_EXT not set", __func__));
29356a4e45aSAndre Oppermann 	KASSERT(m->m_ext.ref_cnt != NULL, ("%s: ref_cnt not set", __func__));
2943d2a3ff2SBosko Milekic 
2951227f20dSAndre Oppermann 	/*
2961227f20dSAndre Oppermann 	 * check if the header is embedded in the cluster
2971227f20dSAndre Oppermann 	 */
2981227f20dSAndre Oppermann 	skipmbuf = (m->m_flags & M_NOFREE);
2991227f20dSAndre Oppermann 
30056a4e45aSAndre Oppermann 	/* Free attached storage if this mbuf is the only reference to it. */
30156a4e45aSAndre Oppermann 	if (*(m->m_ext.ref_cnt) == 1 ||
302adf5d1c6SRandall Stewart 	    atomic_fetchadd_int(m->m_ext.ref_cnt, -1) == 1) {
30356a4e45aSAndre Oppermann 		switch (m->m_ext.ext_type) {
304cd5bb63bSAndre Oppermann 		case EXT_PACKET:	/* The packet zone is special. */
305a5f77087SAndre Oppermann 			if (*(m->m_ext.ref_cnt) == 0)
306a5f77087SAndre Oppermann 				*(m->m_ext.ref_cnt) = 1;
307099a0e58SBosko Milekic 			uma_zfree(zone_pack, m);
30856a4e45aSAndre Oppermann 			return;		/* Job done. */
309cd5bb63bSAndre Oppermann 		case EXT_CLUSTER:
310cd5bb63bSAndre Oppermann 			uma_zfree(zone_clust, m->m_ext.ext_buf);
31156a4e45aSAndre Oppermann 			break;
312ec63cb90SAndre Oppermann 		case EXT_JUMBOP:
313ec63cb90SAndre Oppermann 			uma_zfree(zone_jumbop, m->m_ext.ext_buf);
314d5269a63SAndre Oppermann 			break;
31556a4e45aSAndre Oppermann 		case EXT_JUMBO9:
31656a4e45aSAndre Oppermann 			uma_zfree(zone_jumbo9, m->m_ext.ext_buf);
31756a4e45aSAndre Oppermann 			break;
31856a4e45aSAndre Oppermann 		case EXT_JUMBO16:
31956a4e45aSAndre Oppermann 			uma_zfree(zone_jumbo16, m->m_ext.ext_buf);
32056a4e45aSAndre Oppermann 			break;
32156a4e45aSAndre Oppermann 		case EXT_SFBUF:
32256a4e45aSAndre Oppermann 		case EXT_NET_DRV:
32356a4e45aSAndre Oppermann 		case EXT_MOD_TYPE:
32456a4e45aSAndre Oppermann 		case EXT_DISPOSABLE:
32556a4e45aSAndre Oppermann 			*(m->m_ext.ref_cnt) = 0;
32656a4e45aSAndre Oppermann 			uma_zfree(zone_ext_refcnt, __DEVOLATILE(u_int *,
32756a4e45aSAndre Oppermann 				m->m_ext.ref_cnt));
32856a4e45aSAndre Oppermann 			/* FALLTHROUGH */
32956a4e45aSAndre Oppermann 		case EXT_EXTREF:
33056a4e45aSAndre Oppermann 			KASSERT(m->m_ext.ext_free != NULL,
33156a4e45aSAndre Oppermann 				("%s: ext_free not set", __func__));
332bb25e5abSAndre Oppermann 			(void)(*(m->m_ext.ext_free))(m, m->m_ext.ext_arg1,
333cf827063SPoul-Henning Kamp 			    m->m_ext.ext_arg2);
33456a4e45aSAndre Oppermann 			break;
33556a4e45aSAndre Oppermann 		default:
33656a4e45aSAndre Oppermann 			KASSERT(m->m_ext.ext_type == 0,
33756a4e45aSAndre Oppermann 				("%s: unknown ext_type", __func__));
3383d2a3ff2SBosko Milekic 		}
33956a4e45aSAndre Oppermann 	}
3401227f20dSAndre Oppermann 	if (skipmbuf)
3411227f20dSAndre Oppermann 		return;
342457869b9SKip Macy 
34356a4e45aSAndre Oppermann 	/*
34456a4e45aSAndre Oppermann 	 * Free this mbuf back to the mbuf zone with all m_ext
34556a4e45aSAndre Oppermann 	 * information purged.
34656a4e45aSAndre Oppermann 	 */
34796e12413SBosko Milekic 	m->m_ext.ext_buf = NULL;
34856a4e45aSAndre Oppermann 	m->m_ext.ext_free = NULL;
349cf827063SPoul-Henning Kamp 	m->m_ext.ext_arg1 = NULL;
350cf827063SPoul-Henning Kamp 	m->m_ext.ext_arg2 = NULL;
35156a4e45aSAndre Oppermann 	m->m_ext.ref_cnt = NULL;
35256a4e45aSAndre Oppermann 	m->m_ext.ext_size = 0;
35356a4e45aSAndre Oppermann 	m->m_ext.ext_type = 0;
354894734cbSAndre Oppermann 	m->m_ext.ext_flags = 0;
35556a4e45aSAndre Oppermann 	m->m_flags &= ~M_EXT;
35696e12413SBosko Milekic 	uma_zfree(zone_mbuf, m);
357b5b2ea9aSBosko Milekic }
358099a0e58SBosko Milekic 
359099a0e58SBosko Milekic /*
3606bccea7cSRebecca Cran  * Attach the cluster from *m to *n, set up m_ext in *n
36156a4e45aSAndre Oppermann  * and bump the refcount of the cluster.
36256a4e45aSAndre Oppermann  */
36356a4e45aSAndre Oppermann static void
36456a4e45aSAndre Oppermann mb_dupcl(struct mbuf *n, struct mbuf *m)
36556a4e45aSAndre Oppermann {
36656a4e45aSAndre Oppermann 	KASSERT((m->m_flags & M_EXT) == M_EXT, ("%s: M_EXT not set", __func__));
36756a4e45aSAndre Oppermann 	KASSERT(m->m_ext.ref_cnt != NULL, ("%s: ref_cnt not set", __func__));
36856a4e45aSAndre Oppermann 	KASSERT((n->m_flags & M_EXT) == 0, ("%s: M_EXT set", __func__));
36956a4e45aSAndre Oppermann 
37056a4e45aSAndre Oppermann 	if (*(m->m_ext.ref_cnt) == 1)
37156a4e45aSAndre Oppermann 		*(m->m_ext.ref_cnt) += 1;
37256a4e45aSAndre Oppermann 	else
37356a4e45aSAndre Oppermann 		atomic_add_int(m->m_ext.ref_cnt, 1);
37456a4e45aSAndre Oppermann 	n->m_ext.ext_buf = m->m_ext.ext_buf;
37556a4e45aSAndre Oppermann 	n->m_ext.ext_free = m->m_ext.ext_free;
376cf827063SPoul-Henning Kamp 	n->m_ext.ext_arg1 = m->m_ext.ext_arg1;
377cf827063SPoul-Henning Kamp 	n->m_ext.ext_arg2 = m->m_ext.ext_arg2;
37856a4e45aSAndre Oppermann 	n->m_ext.ext_size = m->m_ext.ext_size;
37956a4e45aSAndre Oppermann 	n->m_ext.ref_cnt = m->m_ext.ref_cnt;
38056a4e45aSAndre Oppermann 	n->m_ext.ext_type = m->m_ext.ext_type;
381894734cbSAndre Oppermann 	n->m_ext.ext_flags = m->m_ext.ext_flags;
38256a4e45aSAndre Oppermann 	n->m_flags |= M_EXT;
38332a8b1d8SColin Percival 	n->m_flags |= m->m_flags & M_RDONLY;
38456a4e45aSAndre Oppermann }
38556a4e45aSAndre Oppermann 
38656a4e45aSAndre Oppermann /*
387ed111688SAndre Oppermann  * Clean up mbuf (chain) from any tags and packet headers.
388e0068c3aSAndre Oppermann  * If "all" is set then the first mbuf in the chain will be
389e0068c3aSAndre Oppermann  * cleaned too.
390ed111688SAndre Oppermann  */
391ed111688SAndre Oppermann void
392e0068c3aSAndre Oppermann m_demote(struct mbuf *m0, int all)
393ed111688SAndre Oppermann {
394ed111688SAndre Oppermann 	struct mbuf *m;
395ed111688SAndre Oppermann 
396ed111688SAndre Oppermann 	for (m = all ? m0 : m0->m_next; m != NULL; m = m->m_next) {
397ed111688SAndre Oppermann 		if (m->m_flags & M_PKTHDR) {
398ed111688SAndre Oppermann 			m_tag_delete_chain(m, NULL);
399ed111688SAndre Oppermann 			m->m_flags &= ~M_PKTHDR;
400ed111688SAndre Oppermann 			bzero(&m->m_pkthdr, sizeof(struct pkthdr));
401ed111688SAndre Oppermann 		}
4020cb6db1dSAndre Oppermann 		if (m != m0 && m->m_nextpkt != NULL) {
4030cb6db1dSAndre Oppermann 			KASSERT(m->m_nextpkt == NULL,
4040cb6db1dSAndre Oppermann 			    ("%s: m_nextpkt not NULL", __func__));
4050cb6db1dSAndre Oppermann 			m_freem(m->m_nextpkt);
406ed111688SAndre Oppermann 			m->m_nextpkt = NULL;
4070cb6db1dSAndre Oppermann 		}
4081227f20dSAndre Oppermann 		m->m_flags = m->m_flags & (M_EXT|M_RDONLY|M_NOFREE);
409ed111688SAndre Oppermann 	}
410ed111688SAndre Oppermann }
411ed111688SAndre Oppermann 
412ed111688SAndre Oppermann /*
413fdcc028dSAndre Oppermann  * Sanity checks on mbuf (chain) for use in KASSERT() and general
414fdcc028dSAndre Oppermann  * debugging.
415fdcc028dSAndre Oppermann  * Returns 0 or panics when bad and 1 on all tests passed.
416fdcc028dSAndre Oppermann  * Sanitize, 0 to run M_SANITY_ACTION, 1 to garble things so they
417fdcc028dSAndre Oppermann  * blow up later.
418a048affbSAndre Oppermann  */
419a048affbSAndre Oppermann int
420a048affbSAndre Oppermann m_sanity(struct mbuf *m0, int sanitize)
421a048affbSAndre Oppermann {
422a048affbSAndre Oppermann 	struct mbuf *m;
423a048affbSAndre Oppermann 	caddr_t a, b;
424a048affbSAndre Oppermann 	int pktlen = 0;
425a048affbSAndre Oppermann 
42621ee3e7aSKip Macy #ifdef INVARIANTS
42721ee3e7aSKip Macy #define	M_SANITY_ACTION(s)	panic("mbuf %p: " s, m)
42821ee3e7aSKip Macy #else
42921ee3e7aSKip Macy #define	M_SANITY_ACTION(s)	printf("mbuf %p: " s, m)
43021ee3e7aSKip Macy #endif
431a048affbSAndre Oppermann 
432fdcc028dSAndre Oppermann 	for (m = m0; m != NULL; m = m->m_next) {
433a048affbSAndre Oppermann 		/*
434a048affbSAndre Oppermann 		 * Basic pointer checks.  If any of these fails then some
435a048affbSAndre Oppermann 		 * unrelated kernel memory before or after us is trashed.
436a048affbSAndre Oppermann 		 * No way to recover from that.
437a048affbSAndre Oppermann 		 */
438fdcc028dSAndre Oppermann 		a = ((m->m_flags & M_EXT) ? m->m_ext.ext_buf :
439fdcc028dSAndre Oppermann 			((m->m_flags & M_PKTHDR) ? (caddr_t)(&m->m_pktdat) :
440a048affbSAndre Oppermann 			 (caddr_t)(&m->m_dat)) );
441a048affbSAndre Oppermann 		b = (caddr_t)(a + (m->m_flags & M_EXT ? m->m_ext.ext_size :
442fdcc028dSAndre Oppermann 			((m->m_flags & M_PKTHDR) ? MHLEN : MLEN)));
443a048affbSAndre Oppermann 		if ((caddr_t)m->m_data < a)
444a048affbSAndre Oppermann 			M_SANITY_ACTION("m_data outside mbuf data range left");
445a048affbSAndre Oppermann 		if ((caddr_t)m->m_data > b)
446a048affbSAndre Oppermann 			M_SANITY_ACTION("m_data outside mbuf data range right");
447a048affbSAndre Oppermann 		if ((caddr_t)m->m_data + m->m_len > b)
448a048affbSAndre Oppermann 			M_SANITY_ACTION("m_data + m_len exeeds mbuf space");
449a048affbSAndre Oppermann 
450a048affbSAndre Oppermann 		/* m->m_nextpkt may only be set on first mbuf in chain. */
451fdcc028dSAndre Oppermann 		if (m != m0 && m->m_nextpkt != NULL) {
452a048affbSAndre Oppermann 			if (sanitize) {
453a048affbSAndre Oppermann 				m_freem(m->m_nextpkt);
454a048affbSAndre Oppermann 				m->m_nextpkt = (struct mbuf *)0xDEADC0DE;
455a048affbSAndre Oppermann 			} else
456a048affbSAndre Oppermann 				M_SANITY_ACTION("m->m_nextpkt on in-chain mbuf");
457a048affbSAndre Oppermann 		}
458a048affbSAndre Oppermann 
459a048affbSAndre Oppermann 		/* packet length (not mbuf length!) calculation */
460a048affbSAndre Oppermann 		if (m0->m_flags & M_PKTHDR)
461a048affbSAndre Oppermann 			pktlen += m->m_len;
462a048affbSAndre Oppermann 
463a048affbSAndre Oppermann 		/* m_tags may only be attached to first mbuf in chain. */
464a048affbSAndre Oppermann 		if (m != m0 && m->m_flags & M_PKTHDR &&
465a048affbSAndre Oppermann 		    !SLIST_EMPTY(&m->m_pkthdr.tags)) {
466a048affbSAndre Oppermann 			if (sanitize) {
467a048affbSAndre Oppermann 				m_tag_delete_chain(m, NULL);
468a048affbSAndre Oppermann 				/* put in 0xDEADC0DE perhaps? */
469fdcc028dSAndre Oppermann 			} else
470a048affbSAndre Oppermann 				M_SANITY_ACTION("m_tags on in-chain mbuf");
471a048affbSAndre Oppermann 		}
472a048affbSAndre Oppermann 
473a048affbSAndre Oppermann 		/* M_PKTHDR may only be set on first mbuf in chain */
474a048affbSAndre Oppermann 		if (m != m0 && m->m_flags & M_PKTHDR) {
475a048affbSAndre Oppermann 			if (sanitize) {
476a048affbSAndre Oppermann 				bzero(&m->m_pkthdr, sizeof(m->m_pkthdr));
477a048affbSAndre Oppermann 				m->m_flags &= ~M_PKTHDR;
478a048affbSAndre Oppermann 				/* put in 0xDEADCODE and leave hdr flag in */
479a048affbSAndre Oppermann 			} else
480a048affbSAndre Oppermann 				M_SANITY_ACTION("M_PKTHDR on in-chain mbuf");
481a048affbSAndre Oppermann 		}
482a048affbSAndre Oppermann 	}
483fdcc028dSAndre Oppermann 	m = m0;
484fdcc028dSAndre Oppermann 	if (pktlen && pktlen != m->m_pkthdr.len) {
485a048affbSAndre Oppermann 		if (sanitize)
486fdcc028dSAndre Oppermann 			m->m_pkthdr.len = 0;
487a048affbSAndre Oppermann 		else
488a048affbSAndre Oppermann 			M_SANITY_ACTION("m_pkthdr.len != mbuf chain length");
489a048affbSAndre Oppermann 	}
490a048affbSAndre Oppermann 	return 1;
491fdcc028dSAndre Oppermann 
492fdcc028dSAndre Oppermann #undef	M_SANITY_ACTION
493a048affbSAndre Oppermann }
494a048affbSAndre Oppermann 
495a048affbSAndre Oppermann 
496a048affbSAndre Oppermann /*
4979967cafcSSam Leffler  * "Move" mbuf pkthdr from "from" to "to".
498e37b1fcdSRobert Watson  * "from" must have M_PKTHDR set, and "to" must be empty.
499e37b1fcdSRobert Watson  */
500e37b1fcdSRobert Watson void
5019967cafcSSam Leffler m_move_pkthdr(struct mbuf *to, struct mbuf *from)
502e37b1fcdSRobert Watson {
503e37b1fcdSRobert Watson 
504e37b1fcdSRobert Watson #if 0
5059967cafcSSam Leffler 	/* see below for why these are not enabled */
506fe584538SDag-Erling Smørgrav 	M_ASSERTPKTHDR(to);
507225bff6fSRobert Watson 	/* Note: with MAC, this may not be a good assertion. */
5089967cafcSSam Leffler 	KASSERT(SLIST_EMPTY(&to->m_pkthdr.tags),
5099967cafcSSam Leffler 	    ("m_move_pkthdr: to has tags"));
510e37b1fcdSRobert Watson #endif
511e32a5b94SRobert Watson #ifdef MAC
512225bff6fSRobert Watson 	/*
513225bff6fSRobert Watson 	 * XXXMAC: It could be this should also occur for non-MAC?
514225bff6fSRobert Watson 	 */
515e32a5b94SRobert Watson 	if (to->m_flags & M_PKTHDR)
516225bff6fSRobert Watson 		m_tag_delete_chain(to, NULL);
517e32a5b94SRobert Watson #endif
518a4e71429SSam Leffler 	to->m_flags = (from->m_flags & M_COPYFLAGS) | (to->m_flags & M_EXT);
519a4e71429SSam Leffler 	if ((to->m_flags & M_EXT) == 0)
5209967cafcSSam Leffler 		to->m_data = to->m_pktdat;
5219967cafcSSam Leffler 	to->m_pkthdr = from->m_pkthdr;		/* especially tags */
5229967cafcSSam Leffler 	SLIST_INIT(&from->m_pkthdr.tags);	/* purge tags from src */
5239967cafcSSam Leffler 	from->m_flags &= ~M_PKTHDR;
5249967cafcSSam Leffler }
5259967cafcSSam Leffler 
5269967cafcSSam Leffler /*
5279967cafcSSam Leffler  * Duplicate "from"'s mbuf pkthdr in "to".
5289967cafcSSam Leffler  * "from" must have M_PKTHDR set, and "to" must be empty.
5299967cafcSSam Leffler  * In particular, this does a deep copy of the packet tags.
5309967cafcSSam Leffler  */
5319967cafcSSam Leffler int
5329967cafcSSam Leffler m_dup_pkthdr(struct mbuf *to, struct mbuf *from, int how)
5339967cafcSSam Leffler {
5349967cafcSSam Leffler 
5359967cafcSSam Leffler #if 0
5369967cafcSSam Leffler 	/*
5379967cafcSSam Leffler 	 * The mbuf allocator only initializes the pkthdr
538c95be8b5SGleb Smirnoff 	 * when the mbuf is allocated with m_gethdr(). Many users
539c95be8b5SGleb Smirnoff 	 * (e.g. m_copy*, m_prepend) use m_get() and then
5409967cafcSSam Leffler 	 * smash the pkthdr as needed causing these
5419967cafcSSam Leffler 	 * assertions to trip.  For now just disable them.
5429967cafcSSam Leffler 	 */
543fe584538SDag-Erling Smørgrav 	M_ASSERTPKTHDR(to);
544225bff6fSRobert Watson 	/* Note: with MAC, this may not be a good assertion. */
5459967cafcSSam Leffler 	KASSERT(SLIST_EMPTY(&to->m_pkthdr.tags), ("m_dup_pkthdr: to has tags"));
5469967cafcSSam Leffler #endif
547063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(how);
5489967cafcSSam Leffler #ifdef MAC
5499967cafcSSam Leffler 	if (to->m_flags & M_PKTHDR)
550225bff6fSRobert Watson 		m_tag_delete_chain(to, NULL);
5519967cafcSSam Leffler #endif
552df8c7fc9SMike Silbersack 	to->m_flags = (from->m_flags & M_COPYFLAGS) | (to->m_flags & M_EXT);
553df8c7fc9SMike Silbersack 	if ((to->m_flags & M_EXT) == 0)
5549967cafcSSam Leffler 		to->m_data = to->m_pktdat;
555e37b1fcdSRobert Watson 	to->m_pkthdr = from->m_pkthdr;
5569967cafcSSam Leffler 	SLIST_INIT(&to->m_pkthdr.tags);
557*94985f74SGleb Smirnoff 	return (m_tag_copy_chain(to, from, how));
558e37b1fcdSRobert Watson }
559e37b1fcdSRobert Watson 
560e37b1fcdSRobert Watson /*
561df8bae1dSRodney W. Grimes  * Lesser-used path for M_PREPEND:
562df8bae1dSRodney W. Grimes  * allocate new mbuf to prepend to chain,
563df8bae1dSRodney W. Grimes  * copy junk along.
564df8bae1dSRodney W. Grimes  */
565df8bae1dSRodney W. Grimes struct mbuf *
566122a814aSBosko Milekic m_prepend(struct mbuf *m, int len, int how)
567df8bae1dSRodney W. Grimes {
568df8bae1dSRodney W. Grimes 	struct mbuf *mn;
569df8bae1dSRodney W. Grimes 
570f8bf8e39SMike Silbersack 	if (m->m_flags & M_PKTHDR)
571c95be8b5SGleb Smirnoff 		mn = m_gethdr(how, m->m_type);
572f8bf8e39SMike Silbersack 	else
573c95be8b5SGleb Smirnoff 		mn = m_get(how, m->m_type);
574122a814aSBosko Milekic 	if (mn == NULL) {
575df8bae1dSRodney W. Grimes 		m_freem(m);
576122a814aSBosko Milekic 		return (NULL);
577df8bae1dSRodney W. Grimes 	}
578225bff6fSRobert Watson 	if (m->m_flags & M_PKTHDR)
579c95be8b5SGleb Smirnoff 		m_move_pkthdr(mn, m);
580df8bae1dSRodney W. Grimes 	mn->m_next = m;
581df8bae1dSRodney W. Grimes 	m = mn;
5825288989fSRandall Stewart 	if(m->m_flags & M_PKTHDR) {
583df8bae1dSRodney W. Grimes 		if (len < MHLEN)
584df8bae1dSRodney W. Grimes 			MH_ALIGN(m, len);
5855288989fSRandall Stewart 	} else {
5865288989fSRandall Stewart 		if (len < MLEN)
5875288989fSRandall Stewart 			M_ALIGN(m, len);
5885288989fSRandall Stewart 	}
589df8bae1dSRodney W. Grimes 	m->m_len = len;
590df8bae1dSRodney W. Grimes 	return (m);
591df8bae1dSRodney W. Grimes }
592df8bae1dSRodney W. Grimes 
593df8bae1dSRodney W. Grimes /*
594df8bae1dSRodney W. Grimes  * Make a copy of an mbuf chain starting "off0" bytes from the beginning,
595df8bae1dSRodney W. Grimes  * continuing for "len" bytes.  If len is M_COPYALL, copy to end of mbuf.
596eb1b1807SGleb Smirnoff  * The wait parameter is a choice of M_WAITOK/M_NOWAIT from caller.
5971c38f2eaSArchie Cobbs  * Note that the copy is read-only, because clusters are not copied,
5981c38f2eaSArchie Cobbs  * only their reference counts are incremented.
599df8bae1dSRodney W. Grimes  */
600df8bae1dSRodney W. Grimes struct mbuf *
601122a814aSBosko Milekic m_copym(struct mbuf *m, int off0, int len, int wait)
602df8bae1dSRodney W. Grimes {
603122a814aSBosko Milekic 	struct mbuf *n, **np;
604122a814aSBosko Milekic 	int off = off0;
605df8bae1dSRodney W. Grimes 	struct mbuf *top;
606df8bae1dSRodney W. Grimes 	int copyhdr = 0;
607df8bae1dSRodney W. Grimes 
608e0a653ddSAlfred Perlstein 	KASSERT(off >= 0, ("m_copym, negative off %d", off));
609e0a653ddSAlfred Perlstein 	KASSERT(len >= 0, ("m_copym, negative len %d", len));
610063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(wait);
611df8bae1dSRodney W. Grimes 	if (off == 0 && m->m_flags & M_PKTHDR)
612df8bae1dSRodney W. Grimes 		copyhdr = 1;
613df8bae1dSRodney W. Grimes 	while (off > 0) {
614e0a653ddSAlfred Perlstein 		KASSERT(m != NULL, ("m_copym, offset > size of mbuf chain"));
615df8bae1dSRodney W. Grimes 		if (off < m->m_len)
616df8bae1dSRodney W. Grimes 			break;
617df8bae1dSRodney W. Grimes 		off -= m->m_len;
618df8bae1dSRodney W. Grimes 		m = m->m_next;
619df8bae1dSRodney W. Grimes 	}
620df8bae1dSRodney W. Grimes 	np = &top;
621df8bae1dSRodney W. Grimes 	top = 0;
622df8bae1dSRodney W. Grimes 	while (len > 0) {
623122a814aSBosko Milekic 		if (m == NULL) {
624e0a653ddSAlfred Perlstein 			KASSERT(len == M_COPYALL,
625e0a653ddSAlfred Perlstein 			    ("m_copym, length > size of mbuf chain"));
626df8bae1dSRodney W. Grimes 			break;
627df8bae1dSRodney W. Grimes 		}
628f8bf8e39SMike Silbersack 		if (copyhdr)
629c95be8b5SGleb Smirnoff 			n = m_gethdr(wait, m->m_type);
630f8bf8e39SMike Silbersack 		else
631c95be8b5SGleb Smirnoff 			n = m_get(wait, m->m_type);
632df8bae1dSRodney W. Grimes 		*np = n;
633122a814aSBosko Milekic 		if (n == NULL)
634df8bae1dSRodney W. Grimes 			goto nospace;
635df8bae1dSRodney W. Grimes 		if (copyhdr) {
6369967cafcSSam Leffler 			if (!m_dup_pkthdr(n, m, wait))
6379967cafcSSam Leffler 				goto nospace;
638df8bae1dSRodney W. Grimes 			if (len == M_COPYALL)
639df8bae1dSRodney W. Grimes 				n->m_pkthdr.len -= off0;
640df8bae1dSRodney W. Grimes 			else
641df8bae1dSRodney W. Grimes 				n->m_pkthdr.len = len;
642df8bae1dSRodney W. Grimes 			copyhdr = 0;
643df8bae1dSRodney W. Grimes 		}
644df8bae1dSRodney W. Grimes 		n->m_len = min(len, m->m_len - off);
645df8bae1dSRodney W. Grimes 		if (m->m_flags & M_EXT) {
646df8bae1dSRodney W. Grimes 			n->m_data = m->m_data + off;
64756a4e45aSAndre Oppermann 			mb_dupcl(n, m);
648df8bae1dSRodney W. Grimes 		} else
649df8bae1dSRodney W. Grimes 			bcopy(mtod(m, caddr_t)+off, mtod(n, caddr_t),
650bd395ae8SBosko Milekic 			    (u_int)n->m_len);
651df8bae1dSRodney W. Grimes 		if (len != M_COPYALL)
652df8bae1dSRodney W. Grimes 			len -= n->m_len;
653df8bae1dSRodney W. Grimes 		off = 0;
654df8bae1dSRodney W. Grimes 		m = m->m_next;
655df8bae1dSRodney W. Grimes 		np = &n->m_next;
656df8bae1dSRodney W. Grimes 	}
65708442f8aSBosko Milekic 
658df8bae1dSRodney W. Grimes 	return (top);
659df8bae1dSRodney W. Grimes nospace:
660df8bae1dSRodney W. Grimes 	m_freem(top);
661122a814aSBosko Milekic 	return (NULL);
662df8bae1dSRodney W. Grimes }
663df8bae1dSRodney W. Grimes 
664df8bae1dSRodney W. Grimes /*
6654da84431SAndre Oppermann  * Returns mbuf chain with new head for the prepending case.
6664da84431SAndre Oppermann  * Copies from mbuf (chain) n from off for len to mbuf (chain) m
6674da84431SAndre Oppermann  * either prepending or appending the data.
6684da84431SAndre Oppermann  * The resulting mbuf (chain) m is fully writeable.
6694da84431SAndre Oppermann  * m is destination (is made writeable)
6704da84431SAndre Oppermann  * n is source, off is offset in source, len is len from offset
6714da84431SAndre Oppermann  * dir, 0 append, 1 prepend
6724da84431SAndre Oppermann  * how, wait or nowait
6734da84431SAndre Oppermann  */
6744da84431SAndre Oppermann 
6754da84431SAndre Oppermann static int
6764da84431SAndre Oppermann m_bcopyxxx(void *s, void *t, u_int len)
6774da84431SAndre Oppermann {
6784da84431SAndre Oppermann 	bcopy(s, t, (size_t)len);
6794da84431SAndre Oppermann 	return 0;
6804da84431SAndre Oppermann }
6814da84431SAndre Oppermann 
6824da84431SAndre Oppermann struct mbuf *
6834da84431SAndre Oppermann m_copymdata(struct mbuf *m, struct mbuf *n, int off, int len,
6844da84431SAndre Oppermann     int prep, int how)
6854da84431SAndre Oppermann {
68656a4e45aSAndre Oppermann 	struct mbuf *mm, *x, *z, *prev = NULL;
6874da84431SAndre Oppermann 	caddr_t p;
68856a4e45aSAndre Oppermann 	int i, nlen = 0;
6894da84431SAndre Oppermann 	caddr_t buf[MLEN];
6904da84431SAndre Oppermann 
6914da84431SAndre Oppermann 	KASSERT(m != NULL && n != NULL, ("m_copymdata, no target or source"));
6924da84431SAndre Oppermann 	KASSERT(off >= 0, ("m_copymdata, negative off %d", off));
6934da84431SAndre Oppermann 	KASSERT(len >= 0, ("m_copymdata, negative len %d", len));
6944da84431SAndre Oppermann 	KASSERT(prep == 0 || prep == 1, ("m_copymdata, unknown direction %d", prep));
6954da84431SAndre Oppermann 
69656a4e45aSAndre Oppermann 	mm = m;
69756a4e45aSAndre Oppermann 	if (!prep) {
69856a4e45aSAndre Oppermann 		while(mm->m_next) {
69956a4e45aSAndre Oppermann 			prev = mm;
70056a4e45aSAndre Oppermann 			mm = mm->m_next;
7014da84431SAndre Oppermann 		}
7024da84431SAndre Oppermann 	}
7034da84431SAndre Oppermann 	for (z = n; z != NULL; z = z->m_next)
7044da84431SAndre Oppermann 		nlen += z->m_len;
7054da84431SAndre Oppermann 	if (len == M_COPYALL)
7064da84431SAndre Oppermann 		len = nlen - off;
7074da84431SAndre Oppermann 	if (off + len > nlen || len < 1)
7084da84431SAndre Oppermann 		return NULL;
7094da84431SAndre Oppermann 
71056a4e45aSAndre Oppermann 	if (!M_WRITABLE(mm)) {
71156a4e45aSAndre Oppermann 		/* XXX: Use proper m_xxx function instead. */
71256a4e45aSAndre Oppermann 		x = m_getcl(how, MT_DATA, mm->m_flags);
71356a4e45aSAndre Oppermann 		if (x == NULL)
71456a4e45aSAndre Oppermann 			return NULL;
71556a4e45aSAndre Oppermann 		bcopy(mm->m_ext.ext_buf, x->m_ext.ext_buf, x->m_ext.ext_size);
71656a4e45aSAndre Oppermann 		p = x->m_ext.ext_buf + (mm->m_data - mm->m_ext.ext_buf);
71756a4e45aSAndre Oppermann 		x->m_data = p;
71856a4e45aSAndre Oppermann 		mm->m_next = NULL;
71956a4e45aSAndre Oppermann 		if (mm != m)
72056a4e45aSAndre Oppermann 			prev->m_next = x;
72156a4e45aSAndre Oppermann 		m_free(mm);
72256a4e45aSAndre Oppermann 		mm = x;
72356a4e45aSAndre Oppermann 	}
72456a4e45aSAndre Oppermann 
7254da84431SAndre Oppermann 	/*
7264da84431SAndre Oppermann 	 * Append/prepend the data.  Allocating mbufs as necessary.
7274da84431SAndre Oppermann 	 */
7284da84431SAndre Oppermann 	/* Shortcut if enough free space in first/last mbuf. */
7294da84431SAndre Oppermann 	if (!prep && M_TRAILINGSPACE(mm) >= len) {
7304da84431SAndre Oppermann 		m_apply(n, off, len, m_bcopyxxx, mtod(mm, caddr_t) +
7314da84431SAndre Oppermann 			 mm->m_len);
7324da84431SAndre Oppermann 		mm->m_len += len;
7334da84431SAndre Oppermann 		mm->m_pkthdr.len += len;
7344da84431SAndre Oppermann 		return m;
7354da84431SAndre Oppermann 	}
7364da84431SAndre Oppermann 	if (prep && M_LEADINGSPACE(mm) >= len) {
7374da84431SAndre Oppermann 		mm->m_data = mtod(mm, caddr_t) - len;
7384da84431SAndre Oppermann 		m_apply(n, off, len, m_bcopyxxx, mtod(mm, caddr_t));
7394da84431SAndre Oppermann 		mm->m_len += len;
7404da84431SAndre Oppermann 		mm->m_pkthdr.len += len;
7414da84431SAndre Oppermann 		return mm;
7424da84431SAndre Oppermann 	}
7434da84431SAndre Oppermann 
7444da84431SAndre Oppermann 	/* Expand first/last mbuf to cluster if possible. */
7454da84431SAndre Oppermann 	if (!prep && !(mm->m_flags & M_EXT) && len > M_TRAILINGSPACE(mm)) {
7464da84431SAndre Oppermann 		bcopy(mm->m_data, &buf, mm->m_len);
7474da84431SAndre Oppermann 		m_clget(mm, how);
7484da84431SAndre Oppermann 		if (!(mm->m_flags & M_EXT))
7494da84431SAndre Oppermann 			return NULL;
7504da84431SAndre Oppermann 		bcopy(&buf, mm->m_ext.ext_buf, mm->m_len);
7514da84431SAndre Oppermann 		mm->m_data = mm->m_ext.ext_buf;
7524da84431SAndre Oppermann 	}
7534da84431SAndre Oppermann 	if (prep && !(mm->m_flags & M_EXT) && len > M_LEADINGSPACE(mm)) {
7544da84431SAndre Oppermann 		bcopy(mm->m_data, &buf, mm->m_len);
7554da84431SAndre Oppermann 		m_clget(mm, how);
7564da84431SAndre Oppermann 		if (!(mm->m_flags & M_EXT))
7574da84431SAndre Oppermann 			return NULL;
7584da84431SAndre Oppermann 		bcopy(&buf, (caddr_t *)mm->m_ext.ext_buf +
7594da84431SAndre Oppermann 		       mm->m_ext.ext_size - mm->m_len, mm->m_len);
7604da84431SAndre Oppermann 		mm->m_data = (caddr_t)mm->m_ext.ext_buf +
7614da84431SAndre Oppermann 			      mm->m_ext.ext_size - mm->m_len;
7624da84431SAndre Oppermann 	}
7634da84431SAndre Oppermann 
7644da84431SAndre Oppermann 	/* Append/prepend as many mbuf (clusters) as necessary to fit len. */
7654da84431SAndre Oppermann 	if (!prep && len > M_TRAILINGSPACE(mm)) {
7664da84431SAndre Oppermann 		if (!m_getm(mm, len - M_TRAILINGSPACE(mm), how, MT_DATA))
7674da84431SAndre Oppermann 			return NULL;
7684da84431SAndre Oppermann 	}
7694da84431SAndre Oppermann 	if (prep && len > M_LEADINGSPACE(mm)) {
7704da84431SAndre Oppermann 		if (!(z = m_getm(NULL, len - M_LEADINGSPACE(mm), how, MT_DATA)))
7714da84431SAndre Oppermann 			return NULL;
7724da84431SAndre Oppermann 		i = 0;
7734da84431SAndre Oppermann 		for (x = z; x != NULL; x = x->m_next) {
7744da84431SAndre Oppermann 			i += x->m_flags & M_EXT ? x->m_ext.ext_size :
7754da84431SAndre Oppermann 			      (x->m_flags & M_PKTHDR ? MHLEN : MLEN);
7764da84431SAndre Oppermann 			if (!x->m_next)
7774da84431SAndre Oppermann 				break;
7784da84431SAndre Oppermann 		}
7794da84431SAndre Oppermann 		z->m_data += i - len;
7804da84431SAndre Oppermann 		m_move_pkthdr(mm, z);
7814da84431SAndre Oppermann 		x->m_next = mm;
7824da84431SAndre Oppermann 		mm = z;
7834da84431SAndre Oppermann 	}
7844da84431SAndre Oppermann 
7854da84431SAndre Oppermann 	/* Seek to start position in source mbuf. Optimization for long chains. */
7864da84431SAndre Oppermann 	while (off > 0) {
7874da84431SAndre Oppermann 		if (off < n->m_len)
7884da84431SAndre Oppermann 			break;
7894da84431SAndre Oppermann 		off -= n->m_len;
7904da84431SAndre Oppermann 		n = n->m_next;
7914da84431SAndre Oppermann 	}
7924da84431SAndre Oppermann 
7934da84431SAndre Oppermann 	/* Copy data into target mbuf. */
7944da84431SAndre Oppermann 	z = mm;
7954da84431SAndre Oppermann 	while (len > 0) {
7964da84431SAndre Oppermann 		KASSERT(z != NULL, ("m_copymdata, falling off target edge"));
7974da84431SAndre Oppermann 		i = M_TRAILINGSPACE(z);
7984da84431SAndre Oppermann 		m_apply(n, off, i, m_bcopyxxx, mtod(z, caddr_t) + z->m_len);
7994da84431SAndre Oppermann 		z->m_len += i;
8004da84431SAndre Oppermann 		/* fixup pkthdr.len if necessary */
8014da84431SAndre Oppermann 		if ((prep ? mm : m)->m_flags & M_PKTHDR)
8024da84431SAndre Oppermann 			(prep ? mm : m)->m_pkthdr.len += i;
8034da84431SAndre Oppermann 		off += i;
8044da84431SAndre Oppermann 		len -= i;
8054da84431SAndre Oppermann 		z = z->m_next;
8064da84431SAndre Oppermann 	}
8074da84431SAndre Oppermann 	return (prep ? mm : m);
8084da84431SAndre Oppermann }
8094da84431SAndre Oppermann 
8104da84431SAndre Oppermann /*
8116a06dea0SGarrett Wollman  * Copy an entire packet, including header (which must be present).
8126a06dea0SGarrett Wollman  * An optimization of the common case `m_copym(m, 0, M_COPYALL, how)'.
8131c38f2eaSArchie Cobbs  * Note that the copy is read-only, because clusters are not copied,
8141c38f2eaSArchie Cobbs  * only their reference counts are incremented.
8155fe86675SLuigi Rizzo  * Preserve alignment of the first mbuf so if the creator has left
8165fe86675SLuigi Rizzo  * some room at the beginning (e.g. for inserting protocol headers)
8175fe86675SLuigi Rizzo  * the copies still have the room available.
8186a06dea0SGarrett Wollman  */
8196a06dea0SGarrett Wollman struct mbuf *
820122a814aSBosko Milekic m_copypacket(struct mbuf *m, int how)
8216a06dea0SGarrett Wollman {
8226a06dea0SGarrett Wollman 	struct mbuf *top, *n, *o;
8236a06dea0SGarrett Wollman 
824063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(how);
825c95be8b5SGleb Smirnoff 	n = m_get(how, m->m_type);
8266a06dea0SGarrett Wollman 	top = n;
827122a814aSBosko Milekic 	if (n == NULL)
8286a06dea0SGarrett Wollman 		goto nospace;
8296a06dea0SGarrett Wollman 
8309967cafcSSam Leffler 	if (!m_dup_pkthdr(n, m, how))
8319967cafcSSam Leffler 		goto nospace;
8326a06dea0SGarrett Wollman 	n->m_len = m->m_len;
8336a06dea0SGarrett Wollman 	if (m->m_flags & M_EXT) {
8346a06dea0SGarrett Wollman 		n->m_data = m->m_data;
83556a4e45aSAndre Oppermann 		mb_dupcl(n, m);
8366a06dea0SGarrett Wollman 	} else {
8375fe86675SLuigi Rizzo 		n->m_data = n->m_pktdat + (m->m_data - m->m_pktdat );
8386a06dea0SGarrett Wollman 		bcopy(mtod(m, char *), mtod(n, char *), n->m_len);
8396a06dea0SGarrett Wollman 	}
8406a06dea0SGarrett Wollman 
8416a06dea0SGarrett Wollman 	m = m->m_next;
8426a06dea0SGarrett Wollman 	while (m) {
843c95be8b5SGleb Smirnoff 		o = m_get(how, m->m_type);
844122a814aSBosko Milekic 		if (o == NULL)
8456a06dea0SGarrett Wollman 			goto nospace;
8466a06dea0SGarrett Wollman 
8476a06dea0SGarrett Wollman 		n->m_next = o;
8486a06dea0SGarrett Wollman 		n = n->m_next;
8496a06dea0SGarrett Wollman 
8506a06dea0SGarrett Wollman 		n->m_len = m->m_len;
8516a06dea0SGarrett Wollman 		if (m->m_flags & M_EXT) {
8526a06dea0SGarrett Wollman 			n->m_data = m->m_data;
85356a4e45aSAndre Oppermann 			mb_dupcl(n, m);
8546a06dea0SGarrett Wollman 		} else {
8556a06dea0SGarrett Wollman 			bcopy(mtod(m, char *), mtod(n, char *), n->m_len);
8566a06dea0SGarrett Wollman 		}
8576a06dea0SGarrett Wollman 
8586a06dea0SGarrett Wollman 		m = m->m_next;
8596a06dea0SGarrett Wollman 	}
8606a06dea0SGarrett Wollman 	return top;
8616a06dea0SGarrett Wollman nospace:
8626a06dea0SGarrett Wollman 	m_freem(top);
863122a814aSBosko Milekic 	return (NULL);
8646a06dea0SGarrett Wollman }
8656a06dea0SGarrett Wollman 
8666a06dea0SGarrett Wollman /*
867df8bae1dSRodney W. Grimes  * Copy data from an mbuf chain starting "off" bytes from the beginning,
868df8bae1dSRodney W. Grimes  * continuing for "len" bytes, into the indicated buffer.
869df8bae1dSRodney W. Grimes  */
87026f9a767SRodney W. Grimes void
871a8cfc0eeSJulian Elischer m_copydata(const struct mbuf *m, int off, int len, caddr_t cp)
872df8bae1dSRodney W. Grimes {
873bd395ae8SBosko Milekic 	u_int count;
874df8bae1dSRodney W. Grimes 
875e0a653ddSAlfred Perlstein 	KASSERT(off >= 0, ("m_copydata, negative off %d", off));
876e0a653ddSAlfred Perlstein 	KASSERT(len >= 0, ("m_copydata, negative len %d", len));
877df8bae1dSRodney W. Grimes 	while (off > 0) {
878e0a653ddSAlfred Perlstein 		KASSERT(m != NULL, ("m_copydata, offset > size of mbuf chain"));
879df8bae1dSRodney W. Grimes 		if (off < m->m_len)
880df8bae1dSRodney W. Grimes 			break;
881df8bae1dSRodney W. Grimes 		off -= m->m_len;
882df8bae1dSRodney W. Grimes 		m = m->m_next;
883df8bae1dSRodney W. Grimes 	}
884df8bae1dSRodney W. Grimes 	while (len > 0) {
885e0a653ddSAlfred Perlstein 		KASSERT(m != NULL, ("m_copydata, length > size of mbuf chain"));
886df8bae1dSRodney W. Grimes 		count = min(m->m_len - off, len);
887df8bae1dSRodney W. Grimes 		bcopy(mtod(m, caddr_t) + off, cp, count);
888df8bae1dSRodney W. Grimes 		len -= count;
889df8bae1dSRodney W. Grimes 		cp += count;
890df8bae1dSRodney W. Grimes 		off = 0;
891df8bae1dSRodney W. Grimes 		m = m->m_next;
892df8bae1dSRodney W. Grimes 	}
893df8bae1dSRodney W. Grimes }
894df8bae1dSRodney W. Grimes 
895df8bae1dSRodney W. Grimes /*
8961c38f2eaSArchie Cobbs  * Copy a packet header mbuf chain into a completely new chain, including
8971c38f2eaSArchie Cobbs  * copying any mbuf clusters.  Use this instead of m_copypacket() when
8981c38f2eaSArchie Cobbs  * you need a writable copy of an mbuf chain.
8991c38f2eaSArchie Cobbs  */
9001c38f2eaSArchie Cobbs struct mbuf *
901122a814aSBosko Milekic m_dup(struct mbuf *m, int how)
9021c38f2eaSArchie Cobbs {
9031c38f2eaSArchie Cobbs 	struct mbuf **p, *top = NULL;
9041c38f2eaSArchie Cobbs 	int remain, moff, nsize;
9051c38f2eaSArchie Cobbs 
906063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(how);
9071c38f2eaSArchie Cobbs 	/* Sanity check */
9081c38f2eaSArchie Cobbs 	if (m == NULL)
909122a814aSBosko Milekic 		return (NULL);
910fe584538SDag-Erling Smørgrav 	M_ASSERTPKTHDR(m);
9111c38f2eaSArchie Cobbs 
9121c38f2eaSArchie Cobbs 	/* While there's more data, get a new mbuf, tack it on, and fill it */
9131c38f2eaSArchie Cobbs 	remain = m->m_pkthdr.len;
9141c38f2eaSArchie Cobbs 	moff = 0;
9151c38f2eaSArchie Cobbs 	p = &top;
9161c38f2eaSArchie Cobbs 	while (remain > 0 || top == NULL) {	/* allow m->m_pkthdr.len == 0 */
9171c38f2eaSArchie Cobbs 		struct mbuf *n;
9181c38f2eaSArchie Cobbs 
9191c38f2eaSArchie Cobbs 		/* Get the next new mbuf */
920099a0e58SBosko Milekic 		if (remain >= MINCLSIZE) {
921099a0e58SBosko Milekic 			n = m_getcl(how, m->m_type, 0);
922099a0e58SBosko Milekic 			nsize = MCLBYTES;
923099a0e58SBosko Milekic 		} else {
924099a0e58SBosko Milekic 			n = m_get(how, m->m_type);
925099a0e58SBosko Milekic 			nsize = MLEN;
926099a0e58SBosko Milekic 		}
9271c38f2eaSArchie Cobbs 		if (n == NULL)
9281c38f2eaSArchie Cobbs 			goto nospace;
929099a0e58SBosko Milekic 
930099a0e58SBosko Milekic 		if (top == NULL) {		/* First one, must be PKTHDR */
931099a0e58SBosko Milekic 			if (!m_dup_pkthdr(n, m, how)) {
932099a0e58SBosko Milekic 				m_free(n);
9331c38f2eaSArchie Cobbs 				goto nospace;
9341c38f2eaSArchie Cobbs 			}
93563e6f390SEd Maste 			if ((n->m_flags & M_EXT) == 0)
936099a0e58SBosko Milekic 				nsize = MHLEN;
9371c38f2eaSArchie Cobbs 		}
9381c38f2eaSArchie Cobbs 		n->m_len = 0;
9391c38f2eaSArchie Cobbs 
9401c38f2eaSArchie Cobbs 		/* Link it into the new chain */
9411c38f2eaSArchie Cobbs 		*p = n;
9421c38f2eaSArchie Cobbs 		p = &n->m_next;
9431c38f2eaSArchie Cobbs 
9441c38f2eaSArchie Cobbs 		/* Copy data from original mbuf(s) into new mbuf */
9451c38f2eaSArchie Cobbs 		while (n->m_len < nsize && m != NULL) {
9461c38f2eaSArchie Cobbs 			int chunk = min(nsize - n->m_len, m->m_len - moff);
9471c38f2eaSArchie Cobbs 
9481c38f2eaSArchie Cobbs 			bcopy(m->m_data + moff, n->m_data + n->m_len, chunk);
9491c38f2eaSArchie Cobbs 			moff += chunk;
9501c38f2eaSArchie Cobbs 			n->m_len += chunk;
9511c38f2eaSArchie Cobbs 			remain -= chunk;
9521c38f2eaSArchie Cobbs 			if (moff == m->m_len) {
9531c38f2eaSArchie Cobbs 				m = m->m_next;
9541c38f2eaSArchie Cobbs 				moff = 0;
9551c38f2eaSArchie Cobbs 			}
9561c38f2eaSArchie Cobbs 		}
9571c38f2eaSArchie Cobbs 
9581c38f2eaSArchie Cobbs 		/* Check correct total mbuf length */
9591c38f2eaSArchie Cobbs 		KASSERT((remain > 0 && m != NULL) || (remain == 0 && m == NULL),
960a48740b6SDavid E. O'Brien 		    	("%s: bogus m_pkthdr.len", __func__));
9611c38f2eaSArchie Cobbs 	}
9621c38f2eaSArchie Cobbs 	return (top);
9631c38f2eaSArchie Cobbs 
9641c38f2eaSArchie Cobbs nospace:
9651c38f2eaSArchie Cobbs 	m_freem(top);
966122a814aSBosko Milekic 	return (NULL);
9671c38f2eaSArchie Cobbs }
9681c38f2eaSArchie Cobbs 
9691c38f2eaSArchie Cobbs /*
970df8bae1dSRodney W. Grimes  * Concatenate mbuf chain n to m.
971df8bae1dSRodney W. Grimes  * Both chains must be of the same type (e.g. MT_DATA).
972df8bae1dSRodney W. Grimes  * Any m_pkthdr is not updated.
973df8bae1dSRodney W. Grimes  */
97426f9a767SRodney W. Grimes void
975122a814aSBosko Milekic m_cat(struct mbuf *m, struct mbuf *n)
976df8bae1dSRodney W. Grimes {
977df8bae1dSRodney W. Grimes 	while (m->m_next)
978df8bae1dSRodney W. Grimes 		m = m->m_next;
979df8bae1dSRodney W. Grimes 	while (n) {
98014d7c5b1SAndre Oppermann 		if (!M_WRITABLE(m) ||
98114d7c5b1SAndre Oppermann 		    M_TRAILINGSPACE(m) < n->m_len) {
982df8bae1dSRodney W. Grimes 			/* just join the two chains */
983df8bae1dSRodney W. Grimes 			m->m_next = n;
984df8bae1dSRodney W. Grimes 			return;
985df8bae1dSRodney W. Grimes 		}
986df8bae1dSRodney W. Grimes 		/* splat the data from one into the other */
987df8bae1dSRodney W. Grimes 		bcopy(mtod(n, caddr_t), mtod(m, caddr_t) + m->m_len,
988df8bae1dSRodney W. Grimes 		    (u_int)n->m_len);
989df8bae1dSRodney W. Grimes 		m->m_len += n->m_len;
990df8bae1dSRodney W. Grimes 		n = m_free(n);
991df8bae1dSRodney W. Grimes 	}
992df8bae1dSRodney W. Grimes }
993df8bae1dSRodney W. Grimes 
99426f9a767SRodney W. Grimes void
995122a814aSBosko Milekic m_adj(struct mbuf *mp, int req_len)
996df8bae1dSRodney W. Grimes {
997122a814aSBosko Milekic 	int len = req_len;
998122a814aSBosko Milekic 	struct mbuf *m;
999122a814aSBosko Milekic 	int count;
1000df8bae1dSRodney W. Grimes 
1001df8bae1dSRodney W. Grimes 	if ((m = mp) == NULL)
1002df8bae1dSRodney W. Grimes 		return;
1003df8bae1dSRodney W. Grimes 	if (len >= 0) {
1004df8bae1dSRodney W. Grimes 		/*
1005df8bae1dSRodney W. Grimes 		 * Trim from head.
1006df8bae1dSRodney W. Grimes 		 */
1007df8bae1dSRodney W. Grimes 		while (m != NULL && len > 0) {
1008df8bae1dSRodney W. Grimes 			if (m->m_len <= len) {
1009df8bae1dSRodney W. Grimes 				len -= m->m_len;
1010df8bae1dSRodney W. Grimes 				m->m_len = 0;
1011df8bae1dSRodney W. Grimes 				m = m->m_next;
1012df8bae1dSRodney W. Grimes 			} else {
1013df8bae1dSRodney W. Grimes 				m->m_len -= len;
1014df8bae1dSRodney W. Grimes 				m->m_data += len;
1015df8bae1dSRodney W. Grimes 				len = 0;
1016df8bae1dSRodney W. Grimes 			}
1017df8bae1dSRodney W. Grimes 		}
1018df8bae1dSRodney W. Grimes 		if (mp->m_flags & M_PKTHDR)
1019a83baab6SMarko Zec 			mp->m_pkthdr.len -= (req_len - len);
1020df8bae1dSRodney W. Grimes 	} else {
1021df8bae1dSRodney W. Grimes 		/*
1022df8bae1dSRodney W. Grimes 		 * Trim from tail.  Scan the mbuf chain,
1023df8bae1dSRodney W. Grimes 		 * calculating its length and finding the last mbuf.
1024df8bae1dSRodney W. Grimes 		 * If the adjustment only affects this mbuf, then just
1025df8bae1dSRodney W. Grimes 		 * adjust and return.  Otherwise, rescan and truncate
1026df8bae1dSRodney W. Grimes 		 * after the remaining size.
1027df8bae1dSRodney W. Grimes 		 */
1028df8bae1dSRodney W. Grimes 		len = -len;
1029df8bae1dSRodney W. Grimes 		count = 0;
1030df8bae1dSRodney W. Grimes 		for (;;) {
1031df8bae1dSRodney W. Grimes 			count += m->m_len;
1032df8bae1dSRodney W. Grimes 			if (m->m_next == (struct mbuf *)0)
1033df8bae1dSRodney W. Grimes 				break;
1034df8bae1dSRodney W. Grimes 			m = m->m_next;
1035df8bae1dSRodney W. Grimes 		}
1036df8bae1dSRodney W. Grimes 		if (m->m_len >= len) {
1037df8bae1dSRodney W. Grimes 			m->m_len -= len;
1038df8bae1dSRodney W. Grimes 			if (mp->m_flags & M_PKTHDR)
1039df8bae1dSRodney W. Grimes 				mp->m_pkthdr.len -= len;
1040df8bae1dSRodney W. Grimes 			return;
1041df8bae1dSRodney W. Grimes 		}
1042df8bae1dSRodney W. Grimes 		count -= len;
1043df8bae1dSRodney W. Grimes 		if (count < 0)
1044df8bae1dSRodney W. Grimes 			count = 0;
1045df8bae1dSRodney W. Grimes 		/*
1046df8bae1dSRodney W. Grimes 		 * Correct length for chain is "count".
1047df8bae1dSRodney W. Grimes 		 * Find the mbuf with last data, adjust its length,
1048df8bae1dSRodney W. Grimes 		 * and toss data from remaining mbufs on chain.
1049df8bae1dSRodney W. Grimes 		 */
1050df8bae1dSRodney W. Grimes 		m = mp;
1051df8bae1dSRodney W. Grimes 		if (m->m_flags & M_PKTHDR)
1052df8bae1dSRodney W. Grimes 			m->m_pkthdr.len = count;
1053df8bae1dSRodney W. Grimes 		for (; m; m = m->m_next) {
1054df8bae1dSRodney W. Grimes 			if (m->m_len >= count) {
1055df8bae1dSRodney W. Grimes 				m->m_len = count;
105659d8b310SSam Leffler 				if (m->m_next != NULL) {
105759d8b310SSam Leffler 					m_freem(m->m_next);
105859d8b310SSam Leffler 					m->m_next = NULL;
105959d8b310SSam Leffler 				}
1060df8bae1dSRodney W. Grimes 				break;
1061df8bae1dSRodney W. Grimes 			}
1062df8bae1dSRodney W. Grimes 			count -= m->m_len;
1063df8bae1dSRodney W. Grimes 		}
1064df8bae1dSRodney W. Grimes 	}
1065df8bae1dSRodney W. Grimes }
1066df8bae1dSRodney W. Grimes 
1067df8bae1dSRodney W. Grimes /*
1068df8bae1dSRodney W. Grimes  * Rearange an mbuf chain so that len bytes are contiguous
1069a2c36a02SKevin Lo  * and in the data area of an mbuf (so that mtod will work
1070a2c36a02SKevin Lo  * for a structure of size len).  Returns the resulting
1071df8bae1dSRodney W. Grimes  * mbuf chain on success, frees it and returns null on failure.
1072df8bae1dSRodney W. Grimes  * If there is room, it will add up to max_protohdr-len extra bytes to the
1073df8bae1dSRodney W. Grimes  * contiguous region in an attempt to avoid being called next time.
1074df8bae1dSRodney W. Grimes  */
1075df8bae1dSRodney W. Grimes struct mbuf *
1076122a814aSBosko Milekic m_pullup(struct mbuf *n, int len)
1077df8bae1dSRodney W. Grimes {
1078122a814aSBosko Milekic 	struct mbuf *m;
1079122a814aSBosko Milekic 	int count;
1080df8bae1dSRodney W. Grimes 	int space;
1081df8bae1dSRodney W. Grimes 
1082df8bae1dSRodney W. Grimes 	/*
1083df8bae1dSRodney W. Grimes 	 * If first mbuf has no cluster, and has room for len bytes
1084df8bae1dSRodney W. Grimes 	 * without shifting current data, pullup into it,
1085df8bae1dSRodney W. Grimes 	 * otherwise allocate a new mbuf to prepend to the chain.
1086df8bae1dSRodney W. Grimes 	 */
1087df8bae1dSRodney W. Grimes 	if ((n->m_flags & M_EXT) == 0 &&
1088df8bae1dSRodney W. Grimes 	    n->m_data + len < &n->m_dat[MLEN] && n->m_next) {
1089df8bae1dSRodney W. Grimes 		if (n->m_len >= len)
1090df8bae1dSRodney W. Grimes 			return (n);
1091df8bae1dSRodney W. Grimes 		m = n;
1092df8bae1dSRodney W. Grimes 		n = n->m_next;
1093df8bae1dSRodney W. Grimes 		len -= m->m_len;
1094df8bae1dSRodney W. Grimes 	} else {
1095df8bae1dSRodney W. Grimes 		if (len > MHLEN)
1096df8bae1dSRodney W. Grimes 			goto bad;
1097c95be8b5SGleb Smirnoff 		m = m_get(M_NOWAIT, n->m_type);
1098122a814aSBosko Milekic 		if (m == NULL)
1099df8bae1dSRodney W. Grimes 			goto bad;
11009967cafcSSam Leffler 		if (n->m_flags & M_PKTHDR)
1101c95be8b5SGleb Smirnoff 			m_move_pkthdr(m, n);
1102df8bae1dSRodney W. Grimes 	}
1103df8bae1dSRodney W. Grimes 	space = &m->m_dat[MLEN] - (m->m_data + m->m_len);
1104df8bae1dSRodney W. Grimes 	do {
1105df8bae1dSRodney W. Grimes 		count = min(min(max(len, max_protohdr), space), n->m_len);
1106df8bae1dSRodney W. Grimes 		bcopy(mtod(n, caddr_t), mtod(m, caddr_t) + m->m_len,
1107bd395ae8SBosko Milekic 		  (u_int)count);
1108df8bae1dSRodney W. Grimes 		len -= count;
1109df8bae1dSRodney W. Grimes 		m->m_len += count;
1110df8bae1dSRodney W. Grimes 		n->m_len -= count;
1111df8bae1dSRodney W. Grimes 		space -= count;
1112df8bae1dSRodney W. Grimes 		if (n->m_len)
1113df8bae1dSRodney W. Grimes 			n->m_data += count;
1114df8bae1dSRodney W. Grimes 		else
1115df8bae1dSRodney W. Grimes 			n = m_free(n);
1116df8bae1dSRodney W. Grimes 	} while (len > 0 && n);
1117df8bae1dSRodney W. Grimes 	if (len > 0) {
1118df8bae1dSRodney W. Grimes 		(void) m_free(m);
1119df8bae1dSRodney W. Grimes 		goto bad;
1120df8bae1dSRodney W. Grimes 	}
1121df8bae1dSRodney W. Grimes 	m->m_next = n;
1122df8bae1dSRodney W. Grimes 	return (m);
1123df8bae1dSRodney W. Grimes bad:
1124df8bae1dSRodney W. Grimes 	m_freem(n);
1125122a814aSBosko Milekic 	return (NULL);
1126df8bae1dSRodney W. Grimes }
1127df8bae1dSRodney W. Grimes 
1128df8bae1dSRodney W. Grimes /*
11297ac139a9SJohn-Mark Gurney  * Like m_pullup(), except a new mbuf is always allocated, and we allow
11307ac139a9SJohn-Mark Gurney  * the amount of empty space before the data in the new mbuf to be specified
11317ac139a9SJohn-Mark Gurney  * (in the event that the caller expects to prepend later).
11327ac139a9SJohn-Mark Gurney  */
11337ac139a9SJohn-Mark Gurney int MSFail;
11347ac139a9SJohn-Mark Gurney 
11357ac139a9SJohn-Mark Gurney struct mbuf *
11367ac139a9SJohn-Mark Gurney m_copyup(struct mbuf *n, int len, int dstoff)
11377ac139a9SJohn-Mark Gurney {
11387ac139a9SJohn-Mark Gurney 	struct mbuf *m;
11397ac139a9SJohn-Mark Gurney 	int count, space;
11407ac139a9SJohn-Mark Gurney 
11417ac139a9SJohn-Mark Gurney 	if (len > (MHLEN - dstoff))
11427ac139a9SJohn-Mark Gurney 		goto bad;
1143c95be8b5SGleb Smirnoff 	m = m_get(M_NOWAIT, n->m_type);
11447ac139a9SJohn-Mark Gurney 	if (m == NULL)
11457ac139a9SJohn-Mark Gurney 		goto bad;
11467ac139a9SJohn-Mark Gurney 	if (n->m_flags & M_PKTHDR)
1147c95be8b5SGleb Smirnoff 		m_move_pkthdr(m, n);
11487ac139a9SJohn-Mark Gurney 	m->m_data += dstoff;
11497ac139a9SJohn-Mark Gurney 	space = &m->m_dat[MLEN] - (m->m_data + m->m_len);
11507ac139a9SJohn-Mark Gurney 	do {
11517ac139a9SJohn-Mark Gurney 		count = min(min(max(len, max_protohdr), space), n->m_len);
11527ac139a9SJohn-Mark Gurney 		memcpy(mtod(m, caddr_t) + m->m_len, mtod(n, caddr_t),
11537ac139a9SJohn-Mark Gurney 		    (unsigned)count);
11547ac139a9SJohn-Mark Gurney 		len -= count;
11557ac139a9SJohn-Mark Gurney 		m->m_len += count;
11567ac139a9SJohn-Mark Gurney 		n->m_len -= count;
11577ac139a9SJohn-Mark Gurney 		space -= count;
11587ac139a9SJohn-Mark Gurney 		if (n->m_len)
11597ac139a9SJohn-Mark Gurney 			n->m_data += count;
11607ac139a9SJohn-Mark Gurney 		else
11617ac139a9SJohn-Mark Gurney 			n = m_free(n);
11627ac139a9SJohn-Mark Gurney 	} while (len > 0 && n);
11637ac139a9SJohn-Mark Gurney 	if (len > 0) {
11647ac139a9SJohn-Mark Gurney 		(void) m_free(m);
11657ac139a9SJohn-Mark Gurney 		goto bad;
11667ac139a9SJohn-Mark Gurney 	}
11677ac139a9SJohn-Mark Gurney 	m->m_next = n;
11687ac139a9SJohn-Mark Gurney 	return (m);
11697ac139a9SJohn-Mark Gurney  bad:
11707ac139a9SJohn-Mark Gurney 	m_freem(n);
11717ac139a9SJohn-Mark Gurney 	MSFail++;
11727ac139a9SJohn-Mark Gurney 	return (NULL);
11737ac139a9SJohn-Mark Gurney }
11747ac139a9SJohn-Mark Gurney 
11757ac139a9SJohn-Mark Gurney /*
1176df8bae1dSRodney W. Grimes  * Partition an mbuf chain in two pieces, returning the tail --
1177df8bae1dSRodney W. Grimes  * all but the first len0 bytes.  In case of failure, it returns NULL and
1178df8bae1dSRodney W. Grimes  * attempts to restore the chain to its original state.
117948d183faSArchie Cobbs  *
118048d183faSArchie Cobbs  * Note that the resulting mbufs might be read-only, because the new
118148d183faSArchie Cobbs  * mbuf can end up sharing an mbuf cluster with the original mbuf if
118248d183faSArchie Cobbs  * the "breaking point" happens to lie within a cluster mbuf. Use the
118348d183faSArchie Cobbs  * M_WRITABLE() macro to check for this case.
1184df8bae1dSRodney W. Grimes  */
1185df8bae1dSRodney W. Grimes struct mbuf *
1186122a814aSBosko Milekic m_split(struct mbuf *m0, int len0, int wait)
1187df8bae1dSRodney W. Grimes {
1188122a814aSBosko Milekic 	struct mbuf *m, *n;
1189bd395ae8SBosko Milekic 	u_int len = len0, remain;
1190df8bae1dSRodney W. Grimes 
1191063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(wait);
1192df8bae1dSRodney W. Grimes 	for (m = m0; m && len > m->m_len; m = m->m_next)
1193df8bae1dSRodney W. Grimes 		len -= m->m_len;
1194122a814aSBosko Milekic 	if (m == NULL)
1195122a814aSBosko Milekic 		return (NULL);
1196df8bae1dSRodney W. Grimes 	remain = m->m_len - len;
119721f39848SGleb Smirnoff 	if (m0->m_flags & M_PKTHDR && remain == 0) {
119821f39848SGleb Smirnoff 		n = m_gethdr(wait, m0->m_type);
119977badb18SGleb Smirnoff 		if (n == NULL)
120021f39848SGleb Smirnoff 			return (NULL);
120121f39848SGleb Smirnoff 		n->m_next = m->m_next;
120221f39848SGleb Smirnoff 		m->m_next = NULL;
120321f39848SGleb Smirnoff 		n->m_pkthdr.rcvif = m0->m_pkthdr.rcvif;
120421f39848SGleb Smirnoff 		n->m_pkthdr.len = m0->m_pkthdr.len - len0;
120521f39848SGleb Smirnoff 		m0->m_pkthdr.len = len0;
120621f39848SGleb Smirnoff 		return (n);
120721f39848SGleb Smirnoff 	} else if (m0->m_flags & M_PKTHDR) {
1208c95be8b5SGleb Smirnoff 		n = m_gethdr(wait, m0->m_type);
1209122a814aSBosko Milekic 		if (n == NULL)
1210122a814aSBosko Milekic 			return (NULL);
1211df8bae1dSRodney W. Grimes 		n->m_pkthdr.rcvif = m0->m_pkthdr.rcvif;
1212df8bae1dSRodney W. Grimes 		n->m_pkthdr.len = m0->m_pkthdr.len - len0;
1213df8bae1dSRodney W. Grimes 		m0->m_pkthdr.len = len0;
1214df8bae1dSRodney W. Grimes 		if (m->m_flags & M_EXT)
1215df8bae1dSRodney W. Grimes 			goto extpacket;
1216df8bae1dSRodney W. Grimes 		if (remain > MHLEN) {
1217df8bae1dSRodney W. Grimes 			/* m can't be the lead packet */
1218df8bae1dSRodney W. Grimes 			MH_ALIGN(n, 0);
1219df8bae1dSRodney W. Grimes 			n->m_next = m_split(m, len, wait);
1220122a814aSBosko Milekic 			if (n->m_next == NULL) {
1221df8bae1dSRodney W. Grimes 				(void) m_free(n);
1222122a814aSBosko Milekic 				return (NULL);
122340376987SJeffrey Hsu 			} else {
122440376987SJeffrey Hsu 				n->m_len = 0;
1225df8bae1dSRodney W. Grimes 				return (n);
122640376987SJeffrey Hsu 			}
1227df8bae1dSRodney W. Grimes 		} else
1228df8bae1dSRodney W. Grimes 			MH_ALIGN(n, remain);
1229df8bae1dSRodney W. Grimes 	} else if (remain == 0) {
1230df8bae1dSRodney W. Grimes 		n = m->m_next;
1231122a814aSBosko Milekic 		m->m_next = NULL;
1232df8bae1dSRodney W. Grimes 		return (n);
1233df8bae1dSRodney W. Grimes 	} else {
1234c95be8b5SGleb Smirnoff 		n = m_get(wait, m->m_type);
1235122a814aSBosko Milekic 		if (n == NULL)
1236122a814aSBosko Milekic 			return (NULL);
1237df8bae1dSRodney W. Grimes 		M_ALIGN(n, remain);
1238df8bae1dSRodney W. Grimes 	}
1239df8bae1dSRodney W. Grimes extpacket:
1240df8bae1dSRodney W. Grimes 	if (m->m_flags & M_EXT) {
1241df8bae1dSRodney W. Grimes 		n->m_data = m->m_data + len;
124256a4e45aSAndre Oppermann 		mb_dupcl(n, m);
1243df8bae1dSRodney W. Grimes 	} else {
1244df8bae1dSRodney W. Grimes 		bcopy(mtod(m, caddr_t) + len, mtod(n, caddr_t), remain);
1245df8bae1dSRodney W. Grimes 	}
1246df8bae1dSRodney W. Grimes 	n->m_len = remain;
1247df8bae1dSRodney W. Grimes 	m->m_len = len;
1248df8bae1dSRodney W. Grimes 	n->m_next = m->m_next;
1249122a814aSBosko Milekic 	m->m_next = NULL;
1250df8bae1dSRodney W. Grimes 	return (n);
1251df8bae1dSRodney W. Grimes }
1252df8bae1dSRodney W. Grimes /*
1253df8bae1dSRodney W. Grimes  * Routine to copy from device local memory into mbufs.
1254f5eece3fSBosko Milekic  * Note that `off' argument is offset into first mbuf of target chain from
1255f5eece3fSBosko Milekic  * which to begin copying the data to.
1256df8bae1dSRodney W. Grimes  */
1257df8bae1dSRodney W. Grimes struct mbuf *
1258f5eece3fSBosko Milekic m_devget(char *buf, int totlen, int off, struct ifnet *ifp,
1259122a814aSBosko Milekic     void (*copy)(char *from, caddr_t to, u_int len))
1260df8bae1dSRodney W. Grimes {
1261122a814aSBosko Milekic 	struct mbuf *m;
1262099a0e58SBosko Milekic 	struct mbuf *top = NULL, **mp = &top;
1263f5eece3fSBosko Milekic 	int len;
1264df8bae1dSRodney W. Grimes 
1265f5eece3fSBosko Milekic 	if (off < 0 || off > MHLEN)
1266f5eece3fSBosko Milekic 		return (NULL);
1267f5eece3fSBosko Milekic 
1268df8bae1dSRodney W. Grimes 	while (totlen > 0) {
1269099a0e58SBosko Milekic 		if (top == NULL) {	/* First one, must be PKTHDR */
1270f5eece3fSBosko Milekic 			if (totlen + off >= MINCLSIZE) {
1271eb1b1807SGleb Smirnoff 				m = m_getcl(M_NOWAIT, MT_DATA, M_PKTHDR);
1272f5eece3fSBosko Milekic 				len = MCLBYTES;
1273df8bae1dSRodney W. Grimes 			} else {
1274eb1b1807SGleb Smirnoff 				m = m_gethdr(M_NOWAIT, MT_DATA);
1275099a0e58SBosko Milekic 				len = MHLEN;
1276099a0e58SBosko Milekic 
1277099a0e58SBosko Milekic 				/* Place initial small packet/header at end of mbuf */
1278099a0e58SBosko Milekic 				if (m && totlen + off + max_linkhdr <= MLEN) {
1279df8bae1dSRodney W. Grimes 					m->m_data += max_linkhdr;
1280f5eece3fSBosko Milekic 					len -= max_linkhdr;
1281df8bae1dSRodney W. Grimes 				}
1282f5eece3fSBosko Milekic 			}
1283099a0e58SBosko Milekic 			if (m == NULL)
1284099a0e58SBosko Milekic 				return NULL;
1285099a0e58SBosko Milekic 			m->m_pkthdr.rcvif = ifp;
1286099a0e58SBosko Milekic 			m->m_pkthdr.len = totlen;
1287099a0e58SBosko Milekic 		} else {
1288099a0e58SBosko Milekic 			if (totlen + off >= MINCLSIZE) {
1289eb1b1807SGleb Smirnoff 				m = m_getcl(M_NOWAIT, MT_DATA, 0);
1290099a0e58SBosko Milekic 				len = MCLBYTES;
1291099a0e58SBosko Milekic 			} else {
1292eb1b1807SGleb Smirnoff 				m = m_get(M_NOWAIT, MT_DATA);
1293099a0e58SBosko Milekic 				len = MLEN;
1294099a0e58SBosko Milekic 			}
1295099a0e58SBosko Milekic 			if (m == NULL) {
1296099a0e58SBosko Milekic 				m_freem(top);
1297099a0e58SBosko Milekic 				return NULL;
1298099a0e58SBosko Milekic 			}
1299099a0e58SBosko Milekic 		}
1300f5eece3fSBosko Milekic 		if (off) {
1301f5eece3fSBosko Milekic 			m->m_data += off;
1302f5eece3fSBosko Milekic 			len -= off;
1303f5eece3fSBosko Milekic 			off = 0;
1304f5eece3fSBosko Milekic 		}
1305f5eece3fSBosko Milekic 		m->m_len = len = min(totlen, len);
1306df8bae1dSRodney W. Grimes 		if (copy)
1307bd395ae8SBosko Milekic 			copy(buf, mtod(m, caddr_t), (u_int)len);
1308df8bae1dSRodney W. Grimes 		else
1309bd395ae8SBosko Milekic 			bcopy(buf, mtod(m, caddr_t), (u_int)len);
1310f5eece3fSBosko Milekic 		buf += len;
1311df8bae1dSRodney W. Grimes 		*mp = m;
1312df8bae1dSRodney W. Grimes 		mp = &m->m_next;
1313df8bae1dSRodney W. Grimes 		totlen -= len;
1314df8bae1dSRodney W. Grimes 	}
1315df8bae1dSRodney W. Grimes 	return (top);
1316df8bae1dSRodney W. Grimes }
1317c5789ba3SPoul-Henning Kamp 
1318c5789ba3SPoul-Henning Kamp /*
1319c5789ba3SPoul-Henning Kamp  * Copy data from a buffer back into the indicated mbuf chain,
1320c5789ba3SPoul-Henning Kamp  * starting "off" bytes from the beginning, extending the mbuf
1321c5789ba3SPoul-Henning Kamp  * chain if necessary.
1322c5789ba3SPoul-Henning Kamp  */
1323c5789ba3SPoul-Henning Kamp void
132424665342SLuigi Rizzo m_copyback(struct mbuf *m0, int off, int len, c_caddr_t cp)
1325c5789ba3SPoul-Henning Kamp {
1326122a814aSBosko Milekic 	int mlen;
1327122a814aSBosko Milekic 	struct mbuf *m = m0, *n;
1328c5789ba3SPoul-Henning Kamp 	int totlen = 0;
1329c5789ba3SPoul-Henning Kamp 
1330122a814aSBosko Milekic 	if (m0 == NULL)
1331c5789ba3SPoul-Henning Kamp 		return;
1332c5789ba3SPoul-Henning Kamp 	while (off > (mlen = m->m_len)) {
1333c5789ba3SPoul-Henning Kamp 		off -= mlen;
1334c5789ba3SPoul-Henning Kamp 		totlen += mlen;
1335122a814aSBosko Milekic 		if (m->m_next == NULL) {
1336eb1b1807SGleb Smirnoff 			n = m_get(M_NOWAIT, m->m_type);
1337122a814aSBosko Milekic 			if (n == NULL)
1338c5789ba3SPoul-Henning Kamp 				goto out;
1339099a0e58SBosko Milekic 			bzero(mtod(n, caddr_t), MLEN);
1340c5789ba3SPoul-Henning Kamp 			n->m_len = min(MLEN, len + off);
1341c5789ba3SPoul-Henning Kamp 			m->m_next = n;
1342c5789ba3SPoul-Henning Kamp 		}
1343c5789ba3SPoul-Henning Kamp 		m = m->m_next;
1344c5789ba3SPoul-Henning Kamp 	}
1345c5789ba3SPoul-Henning Kamp 	while (len > 0) {
1346129c5c81SAlexander Motin 		if (m->m_next == NULL && (len > m->m_len - off)) {
1347129c5c81SAlexander Motin 			m->m_len += min(len - (m->m_len - off),
1348129c5c81SAlexander Motin 			    M_TRAILINGSPACE(m));
1349129c5c81SAlexander Motin 		}
1350c5789ba3SPoul-Henning Kamp 		mlen = min (m->m_len - off, len);
1351bd395ae8SBosko Milekic 		bcopy(cp, off + mtod(m, caddr_t), (u_int)mlen);
1352c5789ba3SPoul-Henning Kamp 		cp += mlen;
1353c5789ba3SPoul-Henning Kamp 		len -= mlen;
1354c5789ba3SPoul-Henning Kamp 		mlen += off;
1355c5789ba3SPoul-Henning Kamp 		off = 0;
1356c5789ba3SPoul-Henning Kamp 		totlen += mlen;
1357c5789ba3SPoul-Henning Kamp 		if (len == 0)
1358c5789ba3SPoul-Henning Kamp 			break;
1359122a814aSBosko Milekic 		if (m->m_next == NULL) {
1360eb1b1807SGleb Smirnoff 			n = m_get(M_NOWAIT, m->m_type);
1361122a814aSBosko Milekic 			if (n == NULL)
1362c5789ba3SPoul-Henning Kamp 				break;
1363c5789ba3SPoul-Henning Kamp 			n->m_len = min(MLEN, len);
1364c5789ba3SPoul-Henning Kamp 			m->m_next = n;
1365c5789ba3SPoul-Henning Kamp 		}
1366c5789ba3SPoul-Henning Kamp 		m = m->m_next;
1367c5789ba3SPoul-Henning Kamp 	}
1368c5789ba3SPoul-Henning Kamp out:	if (((m = m0)->m_flags & M_PKTHDR) && (m->m_pkthdr.len < totlen))
1369c5789ba3SPoul-Henning Kamp 		m->m_pkthdr.len = totlen;
1370c5789ba3SPoul-Henning Kamp }
1371ce4a64f7SPoul-Henning Kamp 
137237621fd5SBruce M Simpson /*
13734873d175SSam Leffler  * Append the specified data to the indicated mbuf chain,
13744873d175SSam Leffler  * Extend the mbuf chain if the new data does not fit in
13754873d175SSam Leffler  * existing space.
13764873d175SSam Leffler  *
13774873d175SSam Leffler  * Return 1 if able to complete the job; otherwise 0.
13784873d175SSam Leffler  */
13794873d175SSam Leffler int
13804873d175SSam Leffler m_append(struct mbuf *m0, int len, c_caddr_t cp)
13814873d175SSam Leffler {
13824873d175SSam Leffler 	struct mbuf *m, *n;
13834873d175SSam Leffler 	int remainder, space;
13844873d175SSam Leffler 
13854873d175SSam Leffler 	for (m = m0; m->m_next != NULL; m = m->m_next)
13864873d175SSam Leffler 		;
13874873d175SSam Leffler 	remainder = len;
13884873d175SSam Leffler 	space = M_TRAILINGSPACE(m);
13894873d175SSam Leffler 	if (space > 0) {
13904873d175SSam Leffler 		/*
13914873d175SSam Leffler 		 * Copy into available space.
13924873d175SSam Leffler 		 */
13934873d175SSam Leffler 		if (space > remainder)
13944873d175SSam Leffler 			space = remainder;
13954873d175SSam Leffler 		bcopy(cp, mtod(m, caddr_t) + m->m_len, space);
13964873d175SSam Leffler 		m->m_len += space;
13974873d175SSam Leffler 		cp += space, remainder -= space;
13984873d175SSam Leffler 	}
13994873d175SSam Leffler 	while (remainder > 0) {
14004873d175SSam Leffler 		/*
14014873d175SSam Leffler 		 * Allocate a new mbuf; could check space
14024873d175SSam Leffler 		 * and allocate a cluster instead.
14034873d175SSam Leffler 		 */
1404eb1b1807SGleb Smirnoff 		n = m_get(M_NOWAIT, m->m_type);
14054873d175SSam Leffler 		if (n == NULL)
14064873d175SSam Leffler 			break;
14074873d175SSam Leffler 		n->m_len = min(MLEN, remainder);
1408a37c415eSSam Leffler 		bcopy(cp, mtod(n, caddr_t), n->m_len);
1409a37c415eSSam Leffler 		cp += n->m_len, remainder -= n->m_len;
14104873d175SSam Leffler 		m->m_next = n;
14114873d175SSam Leffler 		m = n;
14124873d175SSam Leffler 	}
14134873d175SSam Leffler 	if (m0->m_flags & M_PKTHDR)
14144873d175SSam Leffler 		m0->m_pkthdr.len += len - remainder;
14154873d175SSam Leffler 	return (remainder == 0);
14164873d175SSam Leffler }
14174873d175SSam Leffler 
14184873d175SSam Leffler /*
141937621fd5SBruce M Simpson  * Apply function f to the data in an mbuf chain starting "off" bytes from
142037621fd5SBruce M Simpson  * the beginning, continuing for "len" bytes.
142137621fd5SBruce M Simpson  */
142237621fd5SBruce M Simpson int
142337621fd5SBruce M Simpson m_apply(struct mbuf *m, int off, int len,
142454065297SBruce M Simpson     int (*f)(void *, void *, u_int), void *arg)
142537621fd5SBruce M Simpson {
142654065297SBruce M Simpson 	u_int count;
142737621fd5SBruce M Simpson 	int rval;
142837621fd5SBruce M Simpson 
142937621fd5SBruce M Simpson 	KASSERT(off >= 0, ("m_apply, negative off %d", off));
143037621fd5SBruce M Simpson 	KASSERT(len >= 0, ("m_apply, negative len %d", len));
143137621fd5SBruce M Simpson 	while (off > 0) {
143237621fd5SBruce M Simpson 		KASSERT(m != NULL, ("m_apply, offset > size of mbuf chain"));
143337621fd5SBruce M Simpson 		if (off < m->m_len)
143437621fd5SBruce M Simpson 			break;
143537621fd5SBruce M Simpson 		off -= m->m_len;
143637621fd5SBruce M Simpson 		m = m->m_next;
143737621fd5SBruce M Simpson 	}
143837621fd5SBruce M Simpson 	while (len > 0) {
143937621fd5SBruce M Simpson 		KASSERT(m != NULL, ("m_apply, offset > size of mbuf chain"));
144037621fd5SBruce M Simpson 		count = min(m->m_len - off, len);
144137621fd5SBruce M Simpson 		rval = (*f)(arg, mtod(m, caddr_t) + off, count);
144237621fd5SBruce M Simpson 		if (rval)
144337621fd5SBruce M Simpson 			return (rval);
144437621fd5SBruce M Simpson 		len -= count;
144537621fd5SBruce M Simpson 		off = 0;
144637621fd5SBruce M Simpson 		m = m->m_next;
144737621fd5SBruce M Simpson 	}
144837621fd5SBruce M Simpson 	return (0);
144937621fd5SBruce M Simpson }
145037621fd5SBruce M Simpson 
145137621fd5SBruce M Simpson /*
145237621fd5SBruce M Simpson  * Return a pointer to mbuf/offset of location in mbuf chain.
145337621fd5SBruce M Simpson  */
145437621fd5SBruce M Simpson struct mbuf *
145537621fd5SBruce M Simpson m_getptr(struct mbuf *m, int loc, int *off)
145637621fd5SBruce M Simpson {
145737621fd5SBruce M Simpson 
145837621fd5SBruce M Simpson 	while (loc >= 0) {
145954065297SBruce M Simpson 		/* Normal end of search. */
146037621fd5SBruce M Simpson 		if (m->m_len > loc) {
146137621fd5SBruce M Simpson 			*off = loc;
146237621fd5SBruce M Simpson 			return (m);
146337621fd5SBruce M Simpson 		} else {
146437621fd5SBruce M Simpson 			loc -= m->m_len;
146537621fd5SBruce M Simpson 			if (m->m_next == NULL) {
146637621fd5SBruce M Simpson 				if (loc == 0) {
146754065297SBruce M Simpson 					/* Point at the end of valid data. */
146837621fd5SBruce M Simpson 					*off = m->m_len;
146937621fd5SBruce M Simpson 					return (m);
147054065297SBruce M Simpson 				}
147137621fd5SBruce M Simpson 				return (NULL);
147254065297SBruce M Simpson 			}
147337621fd5SBruce M Simpson 			m = m->m_next;
147437621fd5SBruce M Simpson 		}
147537621fd5SBruce M Simpson 	}
147637621fd5SBruce M Simpson 	return (NULL);
147737621fd5SBruce M Simpson }
147837621fd5SBruce M Simpson 
1479ce4a64f7SPoul-Henning Kamp void
14807b125090SJohn-Mark Gurney m_print(const struct mbuf *m, int maxlen)
1481ce4a64f7SPoul-Henning Kamp {
1482ce4a64f7SPoul-Henning Kamp 	int len;
14837b125090SJohn-Mark Gurney 	int pdata;
14846357e7b5SEivind Eklund 	const struct mbuf *m2;
1485ce4a64f7SPoul-Henning Kamp 
14867e949c46SKenneth D. Merry 	if (m == NULL) {
14877e949c46SKenneth D. Merry 		printf("mbuf: %p\n", m);
14887e949c46SKenneth D. Merry 		return;
14897e949c46SKenneth D. Merry 	}
14907e949c46SKenneth D. Merry 
14917b125090SJohn-Mark Gurney 	if (m->m_flags & M_PKTHDR)
1492ce4a64f7SPoul-Henning Kamp 		len = m->m_pkthdr.len;
14937b125090SJohn-Mark Gurney 	else
14947b125090SJohn-Mark Gurney 		len = -1;
1495ce4a64f7SPoul-Henning Kamp 	m2 = m;
14967b125090SJohn-Mark Gurney 	while (m2 != NULL && (len == -1 || len)) {
14977b125090SJohn-Mark Gurney 		pdata = m2->m_len;
14987b125090SJohn-Mark Gurney 		if (maxlen != -1 && pdata > maxlen)
14997b125090SJohn-Mark Gurney 			pdata = maxlen;
15007b125090SJohn-Mark Gurney 		printf("mbuf: %p len: %d, next: %p, %b%s", m2, m2->m_len,
15017b125090SJohn-Mark Gurney 		    m2->m_next, m2->m_flags, "\20\20freelist\17skipfw"
15027b125090SJohn-Mark Gurney 		    "\11proto5\10proto4\7proto3\6proto2\5proto1\4rdonly"
15037b125090SJohn-Mark Gurney 		    "\3eor\2pkthdr\1ext", pdata ? "" : "\n");
15047b125090SJohn-Mark Gurney 		if (pdata)
150545e0d0aaSJohn-Mark Gurney 			printf(", %*D\n", pdata, (u_char *)m2->m_data, "-");
15067b125090SJohn-Mark Gurney 		if (len != -1)
1507ce4a64f7SPoul-Henning Kamp 			len -= m2->m_len;
1508ce4a64f7SPoul-Henning Kamp 		m2 = m2->m_next;
1509ce4a64f7SPoul-Henning Kamp 	}
15107b125090SJohn-Mark Gurney 	if (len > 0)
15117b125090SJohn-Mark Gurney 		printf("%d bytes unaccounted for.\n", len);
1512ce4a64f7SPoul-Henning Kamp 	return;
1513ce4a64f7SPoul-Henning Kamp }
15143f2e06c5SPoul-Henning Kamp 
1515bd395ae8SBosko Milekic u_int
15163f2e06c5SPoul-Henning Kamp m_fixhdr(struct mbuf *m0)
15173f2e06c5SPoul-Henning Kamp {
1518bd395ae8SBosko Milekic 	u_int len;
15193f2e06c5SPoul-Henning Kamp 
1520ac6e585dSPoul-Henning Kamp 	len = m_length(m0, NULL);
15213f2e06c5SPoul-Henning Kamp 	m0->m_pkthdr.len = len;
1522ac6e585dSPoul-Henning Kamp 	return (len);
1523ac6e585dSPoul-Henning Kamp }
1524ac6e585dSPoul-Henning Kamp 
1525bd395ae8SBosko Milekic u_int
1526ac6e585dSPoul-Henning Kamp m_length(struct mbuf *m0, struct mbuf **last)
1527ac6e585dSPoul-Henning Kamp {
1528ac6e585dSPoul-Henning Kamp 	struct mbuf *m;
1529bd395ae8SBosko Milekic 	u_int len;
1530ac6e585dSPoul-Henning Kamp 
1531ac6e585dSPoul-Henning Kamp 	len = 0;
1532ac6e585dSPoul-Henning Kamp 	for (m = m0; m != NULL; m = m->m_next) {
1533ac6e585dSPoul-Henning Kamp 		len += m->m_len;
1534ac6e585dSPoul-Henning Kamp 		if (m->m_next == NULL)
1535ac6e585dSPoul-Henning Kamp 			break;
1536ac6e585dSPoul-Henning Kamp 	}
1537ac6e585dSPoul-Henning Kamp 	if (last != NULL)
1538ac6e585dSPoul-Henning Kamp 		*last = m;
1539ac6e585dSPoul-Henning Kamp 	return (len);
15403f2e06c5SPoul-Henning Kamp }
154155e9f80dSMike Silbersack 
154255e9f80dSMike Silbersack /*
154355e9f80dSMike Silbersack  * Defragment a mbuf chain, returning the shortest possible
154455e9f80dSMike Silbersack  * chain of mbufs and clusters.  If allocation fails and
154555e9f80dSMike Silbersack  * this cannot be completed, NULL will be returned, but
154655e9f80dSMike Silbersack  * the passed in chain will be unchanged.  Upon success,
154755e9f80dSMike Silbersack  * the original chain will be freed, and the new chain
154855e9f80dSMike Silbersack  * will be returned.
154955e9f80dSMike Silbersack  *
155055e9f80dSMike Silbersack  * If a non-packet header is passed in, the original
155155e9f80dSMike Silbersack  * mbuf (chain?) will be returned unharmed.
155255e9f80dSMike Silbersack  */
155355e9f80dSMike Silbersack struct mbuf *
155455e9f80dSMike Silbersack m_defrag(struct mbuf *m0, int how)
155555e9f80dSMike Silbersack {
155655e9f80dSMike Silbersack 	struct mbuf *m_new = NULL, *m_final = NULL;
155755e9f80dSMike Silbersack 	int progress = 0, length;
155855e9f80dSMike Silbersack 
1559063d8114SAlfred Perlstein 	MBUF_CHECKSLEEP(how);
156055e9f80dSMike Silbersack 	if (!(m0->m_flags & M_PKTHDR))
156155e9f80dSMike Silbersack 		return (m0);
156255e9f80dSMike Silbersack 
1563f8bf8e39SMike Silbersack 	m_fixhdr(m0); /* Needed sanity check */
1564f8bf8e39SMike Silbersack 
1565352d050eSMike Silbersack #ifdef MBUF_STRESS_TEST
1566352d050eSMike Silbersack 	if (m_defragrandomfailures) {
1567352d050eSMike Silbersack 		int temp = arc4random() & 0xff;
1568352d050eSMike Silbersack 		if (temp == 0xba)
1569352d050eSMike Silbersack 			goto nospace;
1570352d050eSMike Silbersack 	}
1571352d050eSMike Silbersack #endif
157255e9f80dSMike Silbersack 
157355e9f80dSMike Silbersack 	if (m0->m_pkthdr.len > MHLEN)
157455e9f80dSMike Silbersack 		m_final = m_getcl(how, MT_DATA, M_PKTHDR);
157555e9f80dSMike Silbersack 	else
157655e9f80dSMike Silbersack 		m_final = m_gethdr(how, MT_DATA);
157755e9f80dSMike Silbersack 
157855e9f80dSMike Silbersack 	if (m_final == NULL)
157955e9f80dSMike Silbersack 		goto nospace;
158055e9f80dSMike Silbersack 
1581a89ec05eSPeter Wemm 	if (m_dup_pkthdr(m_final, m0, how) == 0)
158255e9f80dSMike Silbersack 		goto nospace;
158355e9f80dSMike Silbersack 
158455e9f80dSMike Silbersack 	m_new = m_final;
158555e9f80dSMike Silbersack 
158655e9f80dSMike Silbersack 	while (progress < m0->m_pkthdr.len) {
158755e9f80dSMike Silbersack 		length = m0->m_pkthdr.len - progress;
158855e9f80dSMike Silbersack 		if (length > MCLBYTES)
158955e9f80dSMike Silbersack 			length = MCLBYTES;
159055e9f80dSMike Silbersack 
159155e9f80dSMike Silbersack 		if (m_new == NULL) {
159255e9f80dSMike Silbersack 			if (length > MLEN)
159355e9f80dSMike Silbersack 				m_new = m_getcl(how, MT_DATA, 0);
159455e9f80dSMike Silbersack 			else
159555e9f80dSMike Silbersack 				m_new = m_get(how, MT_DATA);
159655e9f80dSMike Silbersack 			if (m_new == NULL)
159755e9f80dSMike Silbersack 				goto nospace;
159855e9f80dSMike Silbersack 		}
159955e9f80dSMike Silbersack 
160055e9f80dSMike Silbersack 		m_copydata(m0, progress, length, mtod(m_new, caddr_t));
160155e9f80dSMike Silbersack 		progress += length;
160255e9f80dSMike Silbersack 		m_new->m_len = length;
160355e9f80dSMike Silbersack 		if (m_new != m_final)
160455e9f80dSMike Silbersack 			m_cat(m_final, m_new);
160555e9f80dSMike Silbersack 		m_new = NULL;
160655e9f80dSMike Silbersack 	}
160751710a45SMike Silbersack #ifdef MBUF_STRESS_TEST
160855e9f80dSMike Silbersack 	if (m0->m_next == NULL)
160955e9f80dSMike Silbersack 		m_defraguseless++;
161051710a45SMike Silbersack #endif
161155e9f80dSMike Silbersack 	m_freem(m0);
161255e9f80dSMike Silbersack 	m0 = m_final;
161351710a45SMike Silbersack #ifdef MBUF_STRESS_TEST
161455e9f80dSMike Silbersack 	m_defragpackets++;
161555e9f80dSMike Silbersack 	m_defragbytes += m0->m_pkthdr.len;
161651710a45SMike Silbersack #endif
161755e9f80dSMike Silbersack 	return (m0);
161855e9f80dSMike Silbersack nospace:
161951710a45SMike Silbersack #ifdef MBUF_STRESS_TEST
162055e9f80dSMike Silbersack 	m_defragfailure++;
162151710a45SMike Silbersack #endif
162255e9f80dSMike Silbersack 	if (m_final)
162355e9f80dSMike Silbersack 		m_freem(m_final);
162455e9f80dSMike Silbersack 	return (NULL);
162555e9f80dSMike Silbersack }
16263390d476SMike Silbersack 
1627eeb76a18SSam Leffler /*
1628eeb76a18SSam Leffler  * Defragment an mbuf chain, returning at most maxfrags separate
1629eeb76a18SSam Leffler  * mbufs+clusters.  If this is not possible NULL is returned and
1630eeb76a18SSam Leffler  * the original mbuf chain is left in it's present (potentially
1631eeb76a18SSam Leffler  * modified) state.  We use two techniques: collapsing consecutive
1632eeb76a18SSam Leffler  * mbufs and replacing consecutive mbufs by a cluster.
1633eeb76a18SSam Leffler  *
1634eeb76a18SSam Leffler  * NB: this should really be named m_defrag but that name is taken
1635eeb76a18SSam Leffler  */
1636eeb76a18SSam Leffler struct mbuf *
1637eeb76a18SSam Leffler m_collapse(struct mbuf *m0, int how, int maxfrags)
1638eeb76a18SSam Leffler {
1639eeb76a18SSam Leffler 	struct mbuf *m, *n, *n2, **prev;
1640eeb76a18SSam Leffler 	u_int curfrags;
1641eeb76a18SSam Leffler 
1642eeb76a18SSam Leffler 	/*
1643eeb76a18SSam Leffler 	 * Calculate the current number of frags.
1644eeb76a18SSam Leffler 	 */
1645eeb76a18SSam Leffler 	curfrags = 0;
1646eeb76a18SSam Leffler 	for (m = m0; m != NULL; m = m->m_next)
1647eeb76a18SSam Leffler 		curfrags++;
1648eeb76a18SSam Leffler 	/*
1649eeb76a18SSam Leffler 	 * First, try to collapse mbufs.  Note that we always collapse
1650eeb76a18SSam Leffler 	 * towards the front so we don't need to deal with moving the
1651eeb76a18SSam Leffler 	 * pkthdr.  This may be suboptimal if the first mbuf has much
1652eeb76a18SSam Leffler 	 * less data than the following.
1653eeb76a18SSam Leffler 	 */
1654eeb76a18SSam Leffler 	m = m0;
1655eeb76a18SSam Leffler again:
1656eeb76a18SSam Leffler 	for (;;) {
1657eeb76a18SSam Leffler 		n = m->m_next;
1658eeb76a18SSam Leffler 		if (n == NULL)
1659eeb76a18SSam Leffler 			break;
166014d7c5b1SAndre Oppermann 		if (M_WRITABLE(m) &&
1661eeb76a18SSam Leffler 		    n->m_len < M_TRAILINGSPACE(m)) {
1662eeb76a18SSam Leffler 			bcopy(mtod(n, void *), mtod(m, char *) + m->m_len,
1663eeb76a18SSam Leffler 				n->m_len);
1664eeb76a18SSam Leffler 			m->m_len += n->m_len;
1665eeb76a18SSam Leffler 			m->m_next = n->m_next;
1666eeb76a18SSam Leffler 			m_free(n);
1667eeb76a18SSam Leffler 			if (--curfrags <= maxfrags)
1668eeb76a18SSam Leffler 				return m0;
1669eeb76a18SSam Leffler 		} else
1670eeb76a18SSam Leffler 			m = n;
1671eeb76a18SSam Leffler 	}
1672eeb76a18SSam Leffler 	KASSERT(maxfrags > 1,
1673eeb76a18SSam Leffler 		("maxfrags %u, but normal collapse failed", maxfrags));
1674eeb76a18SSam Leffler 	/*
1675eeb76a18SSam Leffler 	 * Collapse consecutive mbufs to a cluster.
1676eeb76a18SSam Leffler 	 */
1677eeb76a18SSam Leffler 	prev = &m0->m_next;		/* NB: not the first mbuf */
1678eeb76a18SSam Leffler 	while ((n = *prev) != NULL) {
1679eeb76a18SSam Leffler 		if ((n2 = n->m_next) != NULL &&
1680eeb76a18SSam Leffler 		    n->m_len + n2->m_len < MCLBYTES) {
1681eeb76a18SSam Leffler 			m = m_getcl(how, MT_DATA, 0);
1682eeb76a18SSam Leffler 			if (m == NULL)
1683eeb76a18SSam Leffler 				goto bad;
1684eeb76a18SSam Leffler 			bcopy(mtod(n, void *), mtod(m, void *), n->m_len);
1685eeb76a18SSam Leffler 			bcopy(mtod(n2, void *), mtod(m, char *) + n->m_len,
1686eeb76a18SSam Leffler 				n2->m_len);
1687eeb76a18SSam Leffler 			m->m_len = n->m_len + n2->m_len;
1688eeb76a18SSam Leffler 			m->m_next = n2->m_next;
1689eeb76a18SSam Leffler 			*prev = m;
1690eeb76a18SSam Leffler 			m_free(n);
1691eeb76a18SSam Leffler 			m_free(n2);
1692eeb76a18SSam Leffler 			if (--curfrags <= maxfrags)	/* +1 cl -2 mbufs */
1693eeb76a18SSam Leffler 				return m0;
1694eeb76a18SSam Leffler 			/*
1695eeb76a18SSam Leffler 			 * Still not there, try the normal collapse
1696eeb76a18SSam Leffler 			 * again before we allocate another cluster.
1697eeb76a18SSam Leffler 			 */
1698eeb76a18SSam Leffler 			goto again;
1699eeb76a18SSam Leffler 		}
1700eeb76a18SSam Leffler 		prev = &n->m_next;
1701eeb76a18SSam Leffler 	}
1702eeb76a18SSam Leffler 	/*
1703eeb76a18SSam Leffler 	 * No place where we can collapse to a cluster; punt.
1704eeb76a18SSam Leffler 	 * This can occur if, for example, you request 2 frags
1705eeb76a18SSam Leffler 	 * but the packet requires that both be clusters (we
1706eeb76a18SSam Leffler 	 * never reallocate the first mbuf to avoid moving the
1707eeb76a18SSam Leffler 	 * packet header).
1708eeb76a18SSam Leffler 	 */
1709eeb76a18SSam Leffler bad:
1710eeb76a18SSam Leffler 	return NULL;
1711eeb76a18SSam Leffler }
1712eeb76a18SSam Leffler 
17133390d476SMike Silbersack #ifdef MBUF_STRESS_TEST
17143390d476SMike Silbersack 
17153390d476SMike Silbersack /*
17163390d476SMike Silbersack  * Fragment an mbuf chain.  There's no reason you'd ever want to do
17173390d476SMike Silbersack  * this in normal usage, but it's great for stress testing various
17183390d476SMike Silbersack  * mbuf consumers.
17193390d476SMike Silbersack  *
17203390d476SMike Silbersack  * If fragmentation is not possible, the original chain will be
17213390d476SMike Silbersack  * returned.
17223390d476SMike Silbersack  *
17233390d476SMike Silbersack  * Possible length values:
17243390d476SMike Silbersack  * 0	 no fragmentation will occur
17253390d476SMike Silbersack  * > 0	each fragment will be of the specified length
17263390d476SMike Silbersack  * -1	each fragment will be the same random value in length
17273390d476SMike Silbersack  * -2	each fragment's length will be entirely random
17283390d476SMike Silbersack  * (Random values range from 1 to 256)
17293390d476SMike Silbersack  */
17303390d476SMike Silbersack struct mbuf *
17313390d476SMike Silbersack m_fragment(struct mbuf *m0, int how, int length)
17323390d476SMike Silbersack {
17333390d476SMike Silbersack 	struct mbuf *m_new = NULL, *m_final = NULL;
17343390d476SMike Silbersack 	int progress = 0;
17353390d476SMike Silbersack 
17363390d476SMike Silbersack 	if (!(m0->m_flags & M_PKTHDR))
17373390d476SMike Silbersack 		return (m0);
17383390d476SMike Silbersack 
17393390d476SMike Silbersack 	if ((length == 0) || (length < -2))
17403390d476SMike Silbersack 		return (m0);
17413390d476SMike Silbersack 
17423390d476SMike Silbersack 	m_fixhdr(m0); /* Needed sanity check */
17433390d476SMike Silbersack 
17443390d476SMike Silbersack 	m_final = m_getcl(how, MT_DATA, M_PKTHDR);
17453390d476SMike Silbersack 
17463390d476SMike Silbersack 	if (m_final == NULL)
17473390d476SMike Silbersack 		goto nospace;
17483390d476SMike Silbersack 
17498dee2f67SMike Silbersack 	if (m_dup_pkthdr(m_final, m0, how) == 0)
17503390d476SMike Silbersack 		goto nospace;
17513390d476SMike Silbersack 
17523390d476SMike Silbersack 	m_new = m_final;
17533390d476SMike Silbersack 
17543390d476SMike Silbersack 	if (length == -1)
17553390d476SMike Silbersack 		length = 1 + (arc4random() & 255);
17563390d476SMike Silbersack 
17573390d476SMike Silbersack 	while (progress < m0->m_pkthdr.len) {
17583390d476SMike Silbersack 		int fraglen;
17593390d476SMike Silbersack 
17603390d476SMike Silbersack 		if (length > 0)
17613390d476SMike Silbersack 			fraglen = length;
17623390d476SMike Silbersack 		else
17633390d476SMike Silbersack 			fraglen = 1 + (arc4random() & 255);
17643390d476SMike Silbersack 		if (fraglen > m0->m_pkthdr.len - progress)
17653390d476SMike Silbersack 			fraglen = m0->m_pkthdr.len - progress;
17663390d476SMike Silbersack 
17673390d476SMike Silbersack 		if (fraglen > MCLBYTES)
17683390d476SMike Silbersack 			fraglen = MCLBYTES;
17693390d476SMike Silbersack 
17703390d476SMike Silbersack 		if (m_new == NULL) {
17713390d476SMike Silbersack 			m_new = m_getcl(how, MT_DATA, 0);
17723390d476SMike Silbersack 			if (m_new == NULL)
17733390d476SMike Silbersack 				goto nospace;
17743390d476SMike Silbersack 		}
17753390d476SMike Silbersack 
17763390d476SMike Silbersack 		m_copydata(m0, progress, fraglen, mtod(m_new, caddr_t));
17773390d476SMike Silbersack 		progress += fraglen;
17783390d476SMike Silbersack 		m_new->m_len = fraglen;
17793390d476SMike Silbersack 		if (m_new != m_final)
17803390d476SMike Silbersack 			m_cat(m_final, m_new);
17813390d476SMike Silbersack 		m_new = NULL;
17823390d476SMike Silbersack 	}
17833390d476SMike Silbersack 	m_freem(m0);
17843390d476SMike Silbersack 	m0 = m_final;
17853390d476SMike Silbersack 	return (m0);
17863390d476SMike Silbersack nospace:
17873390d476SMike Silbersack 	if (m_final)
17883390d476SMike Silbersack 		m_freem(m_final);
17893390d476SMike Silbersack 	/* Return the original chain on failure */
17903390d476SMike Silbersack 	return (m0);
17913390d476SMike Silbersack }
17923390d476SMike Silbersack 
17933390d476SMike Silbersack #endif
1794beb699c7SMike Silbersack 
17955e20f43dSAndre Oppermann /*
17965e20f43dSAndre Oppermann  * Copy the contents of uio into a properly sized mbuf chain.
17975e20f43dSAndre Oppermann  */
1798beb699c7SMike Silbersack struct mbuf *
17995e20f43dSAndre Oppermann m_uiotombuf(struct uio *uio, int how, int len, int align, int flags)
1800beb699c7SMike Silbersack {
18015e20f43dSAndre Oppermann 	struct mbuf *m, *mb;
1802526d0bd5SKonstantin Belousov 	int error, length;
1803526d0bd5SKonstantin Belousov 	ssize_t total;
18045e20f43dSAndre Oppermann 	int progress = 0;
1805beb699c7SMike Silbersack 
18065e20f43dSAndre Oppermann 	/*
18075e20f43dSAndre Oppermann 	 * len can be zero or an arbitrary large value bound by
18085e20f43dSAndre Oppermann 	 * the total data supplied by the uio.
18095e20f43dSAndre Oppermann 	 */
1810beb699c7SMike Silbersack 	if (len > 0)
1811beb699c7SMike Silbersack 		total = min(uio->uio_resid, len);
1812beb699c7SMike Silbersack 	else
1813beb699c7SMike Silbersack 		total = uio->uio_resid;
18145e20f43dSAndre Oppermann 
18155e20f43dSAndre Oppermann 	/*
18165e20f43dSAndre Oppermann 	 * The smallest unit returned by m_getm2() is a single mbuf
18179128ec21SAndrew Thompson 	 * with pkthdr.  We can't align past it.
18185e20f43dSAndre Oppermann 	 */
181975ae2570SMaksim Yevmenkin 	if (align >= MHLEN)
1820beb699c7SMike Silbersack 		return (NULL);
18215e20f43dSAndre Oppermann 
18227c32173bSAndre Oppermann 	/*
18237c32173bSAndre Oppermann 	 * Give us the full allocation or nothing.
18247c32173bSAndre Oppermann 	 * If len is zero return the smallest empty mbuf.
18257c32173bSAndre Oppermann 	 */
18267c32173bSAndre Oppermann 	m = m_getm2(NULL, max(total + align, 1), how, MT_DATA, flags);
18275e20f43dSAndre Oppermann 	if (m == NULL)
18285e20f43dSAndre Oppermann 		return (NULL);
18295e20f43dSAndre Oppermann 	m->m_data += align;
18305e20f43dSAndre Oppermann 
18315e20f43dSAndre Oppermann 	/* Fill all mbufs with uio data and update header information. */
18325e20f43dSAndre Oppermann 	for (mb = m; mb != NULL; mb = mb->m_next) {
18335e20f43dSAndre Oppermann 		length = min(M_TRAILINGSPACE(mb), total - progress);
18345e20f43dSAndre Oppermann 
18355e20f43dSAndre Oppermann 		error = uiomove(mtod(mb, void *), length, uio);
18365e20f43dSAndre Oppermann 		if (error) {
18375e20f43dSAndre Oppermann 			m_freem(m);
18385e20f43dSAndre Oppermann 			return (NULL);
18395e20f43dSAndre Oppermann 		}
18405e20f43dSAndre Oppermann 
18415e20f43dSAndre Oppermann 		mb->m_len = length;
18425e20f43dSAndre Oppermann 		progress += length;
18435e20f43dSAndre Oppermann 		if (flags & M_PKTHDR)
18445e20f43dSAndre Oppermann 			m->m_pkthdr.len += length;
18455e20f43dSAndre Oppermann 	}
18465e20f43dSAndre Oppermann 	KASSERT(progress == total, ("%s: progress != total", __func__));
18475e20f43dSAndre Oppermann 
18485e20f43dSAndre Oppermann 	return (m);
1849beb699c7SMike Silbersack }
1850ab8ab90cSSam Leffler 
1851ab8ab90cSSam Leffler /*
1852bc05b2f6SAndre Oppermann  * Copy an mbuf chain into a uio limited by len if set.
1853bc05b2f6SAndre Oppermann  */
1854bc05b2f6SAndre Oppermann int
1855bc05b2f6SAndre Oppermann m_mbuftouio(struct uio *uio, struct mbuf *m, int len)
1856bc05b2f6SAndre Oppermann {
1857bc05b2f6SAndre Oppermann 	int error, length, total;
1858bc05b2f6SAndre Oppermann 	int progress = 0;
1859bc05b2f6SAndre Oppermann 
1860bc05b2f6SAndre Oppermann 	if (len > 0)
1861bc05b2f6SAndre Oppermann 		total = min(uio->uio_resid, len);
1862bc05b2f6SAndre Oppermann 	else
1863bc05b2f6SAndre Oppermann 		total = uio->uio_resid;
1864bc05b2f6SAndre Oppermann 
1865bc05b2f6SAndre Oppermann 	/* Fill the uio with data from the mbufs. */
1866bc05b2f6SAndre Oppermann 	for (; m != NULL; m = m->m_next) {
1867bc05b2f6SAndre Oppermann 		length = min(m->m_len, total - progress);
1868bc05b2f6SAndre Oppermann 
1869bc05b2f6SAndre Oppermann 		error = uiomove(mtod(m, void *), length, uio);
1870bc05b2f6SAndre Oppermann 		if (error)
1871bc05b2f6SAndre Oppermann 			return (error);
1872bc05b2f6SAndre Oppermann 
1873bc05b2f6SAndre Oppermann 		progress += length;
1874bc05b2f6SAndre Oppermann 	}
1875bc05b2f6SAndre Oppermann 
1876bc05b2f6SAndre Oppermann 	return (0);
1877bc05b2f6SAndre Oppermann }
1878bc05b2f6SAndre Oppermann 
1879bc05b2f6SAndre Oppermann /*
1880ab8ab90cSSam Leffler  * Set the m_data pointer of a newly-allocated mbuf
1881ab8ab90cSSam Leffler  * to place an object of the specified size at the
1882ab8ab90cSSam Leffler  * end of the mbuf, longword aligned.
1883ab8ab90cSSam Leffler  */
1884ab8ab90cSSam Leffler void
1885ab8ab90cSSam Leffler m_align(struct mbuf *m, int len)
1886ab8ab90cSSam Leffler {
18874f67e143SGleb Smirnoff #ifdef INVARIANTS
18884f67e143SGleb Smirnoff 	const char *msg = "%s: not a virgin mbuf";
18894f67e143SGleb Smirnoff #endif
1890ab8ab90cSSam Leffler 	int adjust;
1891ab8ab90cSSam Leffler 
18924f67e143SGleb Smirnoff 	if (m->m_flags & M_EXT) {
18934f67e143SGleb Smirnoff 		KASSERT(m->m_data == m->m_ext.ext_buf, (msg, __func__));
1894ab8ab90cSSam Leffler 		adjust = m->m_ext.ext_size - len;
18954f67e143SGleb Smirnoff 	} else if (m->m_flags & M_PKTHDR) {
18964f67e143SGleb Smirnoff 		KASSERT(m->m_data == m->m_pktdat, (msg, __func__));
1897ab8ab90cSSam Leffler 		adjust = MHLEN - len;
18984f67e143SGleb Smirnoff 	} else {
18994f67e143SGleb Smirnoff 		KASSERT(m->m_data == m->m_dat, (msg, __func__));
1900ab8ab90cSSam Leffler 		adjust = MLEN - len;
19014f67e143SGleb Smirnoff 	}
19024f67e143SGleb Smirnoff 
1903ab8ab90cSSam Leffler 	m->m_data += adjust &~ (sizeof(long)-1);
1904ab8ab90cSSam Leffler }
190547e2996eSSam Leffler 
190647e2996eSSam Leffler /*
190747e2996eSSam Leffler  * Create a writable copy of the mbuf chain.  While doing this
190847e2996eSSam Leffler  * we compact the chain with a goal of producing a chain with
190947e2996eSSam Leffler  * at most two mbufs.  The second mbuf in this chain is likely
191047e2996eSSam Leffler  * to be a cluster.  The primary purpose of this work is to create
191147e2996eSSam Leffler  * a writable packet for encryption, compression, etc.  The
191247e2996eSSam Leffler  * secondary goal is to linearize the data so the data can be
191347e2996eSSam Leffler  * passed to crypto hardware in the most efficient manner possible.
191447e2996eSSam Leffler  */
191547e2996eSSam Leffler struct mbuf *
191647e2996eSSam Leffler m_unshare(struct mbuf *m0, int how)
191747e2996eSSam Leffler {
191847e2996eSSam Leffler 	struct mbuf *m, *mprev;
191947e2996eSSam Leffler 	struct mbuf *n, *mfirst, *mlast;
192047e2996eSSam Leffler 	int len, off;
192147e2996eSSam Leffler 
192247e2996eSSam Leffler 	mprev = NULL;
192347e2996eSSam Leffler 	for (m = m0; m != NULL; m = mprev->m_next) {
192447e2996eSSam Leffler 		/*
192547e2996eSSam Leffler 		 * Regular mbufs are ignored unless there's a cluster
192647e2996eSSam Leffler 		 * in front of it that we can use to coalesce.  We do
192747e2996eSSam Leffler 		 * the latter mainly so later clusters can be coalesced
192847e2996eSSam Leffler 		 * also w/o having to handle them specially (i.e. convert
192947e2996eSSam Leffler 		 * mbuf+cluster -> cluster).  This optimization is heavily
193047e2996eSSam Leffler 		 * influenced by the assumption that we're running over
193147e2996eSSam Leffler 		 * Ethernet where MCLBYTES is large enough that the max
193247e2996eSSam Leffler 		 * packet size will permit lots of coalescing into a
193347e2996eSSam Leffler 		 * single cluster.  This in turn permits efficient
193447e2996eSSam Leffler 		 * crypto operations, especially when using hardware.
193547e2996eSSam Leffler 		 */
193647e2996eSSam Leffler 		if ((m->m_flags & M_EXT) == 0) {
193747e2996eSSam Leffler 			if (mprev && (mprev->m_flags & M_EXT) &&
193847e2996eSSam Leffler 			    m->m_len <= M_TRAILINGSPACE(mprev)) {
193947e2996eSSam Leffler 				/* XXX: this ignores mbuf types */
194047e2996eSSam Leffler 				memcpy(mtod(mprev, caddr_t) + mprev->m_len,
194147e2996eSSam Leffler 				       mtod(m, caddr_t), m->m_len);
194247e2996eSSam Leffler 				mprev->m_len += m->m_len;
194347e2996eSSam Leffler 				mprev->m_next = m->m_next;	/* unlink from chain */
194447e2996eSSam Leffler 				m_free(m);			/* reclaim mbuf */
194547e2996eSSam Leffler #if 0
194647e2996eSSam Leffler 				newipsecstat.ips_mbcoalesced++;
194747e2996eSSam Leffler #endif
194847e2996eSSam Leffler 			} else {
194947e2996eSSam Leffler 				mprev = m;
195047e2996eSSam Leffler 			}
195147e2996eSSam Leffler 			continue;
195247e2996eSSam Leffler 		}
195347e2996eSSam Leffler 		/*
195447e2996eSSam Leffler 		 * Writable mbufs are left alone (for now).
195547e2996eSSam Leffler 		 */
195647e2996eSSam Leffler 		if (M_WRITABLE(m)) {
195747e2996eSSam Leffler 			mprev = m;
195847e2996eSSam Leffler 			continue;
195947e2996eSSam Leffler 		}
196047e2996eSSam Leffler 
196147e2996eSSam Leffler 		/*
196247e2996eSSam Leffler 		 * Not writable, replace with a copy or coalesce with
196347e2996eSSam Leffler 		 * the previous mbuf if possible (since we have to copy
196447e2996eSSam Leffler 		 * it anyway, we try to reduce the number of mbufs and
196547e2996eSSam Leffler 		 * clusters so that future work is easier).
196647e2996eSSam Leffler 		 */
196747e2996eSSam Leffler 		KASSERT(m->m_flags & M_EXT, ("m_flags 0x%x", m->m_flags));
196847e2996eSSam Leffler 		/* NB: we only coalesce into a cluster or larger */
196947e2996eSSam Leffler 		if (mprev != NULL && (mprev->m_flags & M_EXT) &&
197047e2996eSSam Leffler 		    m->m_len <= M_TRAILINGSPACE(mprev)) {
197147e2996eSSam Leffler 			/* XXX: this ignores mbuf types */
197247e2996eSSam Leffler 			memcpy(mtod(mprev, caddr_t) + mprev->m_len,
197347e2996eSSam Leffler 			       mtod(m, caddr_t), m->m_len);
197447e2996eSSam Leffler 			mprev->m_len += m->m_len;
197547e2996eSSam Leffler 			mprev->m_next = m->m_next;	/* unlink from chain */
197647e2996eSSam Leffler 			m_free(m);			/* reclaim mbuf */
197747e2996eSSam Leffler #if 0
197847e2996eSSam Leffler 			newipsecstat.ips_clcoalesced++;
197947e2996eSSam Leffler #endif
198047e2996eSSam Leffler 			continue;
198147e2996eSSam Leffler 		}
198247e2996eSSam Leffler 
198347e2996eSSam Leffler 		/*
19845368b81eSGleb Smirnoff 		 * Allocate new space to hold the copy and copy the data.
19855368b81eSGleb Smirnoff 		 * We deal with jumbo mbufs (i.e. m_len > MCLBYTES) by
19865368b81eSGleb Smirnoff 		 * splitting them into clusters.  We could just malloc a
19875368b81eSGleb Smirnoff 		 * buffer and make it external but too many device drivers
19885368b81eSGleb Smirnoff 		 * don't know how to break up the non-contiguous memory when
19895368b81eSGleb Smirnoff 		 * doing DMA.
199047e2996eSSam Leffler 		 */
199147e2996eSSam Leffler 		n = m_getcl(how, m->m_type, m->m_flags);
199247e2996eSSam Leffler 		if (n == NULL) {
199347e2996eSSam Leffler 			m_freem(m0);
199447e2996eSSam Leffler 			return (NULL);
199547e2996eSSam Leffler 		}
199647e2996eSSam Leffler 		len = m->m_len;
199747e2996eSSam Leffler 		off = 0;
199847e2996eSSam Leffler 		mfirst = n;
199947e2996eSSam Leffler 		mlast = NULL;
200047e2996eSSam Leffler 		for (;;) {
200147e2996eSSam Leffler 			int cc = min(len, MCLBYTES);
200247e2996eSSam Leffler 			memcpy(mtod(n, caddr_t), mtod(m, caddr_t) + off, cc);
200347e2996eSSam Leffler 			n->m_len = cc;
200447e2996eSSam Leffler 			if (mlast != NULL)
200547e2996eSSam Leffler 				mlast->m_next = n;
200647e2996eSSam Leffler 			mlast = n;
200747e2996eSSam Leffler #if 0
200847e2996eSSam Leffler 			newipsecstat.ips_clcopied++;
200947e2996eSSam Leffler #endif
201047e2996eSSam Leffler 
201147e2996eSSam Leffler 			len -= cc;
201247e2996eSSam Leffler 			if (len <= 0)
201347e2996eSSam Leffler 				break;
201447e2996eSSam Leffler 			off += cc;
201547e2996eSSam Leffler 
201647e2996eSSam Leffler 			n = m_getcl(how, m->m_type, m->m_flags);
201747e2996eSSam Leffler 			if (n == NULL) {
201847e2996eSSam Leffler 				m_freem(mfirst);
201947e2996eSSam Leffler 				m_freem(m0);
202047e2996eSSam Leffler 				return (NULL);
202147e2996eSSam Leffler 			}
202247e2996eSSam Leffler 		}
202347e2996eSSam Leffler 		n->m_next = m->m_next;
202447e2996eSSam Leffler 		if (mprev == NULL)
202547e2996eSSam Leffler 			m0 = mfirst;		/* new head of chain */
202647e2996eSSam Leffler 		else
202747e2996eSSam Leffler 			mprev->m_next = mfirst;	/* replace old mbuf */
202847e2996eSSam Leffler 		m_free(m);			/* release old mbuf */
202947e2996eSSam Leffler 		mprev = mfirst;
203047e2996eSSam Leffler 	}
203147e2996eSSam Leffler 	return (m0);
203247e2996eSSam Leffler }
20336eeac1d9SJulian Elischer 
20346eeac1d9SJulian Elischer #ifdef MBUF_PROFILING
20356eeac1d9SJulian Elischer 
/*
 * Histogram storage for mbuf chain profiling.
 *
 * m_profile() bumps one bucket per array for every chain it inspects:
 * 'segments' is indexed by the (clamped) number of mbufs in the chain,
 * 'used' and 'wasted' by fls() of the (clamped) byte totals.
 */
#define MP_BUCKETS 32 /* don't just change this as things may overflow.*/
struct mbufprofile {
	uintmax_t wasted[MP_BUCKETS];
	uintmax_t used[MP_BUCKETS];
	uintmax_t segments[MP_BUCKETS];
} mbprof;

/*
 * Sizing of the text buffer the histograms are rendered into.
 *
 * A 64-bit counter printed in decimal needs at most 20 characters
 * (strlen("18446744073709551615") == 20); MP_MAXDIGITS keeps one spare.
 * Each number is followed by one separator, hence the "+1" below.
 */
#define MP_MAXDIGITS 21	/* > strlen("18446744073709551615") == 20 */
#define MP_NUMLINES 6		/* 3 histograms, up to 2 lines each */
#define MP_NUMSPERLINE 16	/* counters printed per line */
#define MP_EXTRABYTES 64	/* > strlen("used:\nwasted:\nsegments:\n") */
/* work out max space needed and add a bit of spare space too */
#define MP_MAXLINE ((MP_MAXDIGITS+1) * MP_NUMSPERLINE)
#define MP_BUFSIZE ((MP_MAXLINE * MP_NUMLINES) + 1 + MP_EXTRABYTES)

/* Rendered profile text; rewritten by mbprof_textify(). */
char mbprofbuf[MP_BUFSIZE];
20526eeac1d9SJulian Elischer 
20536eeac1d9SJulian Elischer void
20546eeac1d9SJulian Elischer m_profile(struct mbuf *m)
20556eeac1d9SJulian Elischer {
20566eeac1d9SJulian Elischer 	int segments = 0;
20576eeac1d9SJulian Elischer 	int used = 0;
20586eeac1d9SJulian Elischer 	int wasted = 0;
20596eeac1d9SJulian Elischer 
20606eeac1d9SJulian Elischer 	while (m) {
20616eeac1d9SJulian Elischer 		segments++;
20626eeac1d9SJulian Elischer 		used += m->m_len;
20636eeac1d9SJulian Elischer 		if (m->m_flags & M_EXT) {
20646eeac1d9SJulian Elischer 			wasted += MHLEN - sizeof(m->m_ext) +
20656eeac1d9SJulian Elischer 			    m->m_ext.ext_size - m->m_len;
20666eeac1d9SJulian Elischer 		} else {
20676eeac1d9SJulian Elischer 			if (m->m_flags & M_PKTHDR)
20686eeac1d9SJulian Elischer 				wasted += MHLEN - m->m_len;
20696eeac1d9SJulian Elischer 			else
20706eeac1d9SJulian Elischer 				wasted += MLEN - m->m_len;
20716eeac1d9SJulian Elischer 		}
20726eeac1d9SJulian Elischer 		m = m->m_next;
20736eeac1d9SJulian Elischer 	}
20746eeac1d9SJulian Elischer 	/* be paranoid.. it helps */
20756eeac1d9SJulian Elischer 	if (segments > MP_BUCKETS - 1)
20766eeac1d9SJulian Elischer 		segments = MP_BUCKETS - 1;
20776eeac1d9SJulian Elischer 	if (used > 100000)
20786eeac1d9SJulian Elischer 		used = 100000;
20796eeac1d9SJulian Elischer 	if (wasted > 100000)
20806eeac1d9SJulian Elischer 		wasted = 100000;
20816eeac1d9SJulian Elischer 	/* store in the appropriate bucket */
20826eeac1d9SJulian Elischer 	/* don't bother locking. if it's slightly off, so what? */
20836eeac1d9SJulian Elischer 	mbprof.segments[segments]++;
20846eeac1d9SJulian Elischer 	mbprof.used[fls(used)]++;
20856eeac1d9SJulian Elischer 	mbprof.wasted[fls(wasted)]++;
20866eeac1d9SJulian Elischer }
20876eeac1d9SJulian Elischer 
20886eeac1d9SJulian Elischer static void
20896eeac1d9SJulian Elischer mbprof_textify(void)
20906eeac1d9SJulian Elischer {
20916eeac1d9SJulian Elischer 	int offset;
20926eeac1d9SJulian Elischer 	char *c;
209360ae52f7SEd Schouten 	uint64_t *p;
20946eeac1d9SJulian Elischer 
20956eeac1d9SJulian Elischer 
20966eeac1d9SJulian Elischer 	p = &mbprof.wasted[0];
20976eeac1d9SJulian Elischer 	c = mbprofbuf;
20986eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE + 10,
20996eeac1d9SJulian Elischer 	    "wasted:\n"
21002182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21012182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju\n",
21026eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21036eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21046eeac1d9SJulian Elischer #ifdef BIG_ARRAY
21056eeac1d9SJulian Elischer 	p = &mbprof.wasted[16];
21066eeac1d9SJulian Elischer 	c += offset;
21076eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE,
21082182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21092182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju\n",
21106eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21116eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21126eeac1d9SJulian Elischer #endif
21136eeac1d9SJulian Elischer 	p = &mbprof.used[0];
21146eeac1d9SJulian Elischer 	c += offset;
21156eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE + 10,
21166eeac1d9SJulian Elischer 	    "used:\n"
21172182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21182182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju\n",
21196eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21206eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21216eeac1d9SJulian Elischer #ifdef BIG_ARRAY
21226eeac1d9SJulian Elischer 	p = &mbprof.used[16];
21236eeac1d9SJulian Elischer 	c += offset;
21246eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE,
21252182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21262182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju\n",
21276eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21286eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21296eeac1d9SJulian Elischer #endif
21306eeac1d9SJulian Elischer 	p = &mbprof.segments[0];
21316eeac1d9SJulian Elischer 	c += offset;
21326eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE + 10,
21336eeac1d9SJulian Elischer 	    "segments:\n"
21342182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21352182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju\n",
21366eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21376eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21386eeac1d9SJulian Elischer #ifdef BIG_ARRAY
21396eeac1d9SJulian Elischer 	p = &mbprof.segments[16];
21406eeac1d9SJulian Elischer 	c += offset;
21416eeac1d9SJulian Elischer 	offset = snprintf(c, MP_MAXLINE,
21422182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %ju "
21432182c0cfSJulian Elischer 	    "%ju %ju %ju %ju %ju %ju %ju %jju",
21446eeac1d9SJulian Elischer 	    p[0], p[1], p[2], p[3], p[4], p[5], p[6], p[7],
21456eeac1d9SJulian Elischer 	    p[8], p[9], p[10], p[11], p[12], p[13], p[14], p[15]);
21466eeac1d9SJulian Elischer #endif
21476eeac1d9SJulian Elischer }
21486eeac1d9SJulian Elischer 
21496eeac1d9SJulian Elischer static int
21506eeac1d9SJulian Elischer mbprof_handler(SYSCTL_HANDLER_ARGS)
21516eeac1d9SJulian Elischer {
21526eeac1d9SJulian Elischer 	int error;
21536eeac1d9SJulian Elischer 
21546eeac1d9SJulian Elischer 	mbprof_textify();
21556eeac1d9SJulian Elischer 	error = SYSCTL_OUT(req, mbprofbuf, strlen(mbprofbuf) + 1);
21566eeac1d9SJulian Elischer 	return (error);
21576eeac1d9SJulian Elischer }
21586eeac1d9SJulian Elischer 
21596eeac1d9SJulian Elischer static int
21606eeac1d9SJulian Elischer mbprof_clr_handler(SYSCTL_HANDLER_ARGS)
21616eeac1d9SJulian Elischer {
21626eeac1d9SJulian Elischer 	int clear, error;
21636eeac1d9SJulian Elischer 
21646eeac1d9SJulian Elischer 	clear = 0;
21656eeac1d9SJulian Elischer 	error = sysctl_handle_int(oidp, &clear, 0, req);
21666eeac1d9SJulian Elischer 	if (error || !req->newptr)
21676eeac1d9SJulian Elischer 		return (error);
21686eeac1d9SJulian Elischer 
21696eeac1d9SJulian Elischer 	if (clear) {
21706eeac1d9SJulian Elischer 		bzero(&mbprof, sizeof(mbprof));
21716eeac1d9SJulian Elischer 	}
21726eeac1d9SJulian Elischer 
21736eeac1d9SJulian Elischer 	return (error);
21746eeac1d9SJulian Elischer }
21756eeac1d9SJulian Elischer 
21766eeac1d9SJulian Elischer 
21776eeac1d9SJulian Elischer SYSCTL_PROC(_kern_ipc, OID_AUTO, mbufprofile, CTLTYPE_STRING|CTLFLAG_RD,
21786eeac1d9SJulian Elischer 	    NULL, 0, mbprof_handler, "A", "mbuf profiling statistics");
21796eeac1d9SJulian Elischer 
21806eeac1d9SJulian Elischer SYSCTL_PROC(_kern_ipc, OID_AUTO, mbufprofileclr, CTLTYPE_INT|CTLFLAG_RW,
21816eeac1d9SJulian Elischer 	    NULL, 0, mbprof_clr_handler, "I", "clear mbuf profiling statistics");
21826eeac1d9SJulian Elischer #endif
21836eeac1d9SJulian Elischer 
2184