xref: /freebsd/sys/compat/linuxkpi/common/src/linux_skbuff.c (revision 349b042b90057c1e9dbb64dfdb894fe03ea20a1d)
149ed6e97SBjoern A. Zeeb /*-
26baea331SBjoern A. Zeeb  * Copyright (c) 2020-2022 The FreeBSD Foundation
36baea331SBjoern A. Zeeb  * Copyright (c) 2021-2022 Bjoern A. Zeeb
449ed6e97SBjoern A. Zeeb  *
549ed6e97SBjoern A. Zeeb  * This software was developed by Björn Zeeb under sponsorship from
649ed6e97SBjoern A. Zeeb  * the FreeBSD Foundation.
749ed6e97SBjoern A. Zeeb  *
849ed6e97SBjoern A. Zeeb  * Redistribution and use in source and binary forms, with or without
949ed6e97SBjoern A. Zeeb  * modification, are permitted provided that the following conditions
1049ed6e97SBjoern A. Zeeb  * are met:
1149ed6e97SBjoern A. Zeeb  * 1. Redistributions of source code must retain the above copyright
1249ed6e97SBjoern A. Zeeb  *    notice, this list of conditions and the following disclaimer.
1349ed6e97SBjoern A. Zeeb  * 2. Redistributions in binary form must reproduce the above copyright
1449ed6e97SBjoern A. Zeeb  *    notice, this list of conditions and the following disclaimer in the
1549ed6e97SBjoern A. Zeeb  *    documentation and/or other materials provided with the distribution.
1649ed6e97SBjoern A. Zeeb  *
1749ed6e97SBjoern A. Zeeb  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
1849ed6e97SBjoern A. Zeeb  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
1949ed6e97SBjoern A. Zeeb  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
2049ed6e97SBjoern A. Zeeb  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
2149ed6e97SBjoern A. Zeeb  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
2249ed6e97SBjoern A. Zeeb  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
2349ed6e97SBjoern A. Zeeb  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
2449ed6e97SBjoern A. Zeeb  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
2549ed6e97SBjoern A. Zeeb  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
2649ed6e97SBjoern A. Zeeb  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
2749ed6e97SBjoern A. Zeeb  * SUCH DAMAGE.
2849ed6e97SBjoern A. Zeeb  *
2949ed6e97SBjoern A. Zeeb  * $FreeBSD$
3049ed6e97SBjoern A. Zeeb  */
3149ed6e97SBjoern A. Zeeb 
3249ed6e97SBjoern A. Zeeb /*
3349ed6e97SBjoern A. Zeeb  * NOTE: this socket buffer compatibility code is highly EXPERIMENTAL.
3449ed6e97SBjoern A. Zeeb  *       Do not rely on the internals of this implementation.  They are highly
3549ed6e97SBjoern A. Zeeb  *       likely to change as we will improve the integration to FreeBSD mbufs.
3649ed6e97SBjoern A. Zeeb  */
3749ed6e97SBjoern A. Zeeb 
3849ed6e97SBjoern A. Zeeb #include <sys/cdefs.h>
3949ed6e97SBjoern A. Zeeb __FBSDID("$FreeBSD$");
4049ed6e97SBjoern A. Zeeb 
416baea331SBjoern A. Zeeb #include "opt_ddb.h"
426baea331SBjoern A. Zeeb 
4349ed6e97SBjoern A. Zeeb #include <sys/param.h>
4449ed6e97SBjoern A. Zeeb #include <sys/types.h>
4549ed6e97SBjoern A. Zeeb #include <sys/kernel.h>
4649ed6e97SBjoern A. Zeeb #include <sys/malloc.h>
476baea331SBjoern A. Zeeb #include <sys/sysctl.h>
486baea331SBjoern A. Zeeb 
496baea331SBjoern A. Zeeb #ifdef DDB
506baea331SBjoern A. Zeeb #include <ddb/ddb.h>
516baea331SBjoern A. Zeeb #endif
5249ed6e97SBjoern A. Zeeb 
5349ed6e97SBjoern A. Zeeb #include <linux/skbuff.h>
5449ed6e97SBjoern A. Zeeb #include <linux/slab.h>
556baea331SBjoern A. Zeeb #include <linux/gfp.h>
566baea331SBjoern A. Zeeb 
576baea331SBjoern A. Zeeb #ifdef SKB_DEBUG
586baea331SBjoern A. Zeeb SYSCTL_DECL(_compat_linuxkpi);
596baea331SBjoern A. Zeeb SYSCTL_NODE(_compat_linuxkpi, OID_AUTO, skb, CTLFLAG_RW | CTLFLAG_MPSAFE, 0,
606baea331SBjoern A. Zeeb     "LinuxKPI skbuff");
616baea331SBjoern A. Zeeb 
626baea331SBjoern A. Zeeb int linuxkpi_debug_skb;
636baea331SBjoern A. Zeeb SYSCTL_INT(_compat_linuxkpi_skb, OID_AUTO, debug, CTLFLAG_RWTUN,
646baea331SBjoern A. Zeeb     &linuxkpi_debug_skb, 0, "SKB debug level");
656baea331SBjoern A. Zeeb #endif
6649ed6e97SBjoern A. Zeeb 
6749ed6e97SBjoern A. Zeeb static MALLOC_DEFINE(M_LKPISKB, "lkpiskb", "Linux KPI skbuff compat");
6849ed6e97SBjoern A. Zeeb 
6949ed6e97SBjoern A. Zeeb struct sk_buff *
7049ed6e97SBjoern A. Zeeb linuxkpi_alloc_skb(size_t size, gfp_t gfp)
7149ed6e97SBjoern A. Zeeb {
7249ed6e97SBjoern A. Zeeb 	struct sk_buff *skb;
7349ed6e97SBjoern A. Zeeb 	size_t len;
7449ed6e97SBjoern A. Zeeb 
7549ed6e97SBjoern A. Zeeb 	len = sizeof(*skb) + size + sizeof(struct skb_shared_info);
7649ed6e97SBjoern A. Zeeb 	/*
776baea331SBjoern A. Zeeb 	 * Using our own type here not backing my kmalloc.
7849ed6e97SBjoern A. Zeeb 	 * We assume no one calls kfree directly on the skb.
7949ed6e97SBjoern A. Zeeb 	 */
8049ed6e97SBjoern A. Zeeb 	skb = malloc(len, M_LKPISKB, linux_check_m_flags(gfp) | M_ZERO);
8149ed6e97SBjoern A. Zeeb 	if (skb == NULL)
8249ed6e97SBjoern A. Zeeb 		return (skb);
839df5f29cSBjoern A. Zeeb 	skb->_alloc_len = len;
8449ed6e97SBjoern A. Zeeb 	skb->truesize = size;
8549ed6e97SBjoern A. Zeeb 
8649ed6e97SBjoern A. Zeeb 	skb->head = skb->data = skb->tail = (uint8_t *)(skb+1);
8749ed6e97SBjoern A. Zeeb 	skb->end = skb->head + size;
8849ed6e97SBjoern A. Zeeb 
896a8973c3SBjoern A. Zeeb 	skb->prev = skb->next = skb;
906a8973c3SBjoern A. Zeeb 
9149ed6e97SBjoern A. Zeeb 	skb->shinfo = (struct skb_shared_info *)(skb->end);
9249ed6e97SBjoern A. Zeeb 
939df5f29cSBjoern A. Zeeb 	SKB_TRACE_FMT(skb, "data %p size %zu", (skb) ? skb->data : NULL, size);
949df5f29cSBjoern A. Zeeb 	return (skb);
959df5f29cSBjoern A. Zeeb }
969df5f29cSBjoern A. Zeeb 
979df5f29cSBjoern A. Zeeb struct sk_buff *
989df5f29cSBjoern A. Zeeb linuxkpi_dev_alloc_skb(size_t size, gfp_t gfp)
999df5f29cSBjoern A. Zeeb {
1009df5f29cSBjoern A. Zeeb 	struct sk_buff *skb;
1019df5f29cSBjoern A. Zeeb 	size_t len;
1029df5f29cSBjoern A. Zeeb 
1039df5f29cSBjoern A. Zeeb 	len = size + NET_SKB_PAD;
1049df5f29cSBjoern A. Zeeb 	skb = linuxkpi_alloc_skb(len, gfp);
1059df5f29cSBjoern A. Zeeb 
1069df5f29cSBjoern A. Zeeb 	if (skb != NULL)
1079df5f29cSBjoern A. Zeeb 		skb_reserve(skb, NET_SKB_PAD);
1089df5f29cSBjoern A. Zeeb 
1099df5f29cSBjoern A. Zeeb 	SKB_TRACE_FMT(skb, "data %p size %zu len %zu",
1109df5f29cSBjoern A. Zeeb 	    (skb) ? skb->data : NULL, size, len);
11149ed6e97SBjoern A. Zeeb 	return (skb);
11249ed6e97SBjoern A. Zeeb }
11349ed6e97SBjoern A. Zeeb 
114*349b042bSBjoern A. Zeeb struct sk_buff *
115*349b042bSBjoern A. Zeeb linuxkpi_skb_copy(struct sk_buff *skb, gfp_t gfp)
116*349b042bSBjoern A. Zeeb {
117*349b042bSBjoern A. Zeeb 	struct sk_buff *new;
118*349b042bSBjoern A. Zeeb 	struct skb_shared_info *shinfo;
119*349b042bSBjoern A. Zeeb 	size_t len;
120*349b042bSBjoern A. Zeeb 	unsigned int headroom;
121*349b042bSBjoern A. Zeeb 
122*349b042bSBjoern A. Zeeb 	/* Full buffer size + any fragments. */
123*349b042bSBjoern A. Zeeb 	len = skb->end - skb->head + skb->data_len;
124*349b042bSBjoern A. Zeeb 
125*349b042bSBjoern A. Zeeb 	new = linuxkpi_alloc_skb(len, gfp);
126*349b042bSBjoern A. Zeeb 	if (new == NULL)
127*349b042bSBjoern A. Zeeb 		return (NULL);
128*349b042bSBjoern A. Zeeb 
129*349b042bSBjoern A. Zeeb 	headroom = skb_headroom(skb);
130*349b042bSBjoern A. Zeeb 	/* Fixup head and end. */
131*349b042bSBjoern A. Zeeb 	skb_reserve(new, headroom);	/* data and tail move headroom forward. */
132*349b042bSBjoern A. Zeeb 	skb_put(new, skb->len);		/* tail and len get adjusted */
133*349b042bSBjoern A. Zeeb 
134*349b042bSBjoern A. Zeeb 	/* Copy data. */
135*349b042bSBjoern A. Zeeb 	memcpy(new->head, skb->data - headroom, headroom + skb->len);
136*349b042bSBjoern A. Zeeb 
137*349b042bSBjoern A. Zeeb 	/* Deal with fragments. */
138*349b042bSBjoern A. Zeeb 	shinfo = skb->shinfo;
139*349b042bSBjoern A. Zeeb 	if (shinfo->nr_frags > 0) {
140*349b042bSBjoern A. Zeeb 		printf("%s:%d: NOT YET SUPPORTED; missing %d frags\n",
141*349b042bSBjoern A. Zeeb 		    __func__, __LINE__, shinfo->nr_frags);
142*349b042bSBjoern A. Zeeb 		SKB_TODO();
143*349b042bSBjoern A. Zeeb 	}
144*349b042bSBjoern A. Zeeb 
145*349b042bSBjoern A. Zeeb 	/* Deal with header fields. */
146*349b042bSBjoern A. Zeeb 	memcpy(new->cb, skb->cb, sizeof(skb->cb));
147*349b042bSBjoern A. Zeeb 	SKB_IMPROVE("more header fields to copy?");
148*349b042bSBjoern A. Zeeb 
149*349b042bSBjoern A. Zeeb 	return (new);
150*349b042bSBjoern A. Zeeb }
151*349b042bSBjoern A. Zeeb 
15249ed6e97SBjoern A. Zeeb void
15349ed6e97SBjoern A. Zeeb linuxkpi_kfree_skb(struct sk_buff *skb)
15449ed6e97SBjoern A. Zeeb {
15549ed6e97SBjoern A. Zeeb 	struct skb_shared_info *shinfo;
1566baea331SBjoern A. Zeeb 	uint16_t fragno, count;
15749ed6e97SBjoern A. Zeeb 
15849ed6e97SBjoern A. Zeeb 	SKB_TRACE(skb);
15949ed6e97SBjoern A. Zeeb 	if (skb == NULL)
16049ed6e97SBjoern A. Zeeb 		return;
16149ed6e97SBjoern A. Zeeb 
16249ed6e97SBjoern A. Zeeb 	/*
16349ed6e97SBjoern A. Zeeb 	 * XXX TODO this will go away once we have skb backed by mbuf.
16449ed6e97SBjoern A. Zeeb 	 * currently we allow the mbuf to stay around and use a private
16549ed6e97SBjoern A. Zeeb 	 * free function to allow secondary resources to be freed along.
16649ed6e97SBjoern A. Zeeb 	 */
16749ed6e97SBjoern A. Zeeb 	if (skb->m != NULL) {
16849ed6e97SBjoern A. Zeeb 		void *m;
16949ed6e97SBjoern A. Zeeb 
17049ed6e97SBjoern A. Zeeb 		m = skb->m;
17149ed6e97SBjoern A. Zeeb 		skb->m = NULL;
17249ed6e97SBjoern A. Zeeb 
17349ed6e97SBjoern A. Zeeb 		KASSERT(skb->m_free_func != NULL, ("%s: skb %p has m %p but no "
17449ed6e97SBjoern A. Zeeb 		    "m_free_func %p\n", __func__, skb, m, skb->m_free_func));
17549ed6e97SBjoern A. Zeeb 		skb->m_free_func(m);
17649ed6e97SBjoern A. Zeeb 	}
17749ed6e97SBjoern A. Zeeb 	KASSERT(skb->m == NULL,
17849ed6e97SBjoern A. Zeeb 	    ("%s: skb %p m %p != NULL\n", __func__, skb, skb->m));
17949ed6e97SBjoern A. Zeeb 
18049ed6e97SBjoern A. Zeeb 	shinfo = skb->shinfo;
1816baea331SBjoern A. Zeeb 	for (count = fragno = 0;
1826baea331SBjoern A. Zeeb 	    count < shinfo->nr_frags && fragno < nitems(shinfo->frags);
1836baea331SBjoern A. Zeeb 	    fragno++) {
18449ed6e97SBjoern A. Zeeb 
1856baea331SBjoern A. Zeeb 		if (shinfo->frags[fragno].page != NULL) {
1866baea331SBjoern A. Zeeb 			struct page *p;
1876baea331SBjoern A. Zeeb 
1886baea331SBjoern A. Zeeb 			p = shinfo->frags[fragno].page;
1896baea331SBjoern A. Zeeb 			shinfo->frags[fragno].size = 0;
1906baea331SBjoern A. Zeeb 			shinfo->frags[fragno].offset = 0;
1916baea331SBjoern A. Zeeb 			shinfo->frags[fragno].page = NULL;
1926baea331SBjoern A. Zeeb 			__free_page(p);
1936baea331SBjoern A. Zeeb 			count++;
1946baea331SBjoern A. Zeeb 		}
19549ed6e97SBjoern A. Zeeb 	}
19649ed6e97SBjoern A. Zeeb 
19749ed6e97SBjoern A. Zeeb 	free(skb, M_LKPISKB);
19849ed6e97SBjoern A. Zeeb }
1996baea331SBjoern A. Zeeb 
2006baea331SBjoern A. Zeeb #ifdef DDB
2016baea331SBjoern A. Zeeb DB_SHOW_COMMAND(skb, db_show_skb)
2026baea331SBjoern A. Zeeb {
2036baea331SBjoern A. Zeeb 	struct sk_buff *skb;
2046baea331SBjoern A. Zeeb 	int i;
2056baea331SBjoern A. Zeeb 
2066baea331SBjoern A. Zeeb 	if (!have_addr) {
2076baea331SBjoern A. Zeeb 		db_printf("usage: show skb <addr>\n");
2086baea331SBjoern A. Zeeb 			return;
2096baea331SBjoern A. Zeeb 	}
2106baea331SBjoern A. Zeeb 
2116baea331SBjoern A. Zeeb 	skb = (struct sk_buff *)addr;
2126baea331SBjoern A. Zeeb 
2136baea331SBjoern A. Zeeb 	db_printf("skb %p\n", skb);
2146baea331SBjoern A. Zeeb 	db_printf("\tnext %p prev %p\n", skb->next, skb->prev);
2156baea331SBjoern A. Zeeb 	db_printf("\tlist %d\n", skb->list);
2166baea331SBjoern A. Zeeb 	db_printf("\t_alloc_len %u len %u data_len %u truesize %u mac_len %u\n",
2176baea331SBjoern A. Zeeb 	    skb->_alloc_len, skb->len, skb->data_len, skb->truesize,
2186baea331SBjoern A. Zeeb 	    skb->mac_len);
2196baea331SBjoern A. Zeeb 	db_printf("\tcsum %#06x l3hdroff %u l4hdroff %u priority %u qmap %u\n",
2206baea331SBjoern A. Zeeb 	    skb->csum, skb->l3hdroff, skb->l4hdroff, skb->priority, skb->qmap);
2216baea331SBjoern A. Zeeb 	db_printf("\tpkt_type %d dev %p sk %p\n",
2226baea331SBjoern A. Zeeb 	    skb->pkt_type, skb->dev, skb->sk);
2236baea331SBjoern A. Zeeb 	db_printf("\tcsum_offset %d csum_start %d ip_summed %d protocol %d\n",
2246baea331SBjoern A. Zeeb 	    skb->csum_offset, skb->csum_start, skb->ip_summed, skb->protocol);
2256baea331SBjoern A. Zeeb 	db_printf("\thead %p data %p tail %p end %p\n",
2266baea331SBjoern A. Zeeb 	    skb->head, skb->data, skb->tail, skb->end);
2276baea331SBjoern A. Zeeb 	db_printf("\tshinfo %p m %p m_free_func %p\n",
2286baea331SBjoern A. Zeeb 	    skb->shinfo, skb->m, skb->m_free_func);
2296baea331SBjoern A. Zeeb 
2306baea331SBjoern A. Zeeb 	if (skb->shinfo != NULL) {
2316baea331SBjoern A. Zeeb 		struct skb_shared_info *shinfo;
2326baea331SBjoern A. Zeeb 
2336baea331SBjoern A. Zeeb 		shinfo = skb->shinfo;
2346baea331SBjoern A. Zeeb 		db_printf("\t\tgso_type %d gso_size %u nr_frags %u\n",
2356baea331SBjoern A. Zeeb 		    shinfo->gso_type, shinfo->gso_size, shinfo->nr_frags);
2366baea331SBjoern A. Zeeb 		for (i = 0; i < nitems(shinfo->frags); i++) {
2376baea331SBjoern A. Zeeb 			struct skb_frag *frag;
2386baea331SBjoern A. Zeeb 
2396baea331SBjoern A. Zeeb 			frag = &shinfo->frags[i];
2406baea331SBjoern A. Zeeb 			if (frag == NULL || frag->page == NULL)
2416baea331SBjoern A. Zeeb 				continue;
2426baea331SBjoern A. Zeeb 			db_printf("\t\t\tfrag %p fragno %d page %p %p "
2436baea331SBjoern A. Zeeb 			    "offset %ju size %zu\n",
2446baea331SBjoern A. Zeeb 			    frag, i, frag->page, linux_page_address(frag->page),
2456baea331SBjoern A. Zeeb 			    (uintmax_t)frag->offset, frag->size);
2466baea331SBjoern A. Zeeb 		}
2476baea331SBjoern A. Zeeb 	}
2486baea331SBjoern A. Zeeb 	db_printf("\tcb[] %p {", skb->cb);
2496baea331SBjoern A. Zeeb 	for (i = 0; i < nitems(skb->cb); i++) {
2506baea331SBjoern A. Zeeb 		db_printf("%#04x%s",
2516baea331SBjoern A. Zeeb 		    skb->cb[i], (i < (nitems(skb->cb)-1)) ? ", " : "");
2526baea331SBjoern A. Zeeb 	}
2536baea331SBjoern A. Zeeb 	db_printf("}\n");
2546baea331SBjoern A. Zeeb 
2556baea331SBjoern A. Zeeb 	db_printf("\t_spareu16_0 %#06x __scratch[0] %p\n",
2566baea331SBjoern A. Zeeb 	    skb->_spareu16_0, skb->__scratch);
2576baea331SBjoern A. Zeeb };
2586baea331SBjoern A. Zeeb #endif
259